diff options
| author | Linus Torvalds <torvalds@linux-foundation.org> | 2010-11-26 17:28:17 -0500 |
|---|---|---|
| committer | Linus Torvalds <torvalds@linux-foundation.org> | 2010-11-26 17:28:17 -0500 |
| commit | d2f30c73aba19be828c759edcd21140390cd06e4 (patch) | |
| tree | b9bad75b11e21680f8f9443f0143d62be23cae78 /kernel | |
| parent | 1b065fdff1c950d96e4c571abe873a9a8aaa6d51 (diff) | |
| parent | 02a9d03772aa1ff33a26180a2da0bfb191240eda (diff) | |
Merge branch 'perf-fixes-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/linux-2.6-tip
* 'perf-fixes-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/linux-2.6-tip:
perf symbols: Remove incorrect open-coded container_of()
perf record: Handle restrictive permissions in /proc/{kallsyms,modules}
x86/kprobes: Prevent kprobes to probe on save_args()
irq_work: Drop cmpxchg() result
perf: Fix owner-list vs exit
x86, hw_nmi: Move backtrace_mask declaration under ARCH_HAS_NMI_WATCHDOG
tracing: Fix recursive user stack trace
perf,hw_breakpoint: Initialize hardware api earlier
x86: Ignore trap bits on single step exceptions
tracing: Force arch_local_irq_* notrace for paravirt
tracing: Fix module use of trace_bprintk()
Diffstat (limited to 'kernel')
| -rw-r--r-- | kernel/hw_breakpoint.c | 3 | ||||
| -rw-r--r-- | kernel/irq_work.c | 4 | ||||
| -rw-r--r-- | kernel/module.c | 12 | ||||
| -rw-r--r-- | kernel/perf_event.c | 69 | ||||
| -rw-r--r-- | kernel/trace/trace.c | 19 |
5 files changed, 92 insertions, 15 deletions
diff --git a/kernel/hw_breakpoint.c b/kernel/hw_breakpoint.c index 2c9120f0afc..e5325825aeb 100644 --- a/kernel/hw_breakpoint.c +++ b/kernel/hw_breakpoint.c | |||
| @@ -620,7 +620,7 @@ static struct pmu perf_breakpoint = { | |||
| 620 | .read = hw_breakpoint_pmu_read, | 620 | .read = hw_breakpoint_pmu_read, |
| 621 | }; | 621 | }; |
| 622 | 622 | ||
| 623 | static int __init init_hw_breakpoint(void) | 623 | int __init init_hw_breakpoint(void) |
| 624 | { | 624 | { |
| 625 | unsigned int **task_bp_pinned; | 625 | unsigned int **task_bp_pinned; |
| 626 | int cpu, err_cpu; | 626 | int cpu, err_cpu; |
| @@ -655,6 +655,5 @@ static int __init init_hw_breakpoint(void) | |||
| 655 | 655 | ||
| 656 | return -ENOMEM; | 656 | return -ENOMEM; |
| 657 | } | 657 | } |
| 658 | core_initcall(init_hw_breakpoint); | ||
| 659 | 658 | ||
| 660 | 659 | ||
diff --git a/kernel/irq_work.c b/kernel/irq_work.c index f16763ff848..90f881904bb 100644 --- a/kernel/irq_work.c +++ b/kernel/irq_work.c | |||
| @@ -145,7 +145,9 @@ void irq_work_run(void) | |||
| 145 | * Clear the BUSY bit and return to the free state if | 145 | * Clear the BUSY bit and return to the free state if |
| 146 | * no-one else claimed it meanwhile. | 146 | * no-one else claimed it meanwhile. |
| 147 | */ | 147 | */ |
| 148 | cmpxchg(&entry->next, next_flags(NULL, IRQ_WORK_BUSY), NULL); | 148 | (void)cmpxchg(&entry->next, |
| 149 | next_flags(NULL, IRQ_WORK_BUSY), | ||
| 150 | NULL); | ||
| 149 | } | 151 | } |
| 150 | } | 152 | } |
| 151 | EXPORT_SYMBOL_GPL(irq_work_run); | 153 | EXPORT_SYMBOL_GPL(irq_work_run); |
diff --git a/kernel/module.c b/kernel/module.c index 437a74a7524..d190664f25f 100644 --- a/kernel/module.c +++ b/kernel/module.c | |||
| @@ -2326,6 +2326,18 @@ static void find_module_sections(struct module *mod, struct load_info *info) | |||
| 2326 | kmemleak_scan_area(mod->trace_events, sizeof(*mod->trace_events) * | 2326 | kmemleak_scan_area(mod->trace_events, sizeof(*mod->trace_events) * |
| 2327 | mod->num_trace_events, GFP_KERNEL); | 2327 | mod->num_trace_events, GFP_KERNEL); |
| 2328 | #endif | 2328 | #endif |
| 2329 | #ifdef CONFIG_TRACING | ||
| 2330 | mod->trace_bprintk_fmt_start = section_objs(info, "__trace_printk_fmt", | ||
| 2331 | sizeof(*mod->trace_bprintk_fmt_start), | ||
| 2332 | &mod->num_trace_bprintk_fmt); | ||
| 2333 | /* | ||
| 2334 | * This section contains pointers to allocated objects in the trace | ||
| 2335 | * code and not scanning it leads to false positives. | ||
| 2336 | */ | ||
| 2337 | kmemleak_scan_area(mod->trace_bprintk_fmt_start, | ||
| 2338 | sizeof(*mod->trace_bprintk_fmt_start) * | ||
| 2339 | mod->num_trace_bprintk_fmt, GFP_KERNEL); | ||
| 2340 | #endif | ||
| 2329 | #ifdef CONFIG_FTRACE_MCOUNT_RECORD | 2341 | #ifdef CONFIG_FTRACE_MCOUNT_RECORD |
| 2330 | /* sechdrs[0].sh_size is always zero */ | 2342 | /* sechdrs[0].sh_size is always zero */ |
| 2331 | mod->ftrace_callsites = section_objs(info, "__mcount_loc", | 2343 | mod->ftrace_callsites = section_objs(info, "__mcount_loc", |
diff --git a/kernel/perf_event.c b/kernel/perf_event.c index cb6c0d2af68..671f6c8c8a3 100644 --- a/kernel/perf_event.c +++ b/kernel/perf_event.c | |||
| @@ -31,6 +31,7 @@ | |||
| 31 | #include <linux/kernel_stat.h> | 31 | #include <linux/kernel_stat.h> |
| 32 | #include <linux/perf_event.h> | 32 | #include <linux/perf_event.h> |
| 33 | #include <linux/ftrace_event.h> | 33 | #include <linux/ftrace_event.h> |
| 34 | #include <linux/hw_breakpoint.h> | ||
| 34 | 35 | ||
| 35 | #include <asm/irq_regs.h> | 36 | #include <asm/irq_regs.h> |
| 36 | 37 | ||
| @@ -2234,11 +2235,6 @@ int perf_event_release_kernel(struct perf_event *event) | |||
| 2234 | raw_spin_unlock_irq(&ctx->lock); | 2235 | raw_spin_unlock_irq(&ctx->lock); |
| 2235 | mutex_unlock(&ctx->mutex); | 2236 | mutex_unlock(&ctx->mutex); |
| 2236 | 2237 | ||
| 2237 | mutex_lock(&event->owner->perf_event_mutex); | ||
| 2238 | list_del_init(&event->owner_entry); | ||
| 2239 | mutex_unlock(&event->owner->perf_event_mutex); | ||
| 2240 | put_task_struct(event->owner); | ||
| 2241 | |||
| 2242 | free_event(event); | 2238 | free_event(event); |
| 2243 | 2239 | ||
| 2244 | return 0; | 2240 | return 0; |
| @@ -2251,9 +2247,43 @@ EXPORT_SYMBOL_GPL(perf_event_release_kernel); | |||
| 2251 | static int perf_release(struct inode *inode, struct file *file) | 2247 | static int perf_release(struct inode *inode, struct file *file) |
| 2252 | { | 2248 | { |
| 2253 | struct perf_event *event = file->private_data; | 2249 | struct perf_event *event = file->private_data; |
| 2250 | struct task_struct *owner; | ||
| 2254 | 2251 | ||
| 2255 | file->private_data = NULL; | 2252 | file->private_data = NULL; |
| 2256 | 2253 | ||
| 2254 | rcu_read_lock(); | ||
| 2255 | owner = ACCESS_ONCE(event->owner); | ||
| 2256 | /* | ||
| 2257 | * Matches the smp_wmb() in perf_event_exit_task(). If we observe | ||
| 2258 | * !owner it means the list deletion is complete and we can indeed | ||
| 2259 | * free this event, otherwise we need to serialize on | ||
| 2260 | * owner->perf_event_mutex. | ||
| 2261 | */ | ||
| 2262 | smp_read_barrier_depends(); | ||
| 2263 | if (owner) { | ||
| 2264 | /* | ||
| 2265 | * Since delayed_put_task_struct() also drops the last | ||
| 2266 | * task reference we can safely take a new reference | ||
| 2267 | * while holding the rcu_read_lock(). | ||
| 2268 | */ | ||
| 2269 | get_task_struct(owner); | ||
| 2270 | } | ||
| 2271 | rcu_read_unlock(); | ||
| 2272 | |||
| 2273 | if (owner) { | ||
| 2274 | mutex_lock(&owner->perf_event_mutex); | ||
| 2275 | /* | ||
| 2276 | * We have to re-check the event->owner field, if it is cleared | ||
| 2277 | * we raced with perf_event_exit_task(), acquiring the mutex | ||
| 2278 | * ensured they're done, and we can proceed with freeing the | ||
| 2279 | * event. | ||
| 2280 | */ | ||
| 2281 | if (event->owner) | ||
| 2282 | list_del_init(&event->owner_entry); | ||
| 2283 | mutex_unlock(&owner->perf_event_mutex); | ||
| 2284 | put_task_struct(owner); | ||
| 2285 | } | ||
| 2286 | |||
| 2257 | return perf_event_release_kernel(event); | 2287 | return perf_event_release_kernel(event); |
| 2258 | } | 2288 | } |
| 2259 | 2289 | ||
| @@ -5677,7 +5707,7 @@ SYSCALL_DEFINE5(perf_event_open, | |||
| 5677 | mutex_unlock(&ctx->mutex); | 5707 | mutex_unlock(&ctx->mutex); |
| 5678 | 5708 | ||
| 5679 | event->owner = current; | 5709 | event->owner = current; |
| 5680 | get_task_struct(current); | 5710 | |
| 5681 | mutex_lock(¤t->perf_event_mutex); | 5711 | mutex_lock(¤t->perf_event_mutex); |
| 5682 | list_add_tail(&event->owner_entry, ¤t->perf_event_list); | 5712 | list_add_tail(&event->owner_entry, ¤t->perf_event_list); |
| 5683 | mutex_unlock(¤t->perf_event_mutex); | 5713 | mutex_unlock(¤t->perf_event_mutex); |
| @@ -5745,12 +5775,6 @@ perf_event_create_kernel_counter(struct perf_event_attr *attr, int cpu, | |||
| 5745 | ++ctx->generation; | 5775 | ++ctx->generation; |
| 5746 | mutex_unlock(&ctx->mutex); | 5776 | mutex_unlock(&ctx->mutex); |
| 5747 | 5777 | ||
| 5748 | event->owner = current; | ||
| 5749 | get_task_struct(current); | ||
| 5750 | mutex_lock(¤t->perf_event_mutex); | ||
| 5751 | list_add_tail(&event->owner_entry, ¤t->perf_event_list); | ||
| 5752 | mutex_unlock(¤t->perf_event_mutex); | ||
| 5753 | |||
| 5754 | return event; | 5778 | return event; |
| 5755 | 5779 | ||
| 5756 | err_free: | 5780 | err_free: |
| @@ -5901,8 +5925,24 @@ again: | |||
| 5901 | */ | 5925 | */ |
| 5902 | void perf_event_exit_task(struct task_struct *child) | 5926 | void perf_event_exit_task(struct task_struct *child) |
| 5903 | { | 5927 | { |
| 5928 | struct perf_event *event, *tmp; | ||
| 5904 | int ctxn; | 5929 | int ctxn; |
| 5905 | 5930 | ||
| 5931 | mutex_lock(&child->perf_event_mutex); | ||
| 5932 | list_for_each_entry_safe(event, tmp, &child->perf_event_list, | ||
| 5933 | owner_entry) { | ||
| 5934 | list_del_init(&event->owner_entry); | ||
| 5935 | |||
| 5936 | /* | ||
| 5937 | * Ensure the list deletion is visible before we clear | ||
| 5938 | * the owner, closes a race against perf_release() where | ||
| 5939 | * we need to serialize on the owner->perf_event_mutex. | ||
| 5940 | */ | ||
| 5941 | smp_wmb(); | ||
| 5942 | event->owner = NULL; | ||
| 5943 | } | ||
| 5944 | mutex_unlock(&child->perf_event_mutex); | ||
| 5945 | |||
| 5906 | for_each_task_context_nr(ctxn) | 5946 | for_each_task_context_nr(ctxn) |
| 5907 | perf_event_exit_task_context(child, ctxn); | 5947 | perf_event_exit_task_context(child, ctxn); |
| 5908 | } | 5948 | } |
| @@ -6321,6 +6361,8 @@ perf_cpu_notify(struct notifier_block *self, unsigned long action, void *hcpu) | |||
| 6321 | 6361 | ||
| 6322 | void __init perf_event_init(void) | 6362 | void __init perf_event_init(void) |
| 6323 | { | 6363 | { |
| 6364 | int ret; | ||
| 6365 | |||
| 6324 | perf_event_init_all_cpus(); | 6366 | perf_event_init_all_cpus(); |
| 6325 | init_srcu_struct(&pmus_srcu); | 6367 | init_srcu_struct(&pmus_srcu); |
| 6326 | perf_pmu_register(&perf_swevent); | 6368 | perf_pmu_register(&perf_swevent); |
| @@ -6328,4 +6370,7 @@ void __init perf_event_init(void) | |||
| 6328 | perf_pmu_register(&perf_task_clock); | 6370 | perf_pmu_register(&perf_task_clock); |
| 6329 | perf_tp_register(); | 6371 | perf_tp_register(); |
| 6330 | perf_cpu_notifier(perf_cpu_notify); | 6372 | perf_cpu_notifier(perf_cpu_notify); |
| 6373 | |||
| 6374 | ret = init_hw_breakpoint(); | ||
| 6375 | WARN(ret, "hw_breakpoint initialization failed with: %d", ret); | ||
| 6331 | } | 6376 | } |
diff --git a/kernel/trace/trace.c b/kernel/trace/trace.c index 04208415798..c380612273b 100644 --- a/kernel/trace/trace.c +++ b/kernel/trace/trace.c | |||
| @@ -1283,6 +1283,8 @@ void trace_dump_stack(void) | |||
| 1283 | __ftrace_trace_stack(global_trace.buffer, flags, 3, preempt_count()); | 1283 | __ftrace_trace_stack(global_trace.buffer, flags, 3, preempt_count()); |
| 1284 | } | 1284 | } |
| 1285 | 1285 | ||
| 1286 | static DEFINE_PER_CPU(int, user_stack_count); | ||
| 1287 | |||
| 1286 | void | 1288 | void |
| 1287 | ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc) | 1289 | ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc) |
| 1288 | { | 1290 | { |
| @@ -1301,6 +1303,18 @@ ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc) | |||
| 1301 | if (unlikely(in_nmi())) | 1303 | if (unlikely(in_nmi())) |
| 1302 | return; | 1304 | return; |
| 1303 | 1305 | ||
| 1306 | /* | ||
| 1307 | * prevent recursion, since the user stack tracing may | ||
| 1308 | * trigger other kernel events. | ||
| 1309 | */ | ||
| 1310 | preempt_disable(); | ||
| 1311 | if (__this_cpu_read(user_stack_count)) | ||
| 1312 | goto out; | ||
| 1313 | |||
| 1314 | __this_cpu_inc(user_stack_count); | ||
| 1315 | |||
| 1316 | |||
| 1317 | |||
| 1304 | event = trace_buffer_lock_reserve(buffer, TRACE_USER_STACK, | 1318 | event = trace_buffer_lock_reserve(buffer, TRACE_USER_STACK, |
| 1305 | sizeof(*entry), flags, pc); | 1319 | sizeof(*entry), flags, pc); |
| 1306 | if (!event) | 1320 | if (!event) |
| @@ -1318,6 +1332,11 @@ ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc) | |||
| 1318 | save_stack_trace_user(&trace); | 1332 | save_stack_trace_user(&trace); |
| 1319 | if (!filter_check_discard(call, entry, buffer, event)) | 1333 | if (!filter_check_discard(call, entry, buffer, event)) |
| 1320 | ring_buffer_unlock_commit(buffer, event); | 1334 | ring_buffer_unlock_commit(buffer, event); |
| 1335 | |||
| 1336 | __this_cpu_dec(user_stack_count); | ||
| 1337 | |||
| 1338 | out: | ||
| 1339 | preempt_enable(); | ||
| 1321 | } | 1340 | } |
| 1322 | 1341 | ||
| 1323 | #ifdef UNUSED | 1342 | #ifdef UNUSED |
