author    | Robert Richter <robert.richter@amd.com> | 2009-01-08 08:27:34 -0500
committer | Robert Richter <robert.richter@amd.com> | 2009-01-08 08:27:34 -0500
commit    | d2852b932f0bb5e89177aa27c7bcf07f4167e129 (patch)
tree      | 96d975ae155ba307acd07968939fff22afedddf7 /drivers
parent    | 4a6908a3a050aacc9c3a2f36b276b46c0629ad91 (diff)
parent    | 14f0ca8eaea42a5b5a69cfcb699665dd2618db5f (diff)
Merge branch 'oprofile/ring_buffer' into oprofile/oprofile-for-tip
Diffstat (limited to 'drivers')

-rw-r--r-- | drivers/oprofile/buffer_sync.c    | 229
-rw-r--r-- | drivers/oprofile/cpu_buffer.c     | 393
-rw-r--r-- | drivers/oprofile/cpu_buffer.h     |  72
-rw-r--r-- | drivers/oprofile/event_buffer.c   |   4
-rw-r--r-- | drivers/oprofile/oprof.c          |   4
-rw-r--r-- | drivers/oprofile/oprof.h          |   8
-rw-r--r-- | drivers/oprofile/oprofile_files.c |  24

7 files changed, 408 insertions(+), 326 deletions(-)
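The merge replaces oprofile's hand-rolled per-CPU sample arrays with two kernel ring buffers plus a small op_entry/op_sample accessor API, and turns the IBS-specific oprofile_add_ibs_sample() path into generic "samples with data" written through oprofile_write_reserve(), oprofile_add_data() and oprofile_write_commit(). A minimal producer-side sketch of that new interface follows; it assumes struct op_entry and the three functions are exported via <linux/oprofile.h> (not visible in this drivers-only diffstat), and MY_SAMPLE_CODE and my_model_log_sample() are purely illustrative:

```c
#include <linux/oprofile.h>
#include <linux/ptrace.h>

/* illustrative record type; real users define their own (e.g. IBS codes) */
#define MY_SAMPLE_CODE	42

/*
 * Sketch of the new "sample with data" producer path.  The core
 * reserves room for the code, the pc and `count' payload words and
 * accounts any overflow itself; the caller appends the payload and
 * commits the record.
 */
static void my_model_log_sample(struct pt_regs * const regs, unsigned long pc,
				unsigned long *payload, int count)
{
	struct op_entry entry;
	int i;

	oprofile_write_reserve(&entry, regs, pc, MY_SAMPLE_CODE, count);
	for (i = 0; i < count; i++)
		oprofile_add_data(&entry, payload[i]);
	oprofile_write_commit(&entry);
}
```

In this form the model-specific code (for example the AMD IBS driver in the merged branch) no longer needs to know the cpu buffer internals; it only reserves, fills and commits one record.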
diff --git a/drivers/oprofile/buffer_sync.c b/drivers/oprofile/buffer_sync.c
index b55cd23ffdef..ac014cb27915 100644
--- a/drivers/oprofile/buffer_sync.c
+++ b/drivers/oprofile/buffer_sync.c
@@ -1,11 +1,12 @@
1 | /** | 1 | /** |
2 | * @file buffer_sync.c | 2 | * @file buffer_sync.c |
3 | * | 3 | * |
4 | * @remark Copyright 2002 OProfile authors | 4 | * @remark Copyright 2002-2009 OProfile authors |
5 | * @remark Read the file COPYING | 5 | * @remark Read the file COPYING |
6 | * | 6 | * |
7 | * @author John Levon <levon@movementarian.org> | 7 | * @author John Levon <levon@movementarian.org> |
8 | * @author Barry Kasindorf | 8 | * @author Barry Kasindorf |
9 | * @author Robert Richter <robert.richter@amd.com> | ||
9 | * | 10 | * |
10 | * This is the core of the buffer management. Each | 11 | * This is the core of the buffer management. Each |
11 | * CPU buffer is processed and entered into the | 12 | * CPU buffer is processed and entered into the |
@@ -268,18 +269,6 @@ lookup_dcookie(struct mm_struct *mm, unsigned long addr, off_t *offset)
268 | return cookie; | 269 | return cookie; |
269 | } | 270 | } |
270 | 271 | ||
271 | static void increment_tail(struct oprofile_cpu_buffer *b) | ||
272 | { | ||
273 | unsigned long new_tail = b->tail_pos + 1; | ||
274 | |||
275 | rmb(); /* be sure fifo pointers are synchromized */ | ||
276 | |||
277 | if (new_tail < b->buffer_size) | ||
278 | b->tail_pos = new_tail; | ||
279 | else | ||
280 | b->tail_pos = 0; | ||
281 | } | ||
282 | |||
283 | static unsigned long last_cookie = INVALID_COOKIE; | 272 | static unsigned long last_cookie = INVALID_COOKIE; |
284 | 273 | ||
285 | static void add_cpu_switch(int i) | 274 | static void add_cpu_switch(int i) |
@@ -327,84 +316,73 @@ static void add_trace_begin(void)
327 | add_event_entry(TRACE_BEGIN_CODE); | 316 | add_event_entry(TRACE_BEGIN_CODE); |
328 | } | 317 | } |
329 | 318 | ||
330 | #ifdef CONFIG_OPROFILE_IBS | 319 | static void add_data(struct op_entry *entry, struct mm_struct *mm) |
331 | |||
332 | #define IBS_FETCH_CODE_SIZE 2 | ||
333 | #define IBS_OP_CODE_SIZE 5 | ||
334 | #define IBS_EIP(offset) \ | ||
335 | (((struct op_sample *)&cpu_buf->buffer[(offset)])->eip) | ||
336 | #define IBS_EVENT(offset) \ | ||
337 | (((struct op_sample *)&cpu_buf->buffer[(offset)])->event) | ||
338 | |||
339 | /* | ||
340 | * Add IBS fetch and op entries to event buffer | ||
341 | */ | ||
342 | static void add_ibs_begin(struct oprofile_cpu_buffer *cpu_buf, int code, | ||
343 | struct mm_struct *mm) | ||
344 | { | 320 | { |
345 | unsigned long rip; | 321 | unsigned long code, pc, val; |
346 | int i, count; | 322 | unsigned long cookie; |
347 | unsigned long ibs_cookie = 0; | ||
348 | off_t offset; | 323 | off_t offset; |
349 | 324 | ||
350 | increment_tail(cpu_buf); /* move to RIP entry */ | 325 | if (!op_cpu_buffer_get_data(entry, &code)) |
351 | 326 | return; | |
352 | rip = IBS_EIP(cpu_buf->tail_pos); | 327 | if (!op_cpu_buffer_get_data(entry, &pc)) |
353 | 328 | return; | |
354 | #ifdef __LP64__ | 329 | if (!op_cpu_buffer_get_size(entry)) |
355 | rip += IBS_EVENT(cpu_buf->tail_pos) << 32; | 330 | return; |
356 | #endif | ||
357 | 331 | ||
358 | if (mm) { | 332 | if (mm) { |
359 | ibs_cookie = lookup_dcookie(mm, rip, &offset); | 333 | cookie = lookup_dcookie(mm, pc, &offset); |
360 | 334 | ||
361 | if (ibs_cookie == NO_COOKIE) | 335 | if (cookie == NO_COOKIE) |
362 | offset = rip; | 336 | offset = pc; |
363 | if (ibs_cookie == INVALID_COOKIE) { | 337 | if (cookie == INVALID_COOKIE) { |
364 | atomic_inc(&oprofile_stats.sample_lost_no_mapping); | 338 | atomic_inc(&oprofile_stats.sample_lost_no_mapping); |
365 | offset = rip; | 339 | offset = pc; |
366 | } | 340 | } |
367 | if (ibs_cookie != last_cookie) { | 341 | if (cookie != last_cookie) { |
368 | add_cookie_switch(ibs_cookie); | 342 | add_cookie_switch(cookie); |
369 | last_cookie = ibs_cookie; | 343 | last_cookie = cookie; |
370 | } | 344 | } |
371 | } else | 345 | } else |
372 | offset = rip; | 346 | offset = pc; |
373 | 347 | ||
374 | add_event_entry(ESCAPE_CODE); | 348 | add_event_entry(ESCAPE_CODE); |
375 | add_event_entry(code); | 349 | add_event_entry(code); |
376 | add_event_entry(offset); /* Offset from Dcookie */ | 350 | add_event_entry(offset); /* Offset from Dcookie */ |
377 | 351 | ||
378 | /* we send the Dcookie offset, but send the raw Linear Add also*/ | 352 | while (op_cpu_buffer_get_data(entry, &val)) |
379 | add_event_entry(IBS_EIP(cpu_buf->tail_pos)); | 353 | add_event_entry(val); |
380 | add_event_entry(IBS_EVENT(cpu_buf->tail_pos)); | ||
381 | |||
382 | if (code == IBS_FETCH_CODE) | ||
383 | count = IBS_FETCH_CODE_SIZE; /*IBS FETCH is 2 int64s*/ | ||
384 | else | ||
385 | count = IBS_OP_CODE_SIZE; /*IBS OP is 5 int64s*/ | ||
386 | |||
387 | for (i = 0; i < count; i++) { | ||
388 | increment_tail(cpu_buf); | ||
389 | add_event_entry(IBS_EIP(cpu_buf->tail_pos)); | ||
390 | add_event_entry(IBS_EVENT(cpu_buf->tail_pos)); | ||
391 | } | ||
392 | } | 354 | } |
393 | 355 | ||
394 | #endif | 356 | static inline void add_sample_entry(unsigned long offset, unsigned long event) |
395 | |||
396 | static void add_sample_entry(unsigned long offset, unsigned long event) | ||
397 | { | 357 | { |
398 | add_event_entry(offset); | 358 | add_event_entry(offset); |
399 | add_event_entry(event); | 359 | add_event_entry(event); |
400 | } | 360 | } |
401 | 361 | ||
402 | 362 | ||
403 | static int add_us_sample(struct mm_struct *mm, struct op_sample *s) | 363 | /* |
364 | * Add a sample to the global event buffer. If possible the | ||
365 | * sample is converted into a persistent dentry/offset pair | ||
366 | * for later lookup from userspace. Return 0 on failure. | ||
367 | */ | ||
368 | static int | ||
369 | add_sample(struct mm_struct *mm, struct op_sample *s, int in_kernel) | ||
404 | { | 370 | { |
405 | unsigned long cookie; | 371 | unsigned long cookie; |
406 | off_t offset; | 372 | off_t offset; |
407 | 373 | ||
374 | if (in_kernel) { | ||
375 | add_sample_entry(s->eip, s->event); | ||
376 | return 1; | ||
377 | } | ||
378 | |||
379 | /* add userspace sample */ | ||
380 | |||
381 | if (!mm) { | ||
382 | atomic_inc(&oprofile_stats.sample_lost_no_mm); | ||
383 | return 0; | ||
384 | } | ||
385 | |||
408 | cookie = lookup_dcookie(mm, s->eip, &offset); | 386 | cookie = lookup_dcookie(mm, s->eip, &offset); |
409 | 387 | ||
410 | if (cookie == INVALID_COOKIE) { | 388 | if (cookie == INVALID_COOKIE) { |
@@ -423,25 +401,6 @@ static int add_us_sample(struct mm_struct *mm, struct op_sample *s)
423 | } | 401 | } |
424 | 402 | ||
425 | 403 | ||
426 | /* Add a sample to the global event buffer. If possible the | ||
427 | * sample is converted into a persistent dentry/offset pair | ||
428 | * for later lookup from userspace. | ||
429 | */ | ||
430 | static int | ||
431 | add_sample(struct mm_struct *mm, struct op_sample *s, int in_kernel) | ||
432 | { | ||
433 | if (in_kernel) { | ||
434 | add_sample_entry(s->eip, s->event); | ||
435 | return 1; | ||
436 | } else if (mm) { | ||
437 | return add_us_sample(mm, s); | ||
438 | } else { | ||
439 | atomic_inc(&oprofile_stats.sample_lost_no_mm); | ||
440 | } | ||
441 | return 0; | ||
442 | } | ||
443 | |||
444 | |||
445 | static void release_mm(struct mm_struct *mm) | 404 | static void release_mm(struct mm_struct *mm) |
446 | { | 405 | { |
447 | if (!mm) | 406 | if (!mm) |
@@ -466,33 +425,6 @@ static inline int is_code(unsigned long val)
466 | } | 425 | } |
467 | 426 | ||
468 | 427 | ||
469 | /* "acquire" as many cpu buffer slots as we can */ | ||
470 | static unsigned long get_slots(struct oprofile_cpu_buffer *b) | ||
471 | { | ||
472 | unsigned long head = b->head_pos; | ||
473 | unsigned long tail = b->tail_pos; | ||
474 | |||
475 | /* | ||
476 | * Subtle. This resets the persistent last_task | ||
477 | * and in_kernel values used for switching notes. | ||
478 | * BUT, there is a small window between reading | ||
479 | * head_pos, and this call, that means samples | ||
480 | * can appear at the new head position, but not | ||
481 | * be prefixed with the notes for switching | ||
482 | * kernel mode or a task switch. This small hole | ||
483 | * can lead to mis-attribution or samples where | ||
484 | * we don't know if it's in the kernel or not, | ||
485 | * at the start of an event buffer. | ||
486 | */ | ||
487 | cpu_buffer_reset(b); | ||
488 | |||
489 | if (head >= tail) | ||
490 | return head - tail; | ||
491 | |||
492 | return head + (b->buffer_size - tail); | ||
493 | } | ||
494 | |||
495 | |||
496 | /* Move tasks along towards death. Any tasks on dead_tasks | 428 | /* Move tasks along towards death. Any tasks on dead_tasks |
497 | * will definitely have no remaining references in any | 429 | * will definitely have no remaining references in any |
498 | * CPU buffers at this point, because we use two lists, | 430 | * CPU buffers at this point, because we use two lists, |
@@ -559,71 +491,72 @@ typedef enum {
559 | */ | 491 | */ |
560 | void sync_buffer(int cpu) | 492 | void sync_buffer(int cpu) |
561 | { | 493 | { |
562 | struct oprofile_cpu_buffer *cpu_buf = &per_cpu(cpu_buffer, cpu); | ||
563 | struct mm_struct *mm = NULL; | 494 | struct mm_struct *mm = NULL; |
495 | struct mm_struct *oldmm; | ||
496 | unsigned long val; | ||
564 | struct task_struct *new; | 497 | struct task_struct *new; |
565 | unsigned long cookie = 0; | 498 | unsigned long cookie = 0; |
566 | int in_kernel = 1; | 499 | int in_kernel = 1; |
567 | sync_buffer_state state = sb_buffer_start; | 500 | sync_buffer_state state = sb_buffer_start; |
568 | #ifndef CONFIG_OPROFILE_IBS | ||
569 | unsigned int i; | 501 | unsigned int i; |
570 | unsigned long available; | 502 | unsigned long available; |
571 | #endif | 503 | unsigned long flags; |
504 | struct op_entry entry; | ||
505 | struct op_sample *sample; | ||
572 | 506 | ||
573 | mutex_lock(&buffer_mutex); | 507 | mutex_lock(&buffer_mutex); |
574 | 508 | ||
575 | add_cpu_switch(cpu); | 509 | add_cpu_switch(cpu); |
576 | 510 | ||
577 | /* Remember, only we can modify tail_pos */ | 511 | op_cpu_buffer_reset(cpu); |
578 | 512 | available = op_cpu_buffer_entries(cpu); | |
579 | #ifndef CONFIG_OPROFILE_IBS | ||
580 | available = get_slots(cpu_buf); | ||
581 | 513 | ||
582 | for (i = 0; i < available; ++i) { | 514 | for (i = 0; i < available; ++i) { |
583 | #else | 515 | sample = op_cpu_buffer_read_entry(&entry, cpu); |
584 | while (get_slots(cpu_buf)) { | 516 | if (!sample) |
585 | #endif | 517 | break; |
586 | struct op_sample *s = &cpu_buf->buffer[cpu_buf->tail_pos]; | ||
587 | 518 | ||
588 | if (is_code(s->eip)) { | 519 | if (is_code(sample->eip)) { |
589 | if (s->event <= CPU_IS_KERNEL) { | 520 | flags = sample->event; |
521 | if (flags & TRACE_BEGIN) { | ||
522 | state = sb_bt_start; | ||
523 | add_trace_begin(); | ||
524 | } | ||
525 | if (flags & KERNEL_CTX_SWITCH) { | ||
590 | /* kernel/userspace switch */ | 526 | /* kernel/userspace switch */ |
591 | in_kernel = s->event; | 527 | in_kernel = flags & IS_KERNEL; |
592 | if (state == sb_buffer_start) | 528 | if (state == sb_buffer_start) |
593 | state = sb_sample_start; | 529 | state = sb_sample_start; |
594 | add_kernel_ctx_switch(s->event); | 530 | add_kernel_ctx_switch(flags & IS_KERNEL); |
595 | } else if (s->event == CPU_TRACE_BEGIN) { | 531 | } |
596 | state = sb_bt_start; | 532 | if (flags & USER_CTX_SWITCH |
597 | add_trace_begin(); | 533 | && op_cpu_buffer_get_data(&entry, &val)) { |
598 | #ifdef CONFIG_OPROFILE_IBS | ||
599 | } else if (s->event == IBS_FETCH_BEGIN) { | ||
600 | state = sb_bt_start; | ||
601 | add_ibs_begin(cpu_buf, IBS_FETCH_CODE, mm); | ||
602 | } else if (s->event == IBS_OP_BEGIN) { | ||
603 | state = sb_bt_start; | ||
604 | add_ibs_begin(cpu_buf, IBS_OP_CODE, mm); | ||
605 | #endif | ||
606 | } else { | ||
607 | struct mm_struct *oldmm = mm; | ||
608 | |||
609 | /* userspace context switch */ | 534 | /* userspace context switch */ |
610 | new = (struct task_struct *)s->event; | 535 | new = (struct task_struct *)val; |
611 | 536 | oldmm = mm; | |
612 | release_mm(oldmm); | 537 | release_mm(oldmm); |
613 | mm = take_tasks_mm(new); | 538 | mm = take_tasks_mm(new); |
614 | if (mm != oldmm) | 539 | if (mm != oldmm) |
615 | cookie = get_exec_dcookie(mm); | 540 | cookie = get_exec_dcookie(mm); |
616 | add_user_ctx_switch(new, cookie); | 541 | add_user_ctx_switch(new, cookie); |
617 | } | 542 | } |
618 | } else if (state >= sb_bt_start && | 543 | if (op_cpu_buffer_get_size(&entry)) |
619 | !add_sample(mm, s, in_kernel)) { | 544 | add_data(&entry, mm); |
620 | if (state == sb_bt_start) { | 545 | continue; |
621 | state = sb_bt_ignore; | ||
622 | atomic_inc(&oprofile_stats.bt_lost_no_mapping); | ||
623 | } | ||
624 | } | 546 | } |
625 | 547 | ||
626 | increment_tail(cpu_buf); | 548 | if (state < sb_bt_start) |
549 | /* ignore sample */ | ||
550 | continue; | ||
551 | |||
552 | if (add_sample(mm, sample, in_kernel)) | ||
553 | continue; | ||
554 | |||
555 | /* ignore backtraces if failed to add a sample */ | ||
556 | if (state == sb_bt_start) { | ||
557 | state = sb_bt_ignore; | ||
558 | atomic_inc(&oprofile_stats.bt_lost_no_mapping); | ||
559 | } | ||
627 | } | 560 | } |
628 | release_mm(mm); | 561 | release_mm(mm); |
629 | 562 | ||
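On the read side, sync_buffer() above no longer walks head/tail indices; it drains one op_sample at a time and pulls any per-entry payload out with op_cpu_buffer_get_data(). A stripped-down sketch of that consumption pattern (without the state machine), using pr_debug() as a stand-in for real processing:

```c
#include <linux/kernel.h>
#include "cpu_buffer.h"
#include "event_buffer.h"	/* ESCAPE_CODE */

/* Minimal drain loop following the pattern of sync_buffer() above. */
static void drain_cpu_buffer(int cpu)
{
	struct op_entry entry;
	struct op_sample *sample;
	unsigned long val;
	unsigned long i, available;

	op_cpu_buffer_reset(cpu);
	available = op_cpu_buffer_entries(cpu);

	for (i = 0; i < available; i++) {
		sample = op_cpu_buffer_read_entry(&entry, cpu);
		if (!sample)
			break;

		if (sample->eip == ESCAPE_CODE) {
			/* header entry: flags in ->event, payload in data[] */
			while (op_cpu_buffer_get_data(&entry, &val))
				pr_debug("flags %#lx, data %#lx\n",
					 sample->event, val);
			continue;
		}

		/* ordinary pc/event sample */
		pr_debug("pc %#lx, event %#lx\n", sample->eip, sample->event);
	}
}
```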
diff --git a/drivers/oprofile/cpu_buffer.c b/drivers/oprofile/cpu_buffer.c
index 01d38e78cde1..2e03b6d796d3 100644
--- a/drivers/oprofile/cpu_buffer.c
+++ b/drivers/oprofile/cpu_buffer.c
@@ -1,11 +1,12 @@
1 | /** | 1 | /** |
2 | * @file cpu_buffer.c | 2 | * @file cpu_buffer.c |
3 | * | 3 | * |
4 | * @remark Copyright 2002 OProfile authors | 4 | * @remark Copyright 2002-2009 OProfile authors |
5 | * @remark Read the file COPYING | 5 | * @remark Read the file COPYING |
6 | * | 6 | * |
7 | * @author John Levon <levon@movementarian.org> | 7 | * @author John Levon <levon@movementarian.org> |
8 | * @author Barry Kasindorf <barry.kasindorf@amd.com> | 8 | * @author Barry Kasindorf <barry.kasindorf@amd.com> |
9 | * @author Robert Richter <robert.richter@amd.com> | ||
9 | * | 10 | * |
10 | * Each CPU has a local buffer that stores PC value/event | 11 | * Each CPU has a local buffer that stores PC value/event |
11 | * pairs. We also log context switches when we notice them. | 12 | * pairs. We also log context switches when we notice them. |
@@ -28,6 +29,25 @@
28 | #include "buffer_sync.h" | 29 | #include "buffer_sync.h" |
29 | #include "oprof.h" | 30 | #include "oprof.h" |
30 | 31 | ||
32 | #define OP_BUFFER_FLAGS 0 | ||
33 | |||
34 | /* | ||
35 | * Read and write access is using spin locking. Thus, writing to the | ||
36 | * buffer by NMI handler (x86) could occur also during critical | ||
37 | * sections when reading the buffer. To avoid this, there are 2 | ||
38 | * buffers for independent read and write access. Read access is in | ||
39 | * process context only, write access only in the NMI handler. If the | ||
40 | * read buffer runs empty, both buffers are swapped atomically. There | ||
41 | * is potentially a small window during swapping where the buffers are | ||
42 | * disabled and samples could be lost. | ||
43 | * | ||
44 | * Using 2 buffers is a little bit overhead, but the solution is clear | ||
45 | * and does not require changes in the ring buffer implementation. It | ||
46 | * can be changed to a single buffer solution when the ring buffer | ||
47 | * access is implemented as non-locking atomic code. | ||
48 | */ | ||
49 | static struct ring_buffer *op_ring_buffer_read; | ||
50 | static struct ring_buffer *op_ring_buffer_write; | ||
31 | DEFINE_PER_CPU(struct oprofile_cpu_buffer, cpu_buffer); | 51 | DEFINE_PER_CPU(struct oprofile_cpu_buffer, cpu_buffer); |
32 | 52 | ||
33 | static void wq_sync_buffer(struct work_struct *work); | 53 | static void wq_sync_buffer(struct work_struct *work); |
@@ -35,19 +55,9 @@ static void wq_sync_buffer(struct work_struct *work);
35 | #define DEFAULT_TIMER_EXPIRE (HZ / 10) | 55 | #define DEFAULT_TIMER_EXPIRE (HZ / 10) |
36 | static int work_enabled; | 56 | static int work_enabled; |
37 | 57 | ||
38 | void free_cpu_buffers(void) | ||
39 | { | ||
40 | int i; | ||
41 | |||
42 | for_each_possible_cpu(i) { | ||
43 | vfree(per_cpu(cpu_buffer, i).buffer); | ||
44 | per_cpu(cpu_buffer, i).buffer = NULL; | ||
45 | } | ||
46 | } | ||
47 | |||
48 | unsigned long oprofile_get_cpu_buffer_size(void) | 58 | unsigned long oprofile_get_cpu_buffer_size(void) |
49 | { | 59 | { |
50 | return fs_cpu_buffer_size; | 60 | return oprofile_cpu_buffer_size; |
51 | } | 61 | } |
52 | 62 | ||
53 | void oprofile_cpu_buffer_inc_smpl_lost(void) | 63 | void oprofile_cpu_buffer_inc_smpl_lost(void) |
@@ -58,26 +68,36 @@ void oprofile_cpu_buffer_inc_smpl_lost(void)
58 | cpu_buf->sample_lost_overflow++; | 68 | cpu_buf->sample_lost_overflow++; |
59 | } | 69 | } |
60 | 70 | ||
71 | void free_cpu_buffers(void) | ||
72 | { | ||
73 | if (op_ring_buffer_read) | ||
74 | ring_buffer_free(op_ring_buffer_read); | ||
75 | op_ring_buffer_read = NULL; | ||
76 | if (op_ring_buffer_write) | ||
77 | ring_buffer_free(op_ring_buffer_write); | ||
78 | op_ring_buffer_write = NULL; | ||
79 | } | ||
80 | |||
61 | int alloc_cpu_buffers(void) | 81 | int alloc_cpu_buffers(void) |
62 | { | 82 | { |
63 | int i; | 83 | int i; |
64 | 84 | ||
65 | unsigned long buffer_size = fs_cpu_buffer_size; | 85 | unsigned long buffer_size = oprofile_cpu_buffer_size; |
86 | |||
87 | op_ring_buffer_read = ring_buffer_alloc(buffer_size, OP_BUFFER_FLAGS); | ||
88 | if (!op_ring_buffer_read) | ||
89 | goto fail; | ||
90 | op_ring_buffer_write = ring_buffer_alloc(buffer_size, OP_BUFFER_FLAGS); | ||
91 | if (!op_ring_buffer_write) | ||
92 | goto fail; | ||
66 | 93 | ||
67 | for_each_possible_cpu(i) { | 94 | for_each_possible_cpu(i) { |
68 | struct oprofile_cpu_buffer *b = &per_cpu(cpu_buffer, i); | 95 | struct oprofile_cpu_buffer *b = &per_cpu(cpu_buffer, i); |
69 | 96 | ||
70 | b->buffer = vmalloc_node(sizeof(struct op_sample) * buffer_size, | ||
71 | cpu_to_node(i)); | ||
72 | if (!b->buffer) | ||
73 | goto fail; | ||
74 | |||
75 | b->last_task = NULL; | 97 | b->last_task = NULL; |
76 | b->last_is_kernel = -1; | 98 | b->last_is_kernel = -1; |
77 | b->tracing = 0; | 99 | b->tracing = 0; |
78 | b->buffer_size = buffer_size; | 100 | b->buffer_size = buffer_size; |
79 | b->tail_pos = 0; | ||
80 | b->head_pos = 0; | ||
81 | b->sample_received = 0; | 101 | b->sample_received = 0; |
82 | b->sample_lost_overflow = 0; | 102 | b->sample_lost_overflow = 0; |
83 | b->backtrace_aborted = 0; | 103 | b->backtrace_aborted = 0; |
@@ -124,73 +144,156 @@ void end_cpu_work(void)
124 | flush_scheduled_work(); | 144 | flush_scheduled_work(); |
125 | } | 145 | } |
126 | 146 | ||
127 | /* Resets the cpu buffer to a sane state. */ | 147 | /* |
128 | void cpu_buffer_reset(struct oprofile_cpu_buffer *cpu_buf) | 148 | * This function prepares the cpu buffer to write a sample. |
149 | * | ||
150 | * Struct op_entry is used during operations on the ring buffer while | ||
151 | * struct op_sample contains the data that is stored in the ring | ||
152 | * buffer. Struct entry can be uninitialized. The function reserves a | ||
153 | * data array that is specified by size. Use | ||
154 | * op_cpu_buffer_write_commit() after preparing the sample. In case of | ||
155 | * errors a null pointer is returned, otherwise the pointer to the | ||
156 | * sample. | ||
157 | * | ||
158 | */ | ||
159 | struct op_sample | ||
160 | *op_cpu_buffer_write_reserve(struct op_entry *entry, unsigned long size) | ||
129 | { | 161 | { |
130 | /* reset these to invalid values; the next sample | 162 | entry->event = ring_buffer_lock_reserve |
131 | * collected will populate the buffer with proper | 163 | (op_ring_buffer_write, sizeof(struct op_sample) + |
132 | * values to initialize the buffer | 164 | size * sizeof(entry->sample->data[0]), &entry->irq_flags); |
133 | */ | 165 | if (entry->event) |
134 | cpu_buf->last_is_kernel = -1; | 166 | entry->sample = ring_buffer_event_data(entry->event); |
135 | cpu_buf->last_task = NULL; | 167 | else |
168 | entry->sample = NULL; | ||
169 | |||
170 | if (!entry->sample) | ||
171 | return NULL; | ||
172 | |||
173 | entry->size = size; | ||
174 | entry->data = entry->sample->data; | ||
175 | |||
176 | return entry->sample; | ||
136 | } | 177 | } |
137 | 178 | ||
138 | /* compute number of available slots in cpu_buffer queue */ | 179 | int op_cpu_buffer_write_commit(struct op_entry *entry) |
139 | static unsigned long nr_available_slots(struct oprofile_cpu_buffer const *b) | ||
140 | { | 180 | { |
141 | unsigned long head = b->head_pos; | 181 | return ring_buffer_unlock_commit(op_ring_buffer_write, entry->event, |
142 | unsigned long tail = b->tail_pos; | 182 | entry->irq_flags); |
183 | } | ||
143 | 184 | ||
144 | if (tail > head) | 185 | struct op_sample *op_cpu_buffer_read_entry(struct op_entry *entry, int cpu) |
145 | return (tail - head) - 1; | 186 | { |
187 | struct ring_buffer_event *e; | ||
188 | e = ring_buffer_consume(op_ring_buffer_read, cpu, NULL); | ||
189 | if (e) | ||
190 | goto event; | ||
191 | if (ring_buffer_swap_cpu(op_ring_buffer_read, | ||
192 | op_ring_buffer_write, | ||
193 | cpu)) | ||
194 | return NULL; | ||
195 | e = ring_buffer_consume(op_ring_buffer_read, cpu, NULL); | ||
196 | if (e) | ||
197 | goto event; | ||
198 | return NULL; | ||
199 | |||
200 | event: | ||
201 | entry->event = e; | ||
202 | entry->sample = ring_buffer_event_data(e); | ||
203 | entry->size = (ring_buffer_event_length(e) - sizeof(struct op_sample)) | ||
204 | / sizeof(entry->sample->data[0]); | ||
205 | entry->data = entry->sample->data; | ||
206 | return entry->sample; | ||
207 | } | ||
146 | 208 | ||
147 | return tail + (b->buffer_size - head) - 1; | 209 | unsigned long op_cpu_buffer_entries(int cpu) |
210 | { | ||
211 | return ring_buffer_entries_cpu(op_ring_buffer_read, cpu) | ||
212 | + ring_buffer_entries_cpu(op_ring_buffer_write, cpu); | ||
148 | } | 213 | } |
149 | 214 | ||
150 | static void increment_head(struct oprofile_cpu_buffer *b) | 215 | static int |
216 | op_add_code(struct oprofile_cpu_buffer *cpu_buf, unsigned long backtrace, | ||
217 | int is_kernel, struct task_struct *task) | ||
151 | { | 218 | { |
152 | unsigned long new_head = b->head_pos + 1; | 219 | struct op_entry entry; |
220 | struct op_sample *sample; | ||
221 | unsigned long flags; | ||
222 | int size; | ||
223 | |||
224 | flags = 0; | ||
153 | 225 | ||
154 | /* Ensure anything written to the slot before we | 226 | if (backtrace) |
155 | * increment is visible */ | 227 | flags |= TRACE_BEGIN; |
156 | wmb(); | 228 | |
229 | /* notice a switch from user->kernel or vice versa */ | ||
230 | is_kernel = !!is_kernel; | ||
231 | if (cpu_buf->last_is_kernel != is_kernel) { | ||
232 | cpu_buf->last_is_kernel = is_kernel; | ||
233 | flags |= KERNEL_CTX_SWITCH; | ||
234 | if (is_kernel) | ||
235 | flags |= IS_KERNEL; | ||
236 | } | ||
237 | |||
238 | /* notice a task switch */ | ||
239 | if (cpu_buf->last_task != task) { | ||
240 | cpu_buf->last_task = task; | ||
241 | flags |= USER_CTX_SWITCH; | ||
242 | } | ||
243 | |||
244 | if (!flags) | ||
245 | /* nothing to do */ | ||
246 | return 0; | ||
157 | 247 | ||
158 | if (new_head < b->buffer_size) | 248 | if (flags & USER_CTX_SWITCH) |
159 | b->head_pos = new_head; | 249 | size = 1; |
160 | else | 250 | else |
161 | b->head_pos = 0; | 251 | size = 0; |
162 | } | ||
163 | 252 | ||
164 | static inline void | 253 | sample = op_cpu_buffer_write_reserve(&entry, size); |
165 | add_sample(struct oprofile_cpu_buffer *cpu_buf, | 254 | if (!sample) |
166 | unsigned long pc, unsigned long event) | 255 | return -ENOMEM; |
167 | { | 256 | |
168 | struct op_sample *entry = &cpu_buf->buffer[cpu_buf->head_pos]; | 257 | sample->eip = ESCAPE_CODE; |
169 | entry->eip = pc; | 258 | sample->event = flags; |
170 | entry->event = event; | 259 | |
171 | increment_head(cpu_buf); | 260 | if (size) |
261 | op_cpu_buffer_add_data(&entry, (unsigned long)task); | ||
262 | |||
263 | op_cpu_buffer_write_commit(&entry); | ||
264 | |||
265 | return 0; | ||
172 | } | 266 | } |
173 | 267 | ||
174 | static inline void | 268 | static inline int |
175 | add_code(struct oprofile_cpu_buffer *buffer, unsigned long value) | 269 | op_add_sample(struct oprofile_cpu_buffer *cpu_buf, |
270 | unsigned long pc, unsigned long event) | ||
176 | { | 271 | { |
177 | add_sample(buffer, ESCAPE_CODE, value); | 272 | struct op_entry entry; |
273 | struct op_sample *sample; | ||
274 | |||
275 | sample = op_cpu_buffer_write_reserve(&entry, 0); | ||
276 | if (!sample) | ||
277 | return -ENOMEM; | ||
278 | |||
279 | sample->eip = pc; | ||
280 | sample->event = event; | ||
281 | |||
282 | return op_cpu_buffer_write_commit(&entry); | ||
178 | } | 283 | } |
179 | 284 | ||
180 | /* This must be safe from any context. It's safe writing here | 285 | /* |
181 | * because of the head/tail separation of the writer and reader | 286 | * This must be safe from any context. |
182 | * of the CPU buffer. | ||
183 | * | 287 | * |
184 | * is_kernel is needed because on some architectures you cannot | 288 | * is_kernel is needed because on some architectures you cannot |
185 | * tell if you are in kernel or user space simply by looking at | 289 | * tell if you are in kernel or user space simply by looking at |
186 | * pc. We tag this in the buffer by generating kernel enter/exit | 290 | * pc. We tag this in the buffer by generating kernel enter/exit |
187 | * events whenever is_kernel changes | 291 | * events whenever is_kernel changes |
188 | */ | 292 | */ |
189 | static int log_sample(struct oprofile_cpu_buffer *cpu_buf, unsigned long pc, | 293 | static int |
190 | int is_kernel, unsigned long event) | 294 | log_sample(struct oprofile_cpu_buffer *cpu_buf, unsigned long pc, |
295 | unsigned long backtrace, int is_kernel, unsigned long event) | ||
191 | { | 296 | { |
192 | struct task_struct *task; | ||
193 | |||
194 | cpu_buf->sample_received++; | 297 | cpu_buf->sample_received++; |
195 | 298 | ||
196 | if (pc == ESCAPE_CODE) { | 299 | if (pc == ESCAPE_CODE) { |
@@ -198,131 +301,115 @@ static int log_sample(struct oprofile_cpu_buffer *cpu_buf, unsigned long pc,
198 | return 0; | 301 | return 0; |
199 | } | 302 | } |
200 | 303 | ||
201 | if (nr_available_slots(cpu_buf) < 3) { | 304 | if (op_add_code(cpu_buf, backtrace, is_kernel, current)) |
202 | cpu_buf->sample_lost_overflow++; | 305 | goto fail; |
203 | return 0; | ||
204 | } | ||
205 | |||
206 | is_kernel = !!is_kernel; | ||
207 | 306 | ||
208 | task = current; | 307 | if (op_add_sample(cpu_buf, pc, event)) |
308 | goto fail; | ||
209 | 309 | ||
210 | /* notice a switch from user->kernel or vice versa */ | ||
211 | if (cpu_buf->last_is_kernel != is_kernel) { | ||
212 | cpu_buf->last_is_kernel = is_kernel; | ||
213 | add_code(cpu_buf, is_kernel); | ||
214 | } | ||
215 | |||
216 | /* notice a task switch */ | ||
217 | if (cpu_buf->last_task != task) { | ||
218 | cpu_buf->last_task = task; | ||
219 | add_code(cpu_buf, (unsigned long)task); | ||
220 | } | ||
221 | |||
222 | add_sample(cpu_buf, pc, event); | ||
223 | return 1; | 310 | return 1; |
311 | |||
312 | fail: | ||
313 | cpu_buf->sample_lost_overflow++; | ||
314 | return 0; | ||
224 | } | 315 | } |
225 | 316 | ||
226 | static int oprofile_begin_trace(struct oprofile_cpu_buffer *cpu_buf) | 317 | static inline void oprofile_begin_trace(struct oprofile_cpu_buffer *cpu_buf) |
227 | { | 318 | { |
228 | if (nr_available_slots(cpu_buf) < 4) { | ||
229 | cpu_buf->sample_lost_overflow++; | ||
230 | return 0; | ||
231 | } | ||
232 | |||
233 | add_code(cpu_buf, CPU_TRACE_BEGIN); | ||
234 | cpu_buf->tracing = 1; | 319 | cpu_buf->tracing = 1; |
235 | return 1; | ||
236 | } | 320 | } |
237 | 321 | ||
238 | static void oprofile_end_trace(struct oprofile_cpu_buffer *cpu_buf) | 322 | static inline void oprofile_end_trace(struct oprofile_cpu_buffer *cpu_buf) |
239 | { | 323 | { |
240 | cpu_buf->tracing = 0; | 324 | cpu_buf->tracing = 0; |
241 | } | 325 | } |
242 | 326 | ||
243 | void oprofile_add_ext_sample(unsigned long pc, struct pt_regs * const regs, | 327 | static inline void |
244 | unsigned long event, int is_kernel) | 328 | __oprofile_add_ext_sample(unsigned long pc, struct pt_regs * const regs, |
329 | unsigned long event, int is_kernel) | ||
245 | { | 330 | { |
246 | struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer); | 331 | struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer); |
332 | unsigned long backtrace = oprofile_backtrace_depth; | ||
247 | 333 | ||
248 | if (!backtrace_depth) { | 334 | /* |
249 | log_sample(cpu_buf, pc, is_kernel, event); | 335 | * if log_sample() fail we can't backtrace since we lost the |
336 | * source of this event | ||
337 | */ | ||
338 | if (!log_sample(cpu_buf, pc, backtrace, is_kernel, event)) | ||
339 | /* failed */ | ||
250 | return; | 340 | return; |
251 | } | ||
252 | 341 | ||
253 | if (!oprofile_begin_trace(cpu_buf)) | 342 | if (!backtrace) |
254 | return; | 343 | return; |
255 | 344 | ||
256 | /* if log_sample() fail we can't backtrace since we lost the source | 345 | oprofile_begin_trace(cpu_buf); |
257 | * of this event */ | 346 | oprofile_ops.backtrace(regs, backtrace); |
258 | if (log_sample(cpu_buf, pc, is_kernel, event)) | ||
259 | oprofile_ops.backtrace(regs, backtrace_depth); | ||
260 | oprofile_end_trace(cpu_buf); | 347 | oprofile_end_trace(cpu_buf); |
261 | } | 348 | } |
262 | 349 | ||
350 | void oprofile_add_ext_sample(unsigned long pc, struct pt_regs * const regs, | ||
351 | unsigned long event, int is_kernel) | ||
352 | { | ||
353 | __oprofile_add_ext_sample(pc, regs, event, is_kernel); | ||
354 | } | ||
355 | |||
263 | void oprofile_add_sample(struct pt_regs * const regs, unsigned long event) | 356 | void oprofile_add_sample(struct pt_regs * const regs, unsigned long event) |
264 | { | 357 | { |
265 | int is_kernel = !user_mode(regs); | 358 | int is_kernel = !user_mode(regs); |
266 | unsigned long pc = profile_pc(regs); | 359 | unsigned long pc = profile_pc(regs); |
267 | 360 | ||
268 | oprofile_add_ext_sample(pc, regs, event, is_kernel); | 361 | __oprofile_add_ext_sample(pc, regs, event, is_kernel); |
269 | } | 362 | } |
270 | 363 | ||
271 | #ifdef CONFIG_OPROFILE_IBS | 364 | /* |
272 | 365 | * Add samples with data to the ring buffer. | |
273 | #define MAX_IBS_SAMPLE_SIZE 14 | 366 | * |
274 | 367 | * Use oprofile_add_data(&entry, val) to add data and | |
275 | void oprofile_add_ibs_sample(struct pt_regs *const regs, | 368 | * oprofile_write_commit(&entry) to commit the sample. |
276 | unsigned int *const ibs_sample, int ibs_code) | 369 | */ |
370 | void | ||
371 | oprofile_write_reserve(struct op_entry *entry, struct pt_regs * const regs, | ||
372 | unsigned long pc, int code, int size) | ||
277 | { | 373 | { |
374 | struct op_sample *sample; | ||
278 | int is_kernel = !user_mode(regs); | 375 | int is_kernel = !user_mode(regs); |
279 | struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer); | 376 | struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer); |
280 | struct task_struct *task; | ||
281 | 377 | ||
282 | cpu_buf->sample_received++; | 378 | cpu_buf->sample_received++; |
283 | 379 | ||
284 | if (nr_available_slots(cpu_buf) < MAX_IBS_SAMPLE_SIZE) { | 380 | /* no backtraces for samples with data */ |
285 | /* we can't backtrace since we lost the source of this event */ | 381 | if (op_add_code(cpu_buf, 0, is_kernel, current)) |
286 | cpu_buf->sample_lost_overflow++; | 382 | goto fail; |
287 | return; | ||
288 | } | ||
289 | 383 | ||
290 | /* notice a switch from user->kernel or vice versa */ | 384 | sample = op_cpu_buffer_write_reserve(entry, size + 2); |
291 | if (cpu_buf->last_is_kernel != is_kernel) { | 385 | if (!sample) |
292 | cpu_buf->last_is_kernel = is_kernel; | 386 | goto fail; |
293 | add_code(cpu_buf, is_kernel); | 387 | sample->eip = ESCAPE_CODE; |
294 | } | 388 | sample->event = 0; /* no flags */ |
295 | 389 | ||
296 | /* notice a task switch */ | 390 | op_cpu_buffer_add_data(entry, code); |
297 | if (!is_kernel) { | 391 | op_cpu_buffer_add_data(entry, pc); |
298 | task = current; | ||
299 | if (cpu_buf->last_task != task) { | ||
300 | cpu_buf->last_task = task; | ||
301 | add_code(cpu_buf, (unsigned long)task); | ||
302 | } | ||
303 | } | ||
304 | 392 | ||
305 | add_code(cpu_buf, ibs_code); | 393 | return; |
306 | add_sample(cpu_buf, ibs_sample[0], ibs_sample[1]); | ||
307 | add_sample(cpu_buf, ibs_sample[2], ibs_sample[3]); | ||
308 | add_sample(cpu_buf, ibs_sample[4], ibs_sample[5]); | ||
309 | 394 | ||
310 | if (ibs_code == IBS_OP_BEGIN) { | 395 | fail: |
311 | add_sample(cpu_buf, ibs_sample[6], ibs_sample[7]); | 396 | cpu_buf->sample_lost_overflow++; |
312 | add_sample(cpu_buf, ibs_sample[8], ibs_sample[9]); | 397 | } |
313 | add_sample(cpu_buf, ibs_sample[10], ibs_sample[11]); | ||
314 | } | ||
315 | 398 | ||
316 | if (backtrace_depth) | 399 | int oprofile_add_data(struct op_entry *entry, unsigned long val) |
317 | oprofile_ops.backtrace(regs, backtrace_depth); | 400 | { |
401 | return op_cpu_buffer_add_data(entry, val); | ||
318 | } | 402 | } |
319 | 403 | ||
320 | #endif | 404 | int oprofile_write_commit(struct op_entry *entry) |
405 | { | ||
406 | return op_cpu_buffer_write_commit(entry); | ||
407 | } | ||
321 | 408 | ||
322 | void oprofile_add_pc(unsigned long pc, int is_kernel, unsigned long event) | 409 | void oprofile_add_pc(unsigned long pc, int is_kernel, unsigned long event) |
323 | { | 410 | { |
324 | struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer); | 411 | struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer); |
325 | log_sample(cpu_buf, pc, is_kernel, event); | 412 | log_sample(cpu_buf, pc, 0, is_kernel, event); |
326 | } | 413 | } |
327 | 414 | ||
328 | void oprofile_add_trace(unsigned long pc) | 415 | void oprofile_add_trace(unsigned long pc) |
@@ -332,21 +419,21 @@ void oprofile_add_trace(unsigned long pc)
332 | if (!cpu_buf->tracing) | 419 | if (!cpu_buf->tracing) |
333 | return; | 420 | return; |
334 | 421 | ||
335 | if (nr_available_slots(cpu_buf) < 1) { | 422 | /* |
336 | cpu_buf->tracing = 0; | 423 | * broken frame can give an eip with the same value as an |
337 | cpu_buf->sample_lost_overflow++; | 424 | * escape code, abort the trace if we get it |
338 | return; | 425 | */ |
339 | } | 426 | if (pc == ESCAPE_CODE) |
427 | goto fail; | ||
340 | 428 | ||
341 | /* broken frame can give an eip with the same value as an escape code, | 429 | if (op_add_sample(cpu_buf, pc, 0)) |
342 | * abort the trace if we get it */ | 430 | goto fail; |
343 | if (pc == ESCAPE_CODE) { | ||
344 | cpu_buf->tracing = 0; | ||
345 | cpu_buf->backtrace_aborted++; | ||
346 | return; | ||
347 | } | ||
348 | 431 | ||
349 | add_sample(cpu_buf, pc, 0); | 432 | return; |
433 | fail: | ||
434 | cpu_buf->tracing = 0; | ||
435 | cpu_buf->backtrace_aborted++; | ||
436 | return; | ||
350 | } | 437 | } |
351 | 438 | ||
352 | /* | 439 | /* |
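To make the flag encoding in op_add_code() concrete, here is what a single header record looks like when the profiled CPU moves from task A in user space to task B in kernel space (a worked example derived from the code above, not an additional API):

```c
/*
 * Header record emitted by op_add_code() for a user->kernel transition
 * combined with a task switch:
 *
 *	sample->eip	= ESCAPE_CODE
 *	sample->event	= KERNEL_CTX_SWITCH | IS_KERNEL | USER_CTX_SWITCH
 *	sample->data[0]	= (unsigned long)taskB	  (reserved with size 1)
 *
 * sync_buffer() decodes it accordingly: KERNEL_CTX_SWITCH updates
 * in_kernel from the IS_KERNEL bit, and USER_CTX_SWITCH retrieves the
 * task pointer again via op_cpu_buffer_get_data().
 */
```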
diff --git a/drivers/oprofile/cpu_buffer.h b/drivers/oprofile/cpu_buffer.h
index d3cc26264db5..63f81c44846a 100644
--- a/drivers/oprofile/cpu_buffer.h
+++ b/drivers/oprofile/cpu_buffer.h
@@ -1,10 +1,11 @@
1 | /** | 1 | /** |
2 | * @file cpu_buffer.h | 2 | * @file cpu_buffer.h |
3 | * | 3 | * |
4 | * @remark Copyright 2002 OProfile authors | 4 | * @remark Copyright 2002-2009 OProfile authors |
5 | * @remark Read the file COPYING | 5 | * @remark Read the file COPYING |
6 | * | 6 | * |
7 | * @author John Levon <levon@movementarian.org> | 7 | * @author John Levon <levon@movementarian.org> |
8 | * @author Robert Richter <robert.richter@amd.com> | ||
8 | */ | 9 | */ |
9 | 10 | ||
10 | #ifndef OPROFILE_CPU_BUFFER_H | 11 | #ifndef OPROFILE_CPU_BUFFER_H |
@@ -15,6 +16,7 @@
15 | #include <linux/workqueue.h> | 16 | #include <linux/workqueue.h> |
16 | #include <linux/cache.h> | 17 | #include <linux/cache.h> |
17 | #include <linux/sched.h> | 18 | #include <linux/sched.h> |
19 | #include <linux/ring_buffer.h> | ||
18 | 20 | ||
19 | struct task_struct; | 21 | struct task_struct; |
20 | 22 | ||
@@ -30,16 +32,16 @@ void end_cpu_work(void);
30 | struct op_sample { | 32 | struct op_sample { |
31 | unsigned long eip; | 33 | unsigned long eip; |
32 | unsigned long event; | 34 | unsigned long event; |
35 | unsigned long data[0]; | ||
33 | }; | 36 | }; |
34 | 37 | ||
38 | struct op_entry; | ||
39 | |||
35 | struct oprofile_cpu_buffer { | 40 | struct oprofile_cpu_buffer { |
36 | volatile unsigned long head_pos; | ||
37 | volatile unsigned long tail_pos; | ||
38 | unsigned long buffer_size; | 41 | unsigned long buffer_size; |
39 | struct task_struct *last_task; | 42 | struct task_struct *last_task; |
40 | int last_is_kernel; | 43 | int last_is_kernel; |
41 | int tracing; | 44 | int tracing; |
42 | struct op_sample *buffer; | ||
43 | unsigned long sample_received; | 45 | unsigned long sample_received; |
44 | unsigned long sample_lost_overflow; | 46 | unsigned long sample_lost_overflow; |
45 | unsigned long backtrace_aborted; | 47 | unsigned long backtrace_aborted; |
@@ -50,12 +52,62 @@ struct oprofile_cpu_buffer {
50 | 52 | ||
51 | DECLARE_PER_CPU(struct oprofile_cpu_buffer, cpu_buffer); | 53 | DECLARE_PER_CPU(struct oprofile_cpu_buffer, cpu_buffer); |
52 | 54 | ||
53 | void cpu_buffer_reset(struct oprofile_cpu_buffer *cpu_buf); | 55 | /* |
56 | * Resets the cpu buffer to a sane state. | ||
57 | * | ||
58 | * reset these to invalid values; the next sample collected will | ||
59 | * populate the buffer with proper values to initialize the buffer | ||
60 | */ | ||
61 | static inline void op_cpu_buffer_reset(int cpu) | ||
62 | { | ||
63 | struct oprofile_cpu_buffer *cpu_buf = &per_cpu(cpu_buffer, cpu); | ||
64 | |||
65 | cpu_buf->last_is_kernel = -1; | ||
66 | cpu_buf->last_task = NULL; | ||
67 | } | ||
68 | |||
69 | struct op_sample | ||
70 | *op_cpu_buffer_write_reserve(struct op_entry *entry, unsigned long size); | ||
71 | int op_cpu_buffer_write_commit(struct op_entry *entry); | ||
72 | struct op_sample *op_cpu_buffer_read_entry(struct op_entry *entry, int cpu); | ||
73 | unsigned long op_cpu_buffer_entries(int cpu); | ||
74 | |||
75 | /* returns the remaining free size of data in the entry */ | ||
76 | static inline | ||
77 | int op_cpu_buffer_add_data(struct op_entry *entry, unsigned long val) | ||
78 | { | ||
79 | if (!entry->size) | ||
80 | return 0; | ||
81 | *entry->data = val; | ||
82 | entry->size--; | ||
83 | entry->data++; | ||
84 | return entry->size; | ||
85 | } | ||
86 | |||
87 | /* returns the size of data in the entry */ | ||
88 | static inline | ||
89 | int op_cpu_buffer_get_size(struct op_entry *entry) | ||
90 | { | ||
91 | return entry->size; | ||
92 | } | ||
93 | |||
94 | /* returns 0 if empty or the size of data including the current value */ | ||
95 | static inline | ||
96 | int op_cpu_buffer_get_data(struct op_entry *entry, unsigned long *val) | ||
97 | { | ||
98 | int size = entry->size; | ||
99 | if (!size) | ||
100 | return 0; | ||
101 | *val = *entry->data; | ||
102 | entry->size--; | ||
103 | entry->data++; | ||
104 | return size; | ||
105 | } | ||
54 | 106 | ||
55 | /* transient events for the CPU buffer -> event buffer */ | 107 | /* extra data flags */ |
56 | #define CPU_IS_KERNEL 1 | 108 | #define KERNEL_CTX_SWITCH (1UL << 0) |
57 | #define CPU_TRACE_BEGIN 2 | 109 | #define IS_KERNEL (1UL << 1) |
58 | #define IBS_FETCH_BEGIN 3 | 110 | #define TRACE_BEGIN (1UL << 2) |
59 | #define IBS_OP_BEGIN 4 | 111 | #define USER_CTX_SWITCH (1UL << 3) |
60 | 112 | ||
61 | #endif /* OPROFILE_CPU_BUFFER_H */ | 113 | #endif /* OPROFILE_CPU_BUFFER_H */ |
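One detail of the accessors above that is easy to misread: op_cpu_buffer_add_data() returns the free space left after the write, while op_cpu_buffer_get_data() returns the size including the value just read, so 0 consistently means "full" on the write side and "empty" on the read side. A small sketch under the assumption that the entry is reserved with room for exactly two data words:

```c
#include <linux/errno.h>
#include "cpu_buffer.h"
#include "event_buffer.h"	/* ESCAPE_CODE */

/* Sketch: write one header entry carrying exactly two payload words. */
static int write_two_words(unsigned long a, unsigned long b)
{
	struct op_entry entry;
	struct op_sample *sample;

	sample = op_cpu_buffer_write_reserve(&entry, 2);
	if (!sample)
		return -ENOMEM;

	sample->eip = ESCAPE_CODE;	/* mark as header, not a pc sample */
	sample->event = 0;		/* no flags */
	op_cpu_buffer_add_data(&entry, a);	/* returns 1: one slot left */
	op_cpu_buffer_add_data(&entry, b);	/* returns 0: entry is full */

	return op_cpu_buffer_write_commit(&entry);
}
```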
diff --git a/drivers/oprofile/event_buffer.c b/drivers/oprofile/event_buffer.c
index 191a3202cecc..2b7ae366ceb1 100644
--- a/drivers/oprofile/event_buffer.c
+++ b/drivers/oprofile/event_buffer.c
@@ -73,8 +73,8 @@ int alloc_event_buffer(void)
73 | unsigned long flags; | 73 | unsigned long flags; |
74 | 74 | ||
75 | spin_lock_irqsave(&oprofilefs_lock, flags); | 75 | spin_lock_irqsave(&oprofilefs_lock, flags); |
76 | buffer_size = fs_buffer_size; | 76 | buffer_size = oprofile_buffer_size; |
77 | buffer_watershed = fs_buffer_watershed; | 77 | buffer_watershed = oprofile_buffer_watershed; |
78 | spin_unlock_irqrestore(&oprofilefs_lock, flags); | 78 | spin_unlock_irqrestore(&oprofilefs_lock, flags); |
79 | 79 | ||
80 | if (buffer_watershed >= buffer_size) | 80 | if (buffer_watershed >= buffer_size) |
diff --git a/drivers/oprofile/oprof.c b/drivers/oprofile/oprof.c
index cd375907f26f..3cffce90f82a 100644
--- a/drivers/oprofile/oprof.c
+++ b/drivers/oprofile/oprof.c
@@ -23,7 +23,7 @@
23 | struct oprofile_operations oprofile_ops; | 23 | struct oprofile_operations oprofile_ops; |
24 | 24 | ||
25 | unsigned long oprofile_started; | 25 | unsigned long oprofile_started; |
26 | unsigned long backtrace_depth; | 26 | unsigned long oprofile_backtrace_depth; |
27 | static unsigned long is_setup; | 27 | static unsigned long is_setup; |
28 | static DEFINE_MUTEX(start_mutex); | 28 | static DEFINE_MUTEX(start_mutex); |
29 | 29 | ||
@@ -172,7 +172,7 @@ int oprofile_set_backtrace(unsigned long val)
172 | goto out; | 172 | goto out; |
173 | } | 173 | } |
174 | 174 | ||
175 | backtrace_depth = val; | 175 | oprofile_backtrace_depth = val; |
176 | 176 | ||
177 | out: | 177 | out: |
178 | mutex_unlock(&start_mutex); | 178 | mutex_unlock(&start_mutex); |
diff --git a/drivers/oprofile/oprof.h b/drivers/oprofile/oprof.h
index 5df0c21a608f..c288d3c24b50 100644
--- a/drivers/oprofile/oprof.h
+++ b/drivers/oprofile/oprof.h
@@ -21,12 +21,12 @@ void oprofile_stop(void);
21 | 21 | ||
22 | struct oprofile_operations; | 22 | struct oprofile_operations; |
23 | 23 | ||
24 | extern unsigned long fs_buffer_size; | 24 | extern unsigned long oprofile_buffer_size; |
25 | extern unsigned long fs_cpu_buffer_size; | 25 | extern unsigned long oprofile_cpu_buffer_size; |
26 | extern unsigned long fs_buffer_watershed; | 26 | extern unsigned long oprofile_buffer_watershed; |
27 | extern struct oprofile_operations oprofile_ops; | 27 | extern struct oprofile_operations oprofile_ops; |
28 | extern unsigned long oprofile_started; | 28 | extern unsigned long oprofile_started; |
29 | extern unsigned long backtrace_depth; | 29 | extern unsigned long oprofile_backtrace_depth; |
30 | 30 | ||
31 | struct super_block; | 31 | struct super_block; |
32 | struct dentry; | 32 | struct dentry; |
diff --git a/drivers/oprofile/oprofile_files.c b/drivers/oprofile/oprofile_files.c
index cc106d503ace..5d36ffc30dd5 100644
--- a/drivers/oprofile/oprofile_files.c
+++ b/drivers/oprofile/oprofile_files.c
@@ -14,13 +14,18 @@
14 | #include "oprofile_stats.h" | 14 | #include "oprofile_stats.h" |
15 | #include "oprof.h" | 15 | #include "oprof.h" |
16 | 16 | ||
17 | unsigned long fs_buffer_size = 131072; | 17 | #define BUFFER_SIZE_DEFAULT 131072 |
18 | unsigned long fs_cpu_buffer_size = 8192; | 18 | #define CPU_BUFFER_SIZE_DEFAULT 8192 |
19 | unsigned long fs_buffer_watershed = 32768; /* FIXME: tune */ | 19 | #define BUFFER_WATERSHED_DEFAULT 32768 /* FIXME: tune */ |
20 | |||
21 | unsigned long oprofile_buffer_size; | ||
22 | unsigned long oprofile_cpu_buffer_size; | ||
23 | unsigned long oprofile_buffer_watershed; | ||
20 | 24 | ||
21 | static ssize_t depth_read(struct file *file, char __user *buf, size_t count, loff_t *offset) | 25 | static ssize_t depth_read(struct file *file, char __user *buf, size_t count, loff_t *offset) |
22 | { | 26 | { |
23 | return oprofilefs_ulong_to_user(backtrace_depth, buf, count, offset); | 27 | return oprofilefs_ulong_to_user(oprofile_backtrace_depth, buf, count, |
28 | offset); | ||
24 | } | 29 | } |
25 | 30 | ||
26 | 31 | ||
@@ -120,12 +125,17 @@ static const struct file_operations dump_fops = {
120 | 125 | ||
121 | void oprofile_create_files(struct super_block *sb, struct dentry *root) | 126 | void oprofile_create_files(struct super_block *sb, struct dentry *root) |
122 | { | 127 | { |
128 | /* reinitialize default values */ | ||
129 | oprofile_buffer_size = BUFFER_SIZE_DEFAULT; | ||
130 | oprofile_cpu_buffer_size = CPU_BUFFER_SIZE_DEFAULT; | ||
131 | oprofile_buffer_watershed = BUFFER_WATERSHED_DEFAULT; | ||
132 | |||
123 | oprofilefs_create_file(sb, root, "enable", &enable_fops); | 133 | oprofilefs_create_file(sb, root, "enable", &enable_fops); |
124 | oprofilefs_create_file_perm(sb, root, "dump", &dump_fops, 0666); | 134 | oprofilefs_create_file_perm(sb, root, "dump", &dump_fops, 0666); |
125 | oprofilefs_create_file(sb, root, "buffer", &event_buffer_fops); | 135 | oprofilefs_create_file(sb, root, "buffer", &event_buffer_fops); |
126 | oprofilefs_create_ulong(sb, root, "buffer_size", &fs_buffer_size); | 136 | oprofilefs_create_ulong(sb, root, "buffer_size", &oprofile_buffer_size); |
127 | oprofilefs_create_ulong(sb, root, "buffer_watershed", &fs_buffer_watershed); | 137 | oprofilefs_create_ulong(sb, root, "buffer_watershed", &oprofile_buffer_watershed); |
128 | oprofilefs_create_ulong(sb, root, "cpu_buffer_size", &fs_cpu_buffer_size); | 138 | oprofilefs_create_ulong(sb, root, "cpu_buffer_size", &oprofile_cpu_buffer_size); |
129 | oprofilefs_create_file(sb, root, "cpu_type", &cpu_type_fops); | 139 | oprofilefs_create_file(sb, root, "cpu_type", &cpu_type_fops); |
130 | oprofilefs_create_file(sb, root, "backtrace_depth", &depth_fops); | 140 | oprofilefs_create_file(sb, root, "backtrace_depth", &depth_fops); |
131 | oprofilefs_create_file(sb, root, "pointer_size", &pointer_size_fops); | 141 | oprofilefs_create_file(sb, root, "pointer_size", &pointer_size_fops); |