-rw-r--r--  drivers/oprofile/buffer_sync.c | 65
-rw-r--r--  drivers/oprofile/cpu_buffer.c  | 63
-rw-r--r--  drivers/oprofile/cpu_buffer.h  | 71
3 files changed, 114 insertions(+), 85 deletions(-)
diff --git a/drivers/oprofile/buffer_sync.c b/drivers/oprofile/buffer_sync.c
index 944a5832d9e4..737bd9484822 100644
--- a/drivers/oprofile/buffer_sync.c
+++ b/drivers/oprofile/buffer_sync.c
@@ -268,18 +268,6 @@ lookup_dcookie(struct mm_struct *mm, unsigned long addr, off_t *offset)
 	return cookie;
 }
 
-static void increment_tail(struct oprofile_cpu_buffer *b)
-{
-	unsigned long new_tail = b->tail_pos + 1;
-
-	rmb();	/* be sure fifo pointers are synchronized */
-
-	if (new_tail < b->buffer_size)
-		b->tail_pos = new_tail;
-	else
-		b->tail_pos = 0;
-}
-
 static unsigned long last_cookie = INVALID_COOKIE;
 
 static void add_cpu_switch(int i)
@@ -331,26 +319,25 @@ static void add_trace_begin(void)
 
 #define IBS_FETCH_CODE_SIZE	2
 #define IBS_OP_CODE_SIZE	5
-#define IBS_EIP(cpu_buf) ((cpu_buffer_read_entry(cpu_buf))->eip)
-#define IBS_EVENT(cpu_buf) ((cpu_buffer_read_entry(cpu_buf))->event)
 
 /*
  * Add IBS fetch and op entries to event buffer
  */
-static void add_ibs_begin(struct oprofile_cpu_buffer *cpu_buf, int code,
-	struct mm_struct *mm)
+static void add_ibs_begin(int cpu, int code, struct mm_struct *mm)
 {
 	unsigned long rip;
 	int i, count;
 	unsigned long ibs_cookie = 0;
 	off_t offset;
+	struct op_sample *sample;
 
-	increment_tail(cpu_buf);	/* move to RIP entry */
-
-	rip = IBS_EIP(cpu_buf);
+	sample = cpu_buffer_read_entry(cpu);
+	if (!sample)
+		goto Error;
+	rip = sample->eip;
 
 #ifdef __LP64__
-	rip += IBS_EVENT(cpu_buf) << 32;
+	rip += sample->event << 32;
 #endif
 
 	if (mm) {
@@ -374,8 +361,8 @@ static void add_ibs_begin(struct oprofile_cpu_buffer *cpu_buf, int code,
 		add_event_entry(offset);	/* Offset from Dcookie */
 
 	/* we send the Dcookie offset, but send the raw Linear Add also*/
-	add_event_entry(IBS_EIP(cpu_buf));
-	add_event_entry(IBS_EVENT(cpu_buf));
+	add_event_entry(sample->eip);
+	add_event_entry(sample->event);
 
 	if (code == IBS_FETCH_CODE)
 		count = IBS_FETCH_CODE_SIZE;	/*IBS FETCH is 2 int64s*/
@@ -383,10 +370,17 @@ static void add_ibs_begin(struct oprofile_cpu_buffer *cpu_buf, int code,
 		count = IBS_OP_CODE_SIZE;	/*IBS OP is 5 int64s*/
 
 	for (i = 0; i < count; i++) {
-		increment_tail(cpu_buf);
-		add_event_entry(IBS_EIP(cpu_buf));
-		add_event_entry(IBS_EVENT(cpu_buf));
+		sample = cpu_buffer_read_entry(cpu);
+		if (!sample)
+			goto Error;
+		add_event_entry(sample->eip);
+		add_event_entry(sample->event);
 	}
+
+	return;
+
+Error:
+	return;
 }
 
 #endif
@@ -530,33 +524,26 @@ typedef enum {
  */
 void sync_buffer(int cpu)
 {
-	struct oprofile_cpu_buffer *cpu_buf = &per_cpu(cpu_buffer, cpu);
 	struct mm_struct *mm = NULL;
 	struct mm_struct *oldmm;
 	struct task_struct *new;
 	unsigned long cookie = 0;
 	int in_kernel = 1;
 	sync_buffer_state state = sb_buffer_start;
-#ifndef CONFIG_OPROFILE_IBS
 	unsigned int i;
 	unsigned long available;
-#endif
 
 	mutex_lock(&buffer_mutex);
 
 	add_cpu_switch(cpu);
 
-	/* Remember, only we can modify tail_pos */
-
 	cpu_buffer_reset(cpu);
-#ifndef CONFIG_OPROFILE_IBS
-	available = cpu_buffer_entries(cpu_buf);
+	available = cpu_buffer_entries(cpu);
 
 	for (i = 0; i < available; ++i) {
-#else
-	while (cpu_buffer_entries(cpu_buf)) {
-#endif
-		struct op_sample *s = cpu_buffer_read_entry(cpu_buf);
+		struct op_sample *s = cpu_buffer_read_entry(cpu);
+		if (!s)
+			break;
 
 		if (is_code(s->eip)) {
 			switch (s->event) {
@@ -575,11 +562,11 @@ void sync_buffer(int cpu)
 #ifdef CONFIG_OPROFILE_IBS
 			case IBS_FETCH_BEGIN:
 				state = sb_bt_start;
-				add_ibs_begin(cpu_buf, IBS_FETCH_CODE, mm);
+				add_ibs_begin(cpu, IBS_FETCH_CODE, mm);
 				break;
 			case IBS_OP_BEGIN:
 				state = sb_bt_start;
-				add_ibs_begin(cpu_buf, IBS_OP_CODE, mm);
+				add_ibs_begin(cpu, IBS_OP_CODE, mm);
 				break;
 #endif
 			default:
@@ -600,8 +587,6 @@ void sync_buffer(int cpu)
 				atomic_inc(&oprofile_stats.bt_lost_no_mapping);
 			}
 		}
-
-		increment_tail(cpu_buf);
 	}
 	release_mm(mm);
 
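The key behavioural change on the sync side is that reads no longer touch a tail pointer directly: every sample is pulled through cpu_buffer_read_entry(), which can return NULL once the per-CPU buffers are drained, so both sync_buffer() and add_ibs_begin() have to treat NULL as "stop reading" rather than as a hard error. A minimal sketch of that consumer pattern follows; process_sample() is a hypothetical placeholder for the is_code()/add_sample() dispatch that the real sync_buffer() performs, not a function in this patch.

#include "cpu_buffer.h"	/* cpu_buffer_entries(), cpu_buffer_read_entry() */

/* Illustrative only: drain one CPU's samples the way sync_buffer() now does. */
static void drain_cpu_samples(int cpu)
{
	unsigned long available = cpu_buffer_entries(cpu);
	unsigned long i;

	for (i = 0; i < available; i++) {
		struct op_sample *s = cpu_buffer_read_entry(cpu);

		if (!s)			/* both ring buffers ran dry early */
			break;
		process_sample(s);	/* hypothetical: dispatch to the event buffer */
	}
}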
diff --git a/drivers/oprofile/cpu_buffer.c b/drivers/oprofile/cpu_buffer.c
index 5cf7efe38e67..eb280ec96e24 100644
--- a/drivers/oprofile/cpu_buffer.c
+++ b/drivers/oprofile/cpu_buffer.c
@@ -28,6 +28,25 @@
 #include "buffer_sync.h"
 #include "oprof.h"
 
+#define OP_BUFFER_FLAGS	0
+
+/*
+ * Read and write access is using spin locking. Thus, writing to the
+ * buffer by NMI handler (x86) could occur also during critical
+ * sections when reading the buffer. To avoid this, there are 2
+ * buffers for independent read and write access. Read access is in
+ * process context only, write access only in the NMI handler. If the
+ * read buffer runs empty, both buffers are swapped atomically. There
+ * is potentially a small window during swapping where the buffers are
+ * disabled and samples could be lost.
+ *
+ * Using 2 buffers is a little bit overhead, but the solution is clear
+ * and does not require changes in the ring buffer implementation. It
+ * can be changed to a single buffer solution when the ring buffer
+ * access is implemented as non-locking atomic code.
+ */
+struct ring_buffer *op_ring_buffer_read;
+struct ring_buffer *op_ring_buffer_write;
 DEFINE_PER_CPU(struct oprofile_cpu_buffer, cpu_buffer);
 
 static void wq_sync_buffer(struct work_struct *work);
@@ -37,12 +56,12 @@ static int work_enabled;
 
 void free_cpu_buffers(void)
 {
-	int i;
-
-	for_each_possible_cpu(i) {
-		vfree(per_cpu(cpu_buffer, i).buffer);
-		per_cpu(cpu_buffer, i).buffer = NULL;
-	}
+	if (op_ring_buffer_read)
+		ring_buffer_free(op_ring_buffer_read);
+	op_ring_buffer_read = NULL;
+	if (op_ring_buffer_write)
+		ring_buffer_free(op_ring_buffer_write);
+	op_ring_buffer_write = NULL;
 }
 
 unsigned long oprofile_get_cpu_buffer_size(void)
@@ -64,14 +83,16 @@ int alloc_cpu_buffers(void)
 
 	unsigned long buffer_size = fs_cpu_buffer_size;
 
+	op_ring_buffer_read = ring_buffer_alloc(buffer_size, OP_BUFFER_FLAGS);
+	if (!op_ring_buffer_read)
+		goto fail;
+	op_ring_buffer_write = ring_buffer_alloc(buffer_size, OP_BUFFER_FLAGS);
+	if (!op_ring_buffer_write)
+		goto fail;
+
 	for_each_possible_cpu(i) {
 		struct oprofile_cpu_buffer *b = &per_cpu(cpu_buffer, i);
 
-		b->buffer = vmalloc_node(sizeof(struct op_sample) * buffer_size,
-					 cpu_to_node(i));
-		if (!b->buffer)
-			goto fail;
-
 		b->last_task = NULL;
 		b->last_is_kernel = -1;
 		b->tracing = 0;
@@ -140,10 +161,22 @@ static inline void
 add_sample(struct oprofile_cpu_buffer *cpu_buf,
 	   unsigned long pc, unsigned long event)
 {
-	struct op_sample *entry = cpu_buffer_write_entry(cpu_buf);
-	entry->eip = pc;
-	entry->event = event;
-	cpu_buffer_write_commit(cpu_buf);
+	struct op_entry entry;
+
+	if (cpu_buffer_write_entry(&entry))
+		goto Error;
+
+	entry.sample->eip = pc;
+	entry.sample->event = event;
+
+	if (cpu_buffer_write_commit(&entry))
+		goto Error;
+
+	return;
+
+Error:
+	cpu_buf->sample_lost_overflow++;
+	return;
 }
 
 static inline
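The comment block added above describes the split into op_ring_buffer_read and op_ring_buffer_write; on the producer side this reduces to the usual reserve/fill/commit sequence against the write buffer, which is exactly what the reworked add_sample() does through the new helpers. The sketch below restates that flow as a standalone function for clarity; record_sample() is an illustrative name, not part of the patch, and it assumes the helpers from cpu_buffer.h as introduced here (where reserve/commit still carry an irq_flags argument).

#include "cpu_buffer.h"	/* struct op_entry, cpu_buffer_write_entry()/commit() */

/* Illustrative only: mirrors add_sample(); drops and accounts the sample on failure. */
static int record_sample(struct oprofile_cpu_buffer *cpu_buf,
			 unsigned long pc, unsigned long event)
{
	struct op_entry entry;

	if (cpu_buffer_write_entry(&entry))	/* reserve a slot in op_ring_buffer_write */
		goto fail;

	entry.sample->eip = pc;			/* fill the reserved op_sample in place */
	entry.sample->event = event;

	if (cpu_buffer_write_commit(&entry))	/* publish it to the consumer side */
		goto fail;

	return 0;

fail:
	cpu_buf->sample_lost_overflow++;
	return -ENOMEM;
}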
diff --git a/drivers/oprofile/cpu_buffer.h b/drivers/oprofile/cpu_buffer.h
index 895763f065e9..aacb0f0bc566 100644
--- a/drivers/oprofile/cpu_buffer.h
+++ b/drivers/oprofile/cpu_buffer.h
@@ -15,6 +15,7 @@
 #include <linux/workqueue.h>
 #include <linux/cache.h>
 #include <linux/sched.h>
+#include <linux/ring_buffer.h>
 
 struct task_struct;
 
@@ -32,6 +33,12 @@ struct op_sample {
 	unsigned long event;
 };
 
+struct op_entry {
+	struct ring_buffer_event *event;
+	struct op_sample *sample;
+	unsigned long irq_flags;
+};
+
 struct oprofile_cpu_buffer {
 	volatile unsigned long head_pos;
 	volatile unsigned long tail_pos;
@@ -39,7 +46,6 @@ struct oprofile_cpu_buffer {
 	struct task_struct *last_task;
 	int last_is_kernel;
 	int tracing;
-	struct op_sample *buffer;
 	unsigned long sample_received;
 	unsigned long sample_lost_overflow;
 	unsigned long backtrace_aborted;
@@ -48,6 +54,8 @@ struct oprofile_cpu_buffer {
 	struct delayed_work work;
 };
 
+extern struct ring_buffer *op_ring_buffer_read;
+extern struct ring_buffer *op_ring_buffer_write;
 DECLARE_PER_CPU(struct oprofile_cpu_buffer, cpu_buffer);
 
 /*
@@ -64,46 +72,49 @@ static inline void cpu_buffer_reset(int cpu)
 	cpu_buf->last_task = NULL;
 }
 
-static inline
-struct op_sample *cpu_buffer_write_entry(struct oprofile_cpu_buffer *cpu_buf)
+static inline int cpu_buffer_write_entry(struct op_entry *entry)
 {
-	return &cpu_buf->buffer[cpu_buf->head_pos];
-}
+	entry->event = ring_buffer_lock_reserve(op_ring_buffer_write,
+						sizeof(struct op_sample),
+						&entry->irq_flags);
+	if (entry->event)
+		entry->sample = ring_buffer_event_data(entry->event);
+	else
+		entry->sample = NULL;
 
-static inline
-void cpu_buffer_write_commit(struct oprofile_cpu_buffer *b)
-{
-	unsigned long new_head = b->head_pos + 1;
+	if (!entry->sample)
+		return -ENOMEM;
 
-	/*
-	 * Ensure anything written to the slot before we increment is
-	 * visible
-	 */
-	wmb();
+	return 0;
+}
 
-	if (new_head < b->buffer_size)
-		b->head_pos = new_head;
-	else
-		b->head_pos = 0;
+static inline int cpu_buffer_write_commit(struct op_entry *entry)
+{
+	return ring_buffer_unlock_commit(op_ring_buffer_write, entry->event,
+					 entry->irq_flags);
 }
 
-static inline
-struct op_sample *cpu_buffer_read_entry(struct oprofile_cpu_buffer *cpu_buf)
+static inline struct op_sample *cpu_buffer_read_entry(int cpu)
 {
-	return &cpu_buf->buffer[cpu_buf->tail_pos];
+	struct ring_buffer_event *e;
+	e = ring_buffer_consume(op_ring_buffer_read, cpu, NULL);
+	if (e)
+		return ring_buffer_event_data(e);
+	if (ring_buffer_swap_cpu(op_ring_buffer_read,
+				 op_ring_buffer_write,
+				 cpu))
+		return NULL;
+	e = ring_buffer_consume(op_ring_buffer_read, cpu, NULL);
+	if (e)
+		return ring_buffer_event_data(e);
+	return NULL;
 }
 
 /* "acquire" as many cpu buffer slots as we can */
-static inline
-unsigned long cpu_buffer_entries(struct oprofile_cpu_buffer *b)
+static inline unsigned long cpu_buffer_entries(int cpu)
 {
-	unsigned long head = b->head_pos;
-	unsigned long tail = b->tail_pos;
-
-	if (head >= tail)
-		return head - tail;
-
-	return head + (b->buffer_size - tail);
+	return ring_buffer_entries_cpu(op_ring_buffer_read, cpu)
+		+ ring_buffer_entries_cpu(op_ring_buffer_write, cpu);
 }
 
 /* transient events for the CPU buffer -> event buffer */