Diffstat (limited to 'drivers/oprofile/cpu_buffer.c')
-rw-r--r--  drivers/oprofile/cpu_buffer.c | 316
1 file changed, 201 insertions(+), 115 deletions(-)
diff --git a/drivers/oprofile/cpu_buffer.c b/drivers/oprofile/cpu_buffer.c
index 61090969158f..2e03b6d796d3 100644
--- a/drivers/oprofile/cpu_buffer.c
+++ b/drivers/oprofile/cpu_buffer.c
@@ -1,11 +1,12 @@
 /**
  * @file cpu_buffer.c
  *
- * @remark Copyright 2002 OProfile authors
+ * @remark Copyright 2002-2009 OProfile authors
  * @remark Read the file COPYING
  *
  * @author John Levon <levon@movementarian.org>
  * @author Barry Kasindorf <barry.kasindorf@amd.com>
+ * @author Robert Richter <robert.richter@amd.com>
  *
  * Each CPU has a local buffer that stores PC value/event
  * pairs. We also log context switches when we notice them.
@@ -45,8 +46,8 @@
  * can be changed to a single buffer solution when the ring buffer
  * access is implemented as non-locking atomic code.
  */
-struct ring_buffer *op_ring_buffer_read;
-struct ring_buffer *op_ring_buffer_write;
+static struct ring_buffer *op_ring_buffer_read;
+static struct ring_buffer *op_ring_buffer_write;
 DEFINE_PER_CPU(struct oprofile_cpu_buffer, cpu_buffer);
 
 static void wq_sync_buffer(struct work_struct *work);
@@ -54,19 +55,9 @@ static void wq_sync_buffer(struct work_struct *work);
 #define DEFAULT_TIMER_EXPIRE (HZ / 10)
 static int work_enabled;
 
-void free_cpu_buffers(void)
-{
-	if (op_ring_buffer_read)
-		ring_buffer_free(op_ring_buffer_read);
-	op_ring_buffer_read = NULL;
-	if (op_ring_buffer_write)
-		ring_buffer_free(op_ring_buffer_write);
-	op_ring_buffer_write = NULL;
-}
-
 unsigned long oprofile_get_cpu_buffer_size(void)
 {
-	return fs_cpu_buffer_size;
+	return oprofile_cpu_buffer_size;
 }
 
 void oprofile_cpu_buffer_inc_smpl_lost(void)
@@ -77,11 +68,21 @@ void oprofile_cpu_buffer_inc_smpl_lost(void)
 	cpu_buf->sample_lost_overflow++;
 }
 
+void free_cpu_buffers(void)
+{
+	if (op_ring_buffer_read)
+		ring_buffer_free(op_ring_buffer_read);
+	op_ring_buffer_read = NULL;
+	if (op_ring_buffer_write)
+		ring_buffer_free(op_ring_buffer_write);
+	op_ring_buffer_write = NULL;
+}
+
 int alloc_cpu_buffers(void)
 {
 	int i;
 
-	unsigned long buffer_size = fs_cpu_buffer_size;
+	unsigned long buffer_size = oprofile_cpu_buffer_size;
 
 	op_ring_buffer_read = ring_buffer_alloc(buffer_size, OP_BUFFER_FLAGS);
 	if (!op_ring_buffer_read)
@@ -97,8 +98,6 @@ int alloc_cpu_buffers(void)
 		b->last_is_kernel = -1;
 		b->tracing = 0;
 		b->buffer_size = buffer_size;
-		b->tail_pos = 0;
-		b->head_pos = 0;
 		b->sample_received = 0;
 		b->sample_lost_overflow = 0;
 		b->backtrace_aborted = 0;
@@ -145,47 +144,156 @@ void end_cpu_work(void)
 	flush_scheduled_work();
 }
 
-static inline int
-add_sample(struct oprofile_cpu_buffer *cpu_buf,
-	   unsigned long pc, unsigned long event)
+/*
+ * This function prepares the cpu buffer to write a sample.
+ *
+ * Struct op_entry is used during operations on the ring buffer while
+ * struct op_sample contains the data that is stored in the ring
+ * buffer. Struct entry can be uninitialized. The function reserves a
+ * data array that is specified by size. Use
+ * op_cpu_buffer_write_commit() after preparing the sample. In case of
+ * errors a null pointer is returned, otherwise the pointer to the
+ * sample.
+ *
+ */
+struct op_sample
+*op_cpu_buffer_write_reserve(struct op_entry *entry, unsigned long size)
+{
+	entry->event = ring_buffer_lock_reserve
+		(op_ring_buffer_write, sizeof(struct op_sample) +
+		 size * sizeof(entry->sample->data[0]), &entry->irq_flags);
+	if (entry->event)
+		entry->sample = ring_buffer_event_data(entry->event);
+	else
+		entry->sample = NULL;
+
+	if (!entry->sample)
+		return NULL;
+
+	entry->size = size;
+	entry->data = entry->sample->data;
+
+	return entry->sample;
+}
+
+int op_cpu_buffer_write_commit(struct op_entry *entry)
+{
+	return ring_buffer_unlock_commit(op_ring_buffer_write, entry->event,
+					 entry->irq_flags);
+}
+
+struct op_sample *op_cpu_buffer_read_entry(struct op_entry *entry, int cpu)
+{
+	struct ring_buffer_event *e;
+	e = ring_buffer_consume(op_ring_buffer_read, cpu, NULL);
+	if (e)
+		goto event;
+	if (ring_buffer_swap_cpu(op_ring_buffer_read,
+				 op_ring_buffer_write,
+				 cpu))
+		return NULL;
+	e = ring_buffer_consume(op_ring_buffer_read, cpu, NULL);
+	if (e)
+		goto event;
+	return NULL;
+
+event:
+	entry->event = e;
+	entry->sample = ring_buffer_event_data(e);
+	entry->size = (ring_buffer_event_length(e) - sizeof(struct op_sample))
+		/ sizeof(entry->sample->data[0]);
+	entry->data = entry->sample->data;
+	return entry->sample;
+}
+
+unsigned long op_cpu_buffer_entries(int cpu)
+{
+	return ring_buffer_entries_cpu(op_ring_buffer_read, cpu)
+		+ ring_buffer_entries_cpu(op_ring_buffer_write, cpu);
+}
+
+static int
+op_add_code(struct oprofile_cpu_buffer *cpu_buf, unsigned long backtrace,
+	    int is_kernel, struct task_struct *task)
 {
 	struct op_entry entry;
-	int ret;
+	struct op_sample *sample;
+	unsigned long flags;
+	int size;
+
+	flags = 0;
+
+	if (backtrace)
+		flags |= TRACE_BEGIN;
+
+	/* notice a switch from user->kernel or vice versa */
+	is_kernel = !!is_kernel;
+	if (cpu_buf->last_is_kernel != is_kernel) {
+		cpu_buf->last_is_kernel = is_kernel;
+		flags |= KERNEL_CTX_SWITCH;
+		if (is_kernel)
+			flags |= IS_KERNEL;
+	}
+
+	/* notice a task switch */
+	if (cpu_buf->last_task != task) {
+		cpu_buf->last_task = task;
+		flags |= USER_CTX_SWITCH;
+	}
+
+	if (!flags)
+		/* nothing to do */
+		return 0;
+
+	if (flags & USER_CTX_SWITCH)
+		size = 1;
+	else
+		size = 0;
+
+	sample = op_cpu_buffer_write_reserve(&entry, size);
+	if (!sample)
+		return -ENOMEM;
 
-	ret = cpu_buffer_write_entry(&entry);
-	if (ret)
-		return ret;
+	sample->eip = ESCAPE_CODE;
+	sample->event = flags;
 
-	entry.sample->eip = pc;
-	entry.sample->event = event;
+	if (size)
+		op_cpu_buffer_add_data(&entry, (unsigned long)task);
 
-	ret = cpu_buffer_write_commit(&entry);
-	if (ret)
-		return ret;
+	op_cpu_buffer_write_commit(&entry);
 
 	return 0;
 }
 
 static inline int
-add_code(struct oprofile_cpu_buffer *buffer, unsigned long value)
+op_add_sample(struct oprofile_cpu_buffer *cpu_buf,
+	      unsigned long pc, unsigned long event)
 {
-	return add_sample(buffer, ESCAPE_CODE, value);
+	struct op_entry entry;
+	struct op_sample *sample;
+
+	sample = op_cpu_buffer_write_reserve(&entry, 0);
+	if (!sample)
+		return -ENOMEM;
+
+	sample->eip = pc;
+	sample->event = event;
+
+	return op_cpu_buffer_write_commit(&entry);
 }
 
-/* This must be safe from any context. It's safe writing here
- * because of the head/tail separation of the writer and reader
- * of the CPU buffer.
+/*
+ * This must be safe from any context.
  *
  * is_kernel is needed because on some architectures you cannot
  * tell if you are in kernel or user space simply by looking at
  * pc. We tag this in the buffer by generating kernel enter/exit
  * events whenever is_kernel changes
  */
-static int log_sample(struct oprofile_cpu_buffer *cpu_buf, unsigned long pc,
-		      int is_kernel, unsigned long event)
+static int
+log_sample(struct oprofile_cpu_buffer *cpu_buf, unsigned long pc,
+	   unsigned long backtrace, int is_kernel, unsigned long event)
 {
-	struct task_struct *task;
-
 	cpu_buf->sample_received++;
 
 	if (pc == ESCAPE_CODE) {
@@ -193,25 +301,10 @@ static int log_sample(struct oprofile_cpu_buffer *cpu_buf, unsigned long pc,
 		return 0;
 	}
 
-	is_kernel = !!is_kernel;
-
-	task = current;
-
-	/* notice a switch from user->kernel or vice versa */
-	if (cpu_buf->last_is_kernel != is_kernel) {
-		cpu_buf->last_is_kernel = is_kernel;
-		if (add_code(cpu_buf, is_kernel))
-			goto fail;
-	}
-
-	/* notice a task switch */
-	if (cpu_buf->last_task != task) {
-		cpu_buf->last_task = task;
-		if (add_code(cpu_buf, (unsigned long)task))
-			goto fail;
-	}
+	if (op_add_code(cpu_buf, backtrace, is_kernel, current))
+		goto fail;
 
-	if (add_sample(cpu_buf, pc, event))
+	if (op_add_sample(cpu_buf, pc, event))
 		goto fail;
 
 	return 1;
@@ -221,109 +314,102 @@ fail:
 	return 0;
 }
 
-static int oprofile_begin_trace(struct oprofile_cpu_buffer *cpu_buf)
+static inline void oprofile_begin_trace(struct oprofile_cpu_buffer *cpu_buf)
 {
-	add_code(cpu_buf, CPU_TRACE_BEGIN);
 	cpu_buf->tracing = 1;
-	return 1;
 }
 
-static void oprofile_end_trace(struct oprofile_cpu_buffer *cpu_buf)
+static inline void oprofile_end_trace(struct oprofile_cpu_buffer *cpu_buf)
 {
 	cpu_buf->tracing = 0;
 }
 
-void oprofile_add_ext_sample(unsigned long pc, struct pt_regs * const regs,
-			     unsigned long event, int is_kernel)
+static inline void
+__oprofile_add_ext_sample(unsigned long pc, struct pt_regs * const regs,
+			  unsigned long event, int is_kernel)
 {
 	struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer);
-
-	if (!backtrace_depth) {
-		log_sample(cpu_buf, pc, is_kernel, event);
-		return;
-	}
-
-	if (!oprofile_begin_trace(cpu_buf))
-		return;
+	unsigned long backtrace = oprofile_backtrace_depth;
 
 	/*
 	 * if log_sample() fail we can't backtrace since we lost the
	 * source of this event
 	 */
-	if (log_sample(cpu_buf, pc, is_kernel, event))
-		oprofile_ops.backtrace(regs, backtrace_depth);
+	if (!log_sample(cpu_buf, pc, backtrace, is_kernel, event))
+		/* failed */
+		return;
+
+	if (!backtrace)
+		return;
+
+	oprofile_begin_trace(cpu_buf);
+	oprofile_ops.backtrace(regs, backtrace);
 	oprofile_end_trace(cpu_buf);
 }
 
+void oprofile_add_ext_sample(unsigned long pc, struct pt_regs * const regs,
+			     unsigned long event, int is_kernel)
+{
+	__oprofile_add_ext_sample(pc, regs, event, is_kernel);
+}
+
 void oprofile_add_sample(struct pt_regs * const regs, unsigned long event)
 {
 	int is_kernel = !user_mode(regs);
 	unsigned long pc = profile_pc(regs);
 
-	oprofile_add_ext_sample(pc, regs, event, is_kernel);
+	__oprofile_add_ext_sample(pc, regs, event, is_kernel);
 }
 
-#ifdef CONFIG_OPROFILE_IBS
-
-#define MAX_IBS_SAMPLE_SIZE 14
-
-void oprofile_add_ibs_sample(struct pt_regs * const regs,
-			     unsigned int * const ibs_sample, int ibs_code)
+/*
+ * Add samples with data to the ring buffer.
+ *
+ * Use oprofile_add_data(&entry, val) to add data and
+ * oprofile_write_commit(&entry) to commit the sample.
+ */
+void
+oprofile_write_reserve(struct op_entry *entry, struct pt_regs * const regs,
+		       unsigned long pc, int code, int size)
 {
+	struct op_sample *sample;
 	int is_kernel = !user_mode(regs);
 	struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer);
-	struct task_struct *task;
-	int fail = 0;
 
 	cpu_buf->sample_received++;
 
-	/* notice a switch from user->kernel or vice versa */
-	if (cpu_buf->last_is_kernel != is_kernel) {
-		if (add_code(cpu_buf, is_kernel))
-			goto fail;
-		cpu_buf->last_is_kernel = is_kernel;
-	}
-
-	/* notice a task switch */
-	if (!is_kernel) {
-		task = current;
-		if (cpu_buf->last_task != task) {
-			if (add_code(cpu_buf, (unsigned long)task))
-				goto fail;
-			cpu_buf->last_task = task;
-		}
-	}
-
-	fail = fail || add_code(cpu_buf, ibs_code);
-	fail = fail || add_sample(cpu_buf, ibs_sample[0], ibs_sample[1]);
-	fail = fail || add_sample(cpu_buf, ibs_sample[2], ibs_sample[3]);
-	fail = fail || add_sample(cpu_buf, ibs_sample[4], ibs_sample[5]);
-
-	if (ibs_code == IBS_OP_BEGIN) {
-		fail = fail || add_sample(cpu_buf, ibs_sample[6], ibs_sample[7]);
-		fail = fail || add_sample(cpu_buf, ibs_sample[8], ibs_sample[9]);
-		fail = fail || add_sample(cpu_buf, ibs_sample[10], ibs_sample[11]);
-	}
+	/* no backtraces for samples with data */
+	if (op_add_code(cpu_buf, 0, is_kernel, current))
+		goto fail;
 
-	if (fail)
+	sample = op_cpu_buffer_write_reserve(entry, size + 2);
+	if (!sample)
 		goto fail;
+	sample->eip = ESCAPE_CODE;
+	sample->event = 0; /* no flags */
 
-	if (backtrace_depth)
-		oprofile_ops.backtrace(regs, backtrace_depth);
+	op_cpu_buffer_add_data(entry, code);
+	op_cpu_buffer_add_data(entry, pc);
 
 	return;
 
 fail:
 	cpu_buf->sample_lost_overflow++;
-	return;
 }
 
-#endif
+int oprofile_add_data(struct op_entry *entry, unsigned long val)
+{
+	return op_cpu_buffer_add_data(entry, val);
+}
+
+int oprofile_write_commit(struct op_entry *entry)
+{
+	return op_cpu_buffer_write_commit(entry);
+}
 
 void oprofile_add_pc(unsigned long pc, int is_kernel, unsigned long event)
 {
 	struct oprofile_cpu_buffer *cpu_buf = &__get_cpu_var(cpu_buffer);
-	log_sample(cpu_buf, pc, is_kernel, event);
+	log_sample(cpu_buf, pc, 0, is_kernel, event);
 }
 
 void oprofile_add_trace(unsigned long pc)
@@ -340,7 +426,7 @@ void oprofile_add_trace(unsigned long pc)
 	if (pc == ESCAPE_CODE)
 		goto fail;
 
-	if (add_sample(cpu_buf, pc, 0))
+	if (op_add_sample(cpu_buf, pc, 0))
 		goto fail;
 
 	return;
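
The op_cpu_buffer_write_reserve()/op_cpu_buffer_write_commit() pair added above forms the producer side of the per-CPU ring buffer, while op_cpu_buffer_read_entry() and op_cpu_buffer_entries() form the consumer side. A minimal sketch of the consumer loop follows; it is illustrative only, assumes the struct op_entry/struct op_sample declarations from this series' cpu_buffer.h are in scope, and process_sample() is a hypothetical placeholder for whatever the event-buffer sync code does with each entry.

/* Illustrative sketch only -- not part of this commit. */
static void example_drain_cpu(int cpu)
{
	struct op_entry entry;
	struct op_sample *sample;
	unsigned long avail = op_cpu_buffer_entries(cpu);

	while (avail--) {
		sample = op_cpu_buffer_read_entry(&entry, cpu);
		if (!sample)
			break;
		/*
		 * sample->eip and sample->event are valid here, plus
		 * entry.size extra data words in entry.data[].
		 */
		process_sample(sample, &entry);	/* hypothetical consumer */
	}
}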
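
The removed oprofile_add_ibs_sample() interface is superseded by the more general oprofile_write_reserve()/oprofile_add_data()/oprofile_write_commit() sequence described in the comment above. A hedged sketch of that calling sequence, as an architecture driver might use it, is shown below; MY_SAMPLE_CODE, the data words, and the surrounding function are illustrative assumptions, error handling is elided, and the declarations introduced by this series are assumed to be visible.

/* Illustrative sketch only -- not part of this commit. */
#define MY_SAMPLE_CODE	13	/* hypothetical escape sub-code */

static void example_add_sample_with_data(struct pt_regs * const regs,
					 unsigned long pc,
					 unsigned long data0,
					 unsigned long data1)
{
	struct op_entry entry;

	/* reserves the escape header plus code, pc and 2 caller data words */
	oprofile_write_reserve(&entry, regs, pc, MY_SAMPLE_CODE, 2);
	oprofile_add_data(&entry, data0);
	oprofile_add_data(&entry, data1);
	oprofile_write_commit(&entry);
}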