diff options
Diffstat (limited to 'kernel/tracepoint.c')
| -rw-r--r-- | kernel/tracepoint.c | 295 |
1 files changed, 193 insertions, 102 deletions
diff --git a/kernel/tracepoint.c b/kernel/tracepoint.c index af8c85664882..79602740bbb5 100644 --- a/kernel/tracepoint.c +++ b/kernel/tracepoint.c | |||
| @@ -43,6 +43,7 @@ static DEFINE_MUTEX(tracepoints_mutex); | |||
| 43 | */ | 43 | */ |
| 44 | #define TRACEPOINT_HASH_BITS 6 | 44 | #define TRACEPOINT_HASH_BITS 6 |
| 45 | #define TRACEPOINT_TABLE_SIZE (1 << TRACEPOINT_HASH_BITS) | 45 | #define TRACEPOINT_TABLE_SIZE (1 << TRACEPOINT_HASH_BITS) |
| 46 | static struct hlist_head tracepoint_table[TRACEPOINT_TABLE_SIZE]; | ||
| 46 | 47 | ||
| 47 | /* | 48 | /* |
| 48 | * Note about RCU : | 49 | * Note about RCU : |
| @@ -54,40 +55,43 @@ struct tracepoint_entry { | |||
| 54 | struct hlist_node hlist; | 55 | struct hlist_node hlist; |
| 55 | void **funcs; | 56 | void **funcs; |
| 56 | int refcount; /* Number of times armed. 0 if disarmed. */ | 57 | int refcount; /* Number of times armed. 0 if disarmed. */ |
| 57 | struct rcu_head rcu; | ||
| 58 | void *oldptr; | ||
| 59 | unsigned char rcu_pending:1; | ||
| 60 | char name[0]; | 58 | char name[0]; |
| 61 | }; | 59 | }; |
| 62 | 60 | ||
| 63 | static struct hlist_head tracepoint_table[TRACEPOINT_TABLE_SIZE]; | 61 | struct tp_probes { |
| 62 | union { | ||
| 63 | struct rcu_head rcu; | ||
| 64 | struct list_head list; | ||
| 65 | } u; | ||
| 66 | void *probes[0]; | ||
| 67 | }; | ||
| 64 | 68 | ||
| 65 | static void free_old_closure(struct rcu_head *head) | 69 | static inline void *allocate_probes(int count) |
| 66 | { | 70 | { |
| 67 | struct tracepoint_entry *entry = container_of(head, | 71 | struct tp_probes *p = kmalloc(count * sizeof(void *) |
| 68 | struct tracepoint_entry, rcu); | 72 | + sizeof(struct tp_probes), GFP_KERNEL); |
| 69 | kfree(entry->oldptr); | 73 | return p == NULL ? NULL : p->probes; |
| 70 | /* Make sure we free the data before setting the pending flag to 0 */ | ||
| 71 | smp_wmb(); | ||
| 72 | entry->rcu_pending = 0; | ||
| 73 | } | 74 | } |
| 74 | 75 | ||
| 75 | static void tracepoint_entry_free_old(struct tracepoint_entry *entry, void *old) | 76 | static void rcu_free_old_probes(struct rcu_head *head) |
| 76 | { | 77 | { |
| 77 | if (!old) | 78 | kfree(container_of(head, struct tp_probes, u.rcu)); |
| 78 | return; | 79 | } |
| 79 | entry->oldptr = old; | 80 | |
| 80 | entry->rcu_pending = 1; | 81 | static inline void release_probes(void *old) |
| 81 | /* write rcu_pending before calling the RCU callback */ | 82 | { |
| 82 | smp_wmb(); | 83 | if (old) { |
| 83 | call_rcu_sched(&entry->rcu, free_old_closure); | 84 | struct tp_probes *tp_probes = container_of(old, |
| 85 | struct tp_probes, probes[0]); | ||
| 86 | call_rcu_sched(&tp_probes->u.rcu, rcu_free_old_probes); | ||
| 87 | } | ||
| 84 | } | 88 | } |
| 85 | 89 | ||
| 86 | static void debug_print_probes(struct tracepoint_entry *entry) | 90 | static void debug_print_probes(struct tracepoint_entry *entry) |
| 87 | { | 91 | { |
| 88 | int i; | 92 | int i; |
| 89 | 93 | ||
| 90 | if (!tracepoint_debug) | 94 | if (!tracepoint_debug || !entry->funcs) |
| 91 | return; | 95 | return; |
| 92 | 96 | ||
| 93 | for (i = 0; entry->funcs[i]; i++) | 97 | for (i = 0; entry->funcs[i]; i++) |
| @@ -111,12 +115,13 @@ tracepoint_entry_add_probe(struct tracepoint_entry *entry, void *probe) | |||
| 111 | return ERR_PTR(-EEXIST); | 115 | return ERR_PTR(-EEXIST); |
| 112 | } | 116 | } |
| 113 | /* + 2 : one for new probe, one for NULL func */ | 117 | /* + 2 : one for new probe, one for NULL func */ |
| 114 | new = kzalloc((nr_probes + 2) * sizeof(void *), GFP_KERNEL); | 118 | new = allocate_probes(nr_probes + 2); |
| 115 | if (new == NULL) | 119 | if (new == NULL) |
| 116 | return ERR_PTR(-ENOMEM); | 120 | return ERR_PTR(-ENOMEM); |
| 117 | if (old) | 121 | if (old) |
| 118 | memcpy(new, old, nr_probes * sizeof(void *)); | 122 | memcpy(new, old, nr_probes * sizeof(void *)); |
| 119 | new[nr_probes] = probe; | 123 | new[nr_probes] = probe; |
| 124 | new[nr_probes + 1] = NULL; | ||
| 120 | entry->refcount = nr_probes + 1; | 125 | entry->refcount = nr_probes + 1; |
| 121 | entry->funcs = new; | 126 | entry->funcs = new; |
| 122 | debug_print_probes(entry); | 127 | debug_print_probes(entry); |
| @@ -132,7 +137,7 @@ tracepoint_entry_remove_probe(struct tracepoint_entry *entry, void *probe) | |||
| 132 | old = entry->funcs; | 137 | old = entry->funcs; |
| 133 | 138 | ||
| 134 | if (!old) | 139 | if (!old) |
| 135 | return NULL; | 140 | return ERR_PTR(-ENOENT); |
| 136 | 141 | ||
| 137 | debug_print_probes(entry); | 142 | debug_print_probes(entry); |
| 138 | /* (N -> M), (N > 1, M >= 0) probes */ | 143 | /* (N -> M), (N > 1, M >= 0) probes */ |
| @@ -151,13 +156,13 @@ tracepoint_entry_remove_probe(struct tracepoint_entry *entry, void *probe) | |||
| 151 | int j = 0; | 156 | int j = 0; |
| 152 | /* N -> M, (N > 1, M > 0) */ | 157 | /* N -> M, (N > 1, M > 0) */ |
| 153 | /* + 1 for NULL */ | 158 | /* + 1 for NULL */ |
| 154 | new = kzalloc((nr_probes - nr_del + 1) | 159 | new = allocate_probes(nr_probes - nr_del + 1); |
| 155 | * sizeof(void *), GFP_KERNEL); | ||
| 156 | if (new == NULL) | 160 | if (new == NULL) |
| 157 | return ERR_PTR(-ENOMEM); | 161 | return ERR_PTR(-ENOMEM); |
| 158 | for (i = 0; old[i]; i++) | 162 | for (i = 0; old[i]; i++) |
| 159 | if ((probe && old[i] != probe)) | 163 | if ((probe && old[i] != probe)) |
| 160 | new[j++] = old[i]; | 164 | new[j++] = old[i]; |
| 165 | new[nr_probes - nr_del] = NULL; | ||
| 161 | entry->refcount = nr_probes - nr_del; | 166 | entry->refcount = nr_probes - nr_del; |
| 162 | entry->funcs = new; | 167 | entry->funcs = new; |
| 163 | } | 168 | } |
| @@ -215,7 +220,6 @@ static struct tracepoint_entry *add_tracepoint(const char *name) | |||
| 215 | memcpy(&e->name[0], name, name_len); | 220 | memcpy(&e->name[0], name, name_len); |
| 216 | e->funcs = NULL; | 221 | e->funcs = NULL; |
| 217 | e->refcount = 0; | 222 | e->refcount = 0; |
| 218 | e->rcu_pending = 0; | ||
| 219 | hlist_add_head(&e->hlist, head); | 223 | hlist_add_head(&e->hlist, head); |
| 220 | return e; | 224 | return e; |
| 221 | } | 225 | } |
| @@ -224,32 +228,10 @@ static struct tracepoint_entry *add_tracepoint(const char *name) | |||
| 224 | * Remove the tracepoint from the tracepoint hash table. Must be called with | 228 | * Remove the tracepoint from the tracepoint hash table. Must be called with |
| 225 | * mutex_lock held. | 229 | * mutex_lock held. |
| 226 | */ | 230 | */ |
| 227 | static int remove_tracepoint(const char *name) | 231 | static inline void remove_tracepoint(struct tracepoint_entry *e) |
| 228 | { | 232 | { |
| 229 | struct hlist_head *head; | ||
| 230 | struct hlist_node *node; | ||
| 231 | struct tracepoint_entry *e; | ||
| 232 | int found = 0; | ||
| 233 | size_t len = strlen(name) + 1; | ||
| 234 | u32 hash = jhash(name, len-1, 0); | ||
| 235 | |||
| 236 | head = &tracepoint_table[hash & (TRACEPOINT_TABLE_SIZE - 1)]; | ||
| 237 | hlist_for_each_entry(e, node, head, hlist) { | ||
| 238 | if (!strcmp(name, e->name)) { | ||
| 239 | found = 1; | ||
| 240 | break; | ||
| 241 | } | ||
| 242 | } | ||
| 243 | if (!found) | ||
| 244 | return -ENOENT; | ||
| 245 | if (e->refcount) | ||
| 246 | return -EBUSY; | ||
| 247 | hlist_del(&e->hlist); | 233 | hlist_del(&e->hlist); |
| 248 | /* Make sure the call_rcu_sched has been executed */ | ||
| 249 | if (e->rcu_pending) | ||
| 250 | rcu_barrier_sched(); | ||
| 251 | kfree(e); | 234 | kfree(e); |
| 252 | return 0; | ||
| 253 | } | 235 | } |
| 254 | 236 | ||
| 255 | /* | 237 | /* |
| @@ -280,6 +262,7 @@ static void set_tracepoint(struct tracepoint_entry **entry, | |||
| 280 | static void disable_tracepoint(struct tracepoint *elem) | 262 | static void disable_tracepoint(struct tracepoint *elem) |
| 281 | { | 263 | { |
| 282 | elem->state = 0; | 264 | elem->state = 0; |
| 265 | rcu_assign_pointer(elem->funcs, NULL); | ||
| 283 | } | 266 | } |
| 284 | 267 | ||
| 285 | /** | 268 | /** |
| @@ -320,6 +303,23 @@ static void tracepoint_update_probes(void) | |||
| 320 | module_update_tracepoints(); | 303 | module_update_tracepoints(); |
| 321 | } | 304 | } |
| 322 | 305 | ||
| 306 | static void *tracepoint_add_probe(const char *name, void *probe) | ||
| 307 | { | ||
| 308 | struct tracepoint_entry *entry; | ||
| 309 | void *old; | ||
| 310 | |||
| 311 | entry = get_tracepoint(name); | ||
| 312 | if (!entry) { | ||
| 313 | entry = add_tracepoint(name); | ||
| 314 | if (IS_ERR(entry)) | ||
| 315 | return entry; | ||
| 316 | } | ||
| 317 | old = tracepoint_entry_add_probe(entry, probe); | ||
| 318 | if (IS_ERR(old) && !entry->refcount) | ||
| 319 | remove_tracepoint(entry); | ||
| 320 | return old; | ||
| 321 | } | ||
| 322 | |||
| 323 | /** | 323 | /** |
| 324 | * tracepoint_probe_register - Connect a probe to a tracepoint | 324 | * tracepoint_probe_register - Connect a probe to a tracepoint |
| 325 | * @name: tracepoint name | 325 | * @name: tracepoint name |
| @@ -330,44 +330,36 @@ static void tracepoint_update_probes(void) | |||
| 330 | */ | 330 | */ |
| 331 | int tracepoint_probe_register(const char *name, void *probe) | 331 | int tracepoint_probe_register(const char *name, void *probe) |
| 332 | { | 332 | { |
| 333 | struct tracepoint_entry *entry; | ||
| 334 | int ret = 0; | ||
| 335 | void *old; | 333 | void *old; |
| 336 | 334 | ||
| 337 | mutex_lock(&tracepoints_mutex); | 335 | mutex_lock(&tracepoints_mutex); |
| 338 | entry = get_tracepoint(name); | 336 | old = tracepoint_add_probe(name, probe); |
| 339 | if (!entry) { | ||
| 340 | entry = add_tracepoint(name); | ||
| 341 | if (IS_ERR(entry)) { | ||
| 342 | ret = PTR_ERR(entry); | ||
| 343 | goto end; | ||
| 344 | } | ||
| 345 | } | ||
| 346 | /* | ||
| 347 | * If we detect that a call_rcu_sched is pending for this tracepoint, | ||
| 348 | * make sure it's executed now. | ||
| 349 | */ | ||
| 350 | if (entry->rcu_pending) | ||
| 351 | rcu_barrier_sched(); | ||
| 352 | old = tracepoint_entry_add_probe(entry, probe); | ||
| 353 | if (IS_ERR(old)) { | ||
| 354 | ret = PTR_ERR(old); | ||
| 355 | goto end; | ||
| 356 | } | ||
| 357 | mutex_unlock(&tracepoints_mutex); | 337 | mutex_unlock(&tracepoints_mutex); |
| 338 | if (IS_ERR(old)) | ||
| 339 | return PTR_ERR(old); | ||
| 340 | |||
| 358 | tracepoint_update_probes(); /* may update entry */ | 341 | tracepoint_update_probes(); /* may update entry */ |
| 359 | mutex_lock(&tracepoints_mutex); | 342 | release_probes(old); |
| 360 | entry = get_tracepoint(name); | 343 | return 0; |
| 361 | WARN_ON(!entry); | ||
| 362 | if (entry->rcu_pending) | ||
| 363 | rcu_barrier_sched(); | ||
| 364 | tracepoint_entry_free_old(entry, old); | ||
| 365 | end: | ||
| 366 | mutex_unlock(&tracepoints_mutex); | ||
| 367 | return ret; | ||
| 368 | } | 344 | } |
| 369 | EXPORT_SYMBOL_GPL(tracepoint_probe_register); | 345 | EXPORT_SYMBOL_GPL(tracepoint_probe_register); |
| 370 | 346 | ||
| 347 | static void *tracepoint_remove_probe(const char *name, void *probe) | ||
| 348 | { | ||
| 349 | struct tracepoint_entry *entry; | ||
| 350 | void *old; | ||
| 351 | |||
| 352 | entry = get_tracepoint(name); | ||
| 353 | if (!entry) | ||
| 354 | return ERR_PTR(-ENOENT); | ||
| 355 | old = tracepoint_entry_remove_probe(entry, probe); | ||
| 356 | if (IS_ERR(old)) | ||
| 357 | return old; | ||
| 358 | if (!entry->refcount) | ||
| 359 | remove_tracepoint(entry); | ||
| 360 | return old; | ||
| 361 | } | ||
| 362 | |||
| 371 | /** | 363 | /** |
| 372 | * tracepoint_probe_unregister - Disconnect a probe from a tracepoint | 364 | * tracepoint_probe_unregister - Disconnect a probe from a tracepoint |
| 373 | * @name: tracepoint name | 365 | * @name: tracepoint name |
| @@ -380,38 +372,104 @@ EXPORT_SYMBOL_GPL(tracepoint_probe_register); | |||
| 380 | */ | 372 | */ |
| 381 | int tracepoint_probe_unregister(const char *name, void *probe) | 373 | int tracepoint_probe_unregister(const char *name, void *probe) |
| 382 | { | 374 | { |
| 383 | struct tracepoint_entry *entry; | ||
| 384 | void *old; | 375 | void *old; |
| 385 | int ret = -ENOENT; | ||
| 386 | 376 | ||
| 387 | mutex_lock(&tracepoints_mutex); | 377 | mutex_lock(&tracepoints_mutex); |
| 388 | entry = get_tracepoint(name); | 378 | old = tracepoint_remove_probe(name, probe); |
| 389 | if (!entry) | ||
| 390 | goto end; | ||
| 391 | if (entry->rcu_pending) | ||
| 392 | rcu_barrier_sched(); | ||
| 393 | old = tracepoint_entry_remove_probe(entry, probe); | ||
| 394 | if (!old) { | ||
| 395 | printk(KERN_WARNING "Warning: Trying to unregister a probe" | ||
| 396 | "that doesn't exist\n"); | ||
| 397 | goto end; | ||
| 398 | } | ||
| 399 | mutex_unlock(&tracepoints_mutex); | 379 | mutex_unlock(&tracepoints_mutex); |
| 380 | if (IS_ERR(old)) | ||
| 381 | return PTR_ERR(old); | ||
| 382 | |||
| 400 | tracepoint_update_probes(); /* may update entry */ | 383 | tracepoint_update_probes(); /* may update entry */ |
| 384 | release_probes(old); | ||
| 385 | return 0; | ||
| 386 | } | ||
| 387 | EXPORT_SYMBOL_GPL(tracepoint_probe_unregister); | ||
| 388 | |||
| 389 | static LIST_HEAD(old_probes); | ||
| 390 | static int need_update; | ||
| 391 | |||
| 392 | static void tracepoint_add_old_probes(void *old) | ||
| 393 | { | ||
| 394 | need_update = 1; | ||
| 395 | if (old) { | ||
| 396 | struct tp_probes *tp_probes = container_of(old, | ||
| 397 | struct tp_probes, probes[0]); | ||
| 398 | list_add(&tp_probes->u.list, &old_probes); | ||
| 399 | } | ||
| 400 | } | ||
| 401 | |||
| 402 | /** | ||
| 403 | * tracepoint_probe_register_noupdate - register a probe but not connect | ||
| 404 | * @name: tracepoint name | ||
| 405 | * @probe: probe handler | ||
| 406 | * | ||
| 407 | * caller must call tracepoint_probe_update_all() | ||
| 408 | */ | ||
| 409 | int tracepoint_probe_register_noupdate(const char *name, void *probe) | ||
| 410 | { | ||
| 411 | void *old; | ||
| 412 | |||
| 401 | mutex_lock(&tracepoints_mutex); | 413 | mutex_lock(&tracepoints_mutex); |
| 402 | entry = get_tracepoint(name); | 414 | old = tracepoint_add_probe(name, probe); |
| 403 | if (!entry) | 415 | if (IS_ERR(old)) { |
| 404 | goto end; | 416 | mutex_unlock(&tracepoints_mutex); |
| 405 | if (entry->rcu_pending) | 417 | return PTR_ERR(old); |
| 406 | rcu_barrier_sched(); | 418 | } |
| 407 | tracepoint_entry_free_old(entry, old); | 419 | tracepoint_add_old_probes(old); |
| 408 | remove_tracepoint(name); /* Ignore busy error message */ | ||
| 409 | ret = 0; | ||
| 410 | end: | ||
| 411 | mutex_unlock(&tracepoints_mutex); | 420 | mutex_unlock(&tracepoints_mutex); |
| 412 | return ret; | 421 | return 0; |
| 413 | } | 422 | } |
| 414 | EXPORT_SYMBOL_GPL(tracepoint_probe_unregister); | 423 | EXPORT_SYMBOL_GPL(tracepoint_probe_register_noupdate); |
| 424 | |||
| 425 | /** | ||
| 426 | * tracepoint_probe_unregister_noupdate - remove a probe but not disconnect | ||
| 427 | * @name: tracepoint name | ||
| 428 | * @probe: probe function pointer | ||
| 429 | * | ||
| 430 | * caller must call tracepoint_probe_update_all() | ||
| 431 | */ | ||
| 432 | int tracepoint_probe_unregister_noupdate(const char *name, void *probe) | ||
| 433 | { | ||
| 434 | void *old; | ||
| 435 | |||
| 436 | mutex_lock(&tracepoints_mutex); | ||
| 437 | old = tracepoint_remove_probe(name, probe); | ||
| 438 | if (IS_ERR(old)) { | ||
| 439 | mutex_unlock(&tracepoints_mutex); | ||
| 440 | return PTR_ERR(old); | ||
| 441 | } | ||
| 442 | tracepoint_add_old_probes(old); | ||
| 443 | mutex_unlock(&tracepoints_mutex); | ||
| 444 | return 0; | ||
| 445 | } | ||
| 446 | EXPORT_SYMBOL_GPL(tracepoint_probe_unregister_noupdate); | ||
| 447 | |||
| 448 | /** | ||
| 449 | * tracepoint_probe_update_all - update tracepoints | ||
| 450 | */ | ||
| 451 | void tracepoint_probe_update_all(void) | ||
| 452 | { | ||
| 453 | LIST_HEAD(release_probes); | ||
| 454 | struct tp_probes *pos, *next; | ||
| 455 | |||
| 456 | mutex_lock(&tracepoints_mutex); | ||
| 457 | if (!need_update) { | ||
| 458 | mutex_unlock(&tracepoints_mutex); | ||
| 459 | return; | ||
| 460 | } | ||
| 461 | if (!list_empty(&old_probes)) | ||
| 462 | list_replace_init(&old_probes, &release_probes); | ||
| 463 | need_update = 0; | ||
| 464 | mutex_unlock(&tracepoints_mutex); | ||
| 465 | |||
| 466 | tracepoint_update_probes(); | ||
| 467 | list_for_each_entry_safe(pos, next, &release_probes, u.list) { | ||
| 468 | list_del(&pos->u.list); | ||
| 469 | call_rcu_sched(&pos->u.rcu, rcu_free_old_probes); | ||
| 470 | } | ||
| 471 | } | ||
| 472 | EXPORT_SYMBOL_GPL(tracepoint_probe_update_all); | ||
| 415 | 473 | ||
| 416 | /** | 474 | /** |
| 417 | * tracepoint_get_iter_range - Get a next tracepoint iterator given a range. | 475 | * tracepoint_get_iter_range - Get a next tracepoint iterator given a range. |
| @@ -483,3 +541,36 @@ void tracepoint_iter_reset(struct tracepoint_iter *iter) | |||
| 483 | iter->tracepoint = NULL; | 541 | iter->tracepoint = NULL; |
| 484 | } | 542 | } |
| 485 | EXPORT_SYMBOL_GPL(tracepoint_iter_reset); | 543 | EXPORT_SYMBOL_GPL(tracepoint_iter_reset); |
| 544 | |||
| 545 | #ifdef CONFIG_MODULES | ||
| 546 | |||
| 547 | int tracepoint_module_notify(struct notifier_block *self, | ||
| 548 | unsigned long val, void *data) | ||
| 549 | { | ||
| 550 | struct module *mod = data; | ||
| 551 | |||
| 552 | switch (val) { | ||
| 553 | case MODULE_STATE_COMING: | ||
| 554 | tracepoint_update_probe_range(mod->tracepoints, | ||
| 555 | mod->tracepoints + mod->num_tracepoints); | ||
| 556 | break; | ||
| 557 | case MODULE_STATE_GOING: | ||
| 558 | tracepoint_update_probe_range(mod->tracepoints, | ||
| 559 | mod->tracepoints + mod->num_tracepoints); | ||
| 560 | break; | ||
| 561 | } | ||
| 562 | return 0; | ||
| 563 | } | ||
| 564 | |||
| 565 | struct notifier_block tracepoint_module_nb = { | ||
| 566 | .notifier_call = tracepoint_module_notify, | ||
| 567 | .priority = 0, | ||
| 568 | }; | ||
| 569 | |||
| 570 | static int init_tracepoints(void) | ||
| 571 | { | ||
| 572 | return register_module_notifier(&tracepoint_module_nb); | ||
| 573 | } | ||
| 574 | __initcall(init_tracepoints); | ||
| 575 | |||
| 576 | #endif /* CONFIG_MODULES */ | ||
