diff options
author | Peter Zijlstra <a.p.zijlstra@chello.nl> | 2010-03-08 07:51:20 -0500 |
---|---|---|
committer | Ingo Molnar <mingo@elte.hu> | 2010-03-10 07:22:36 -0500 |
commit | d4944a06666054707d23e11888e480af239e5abf (patch) | |
tree | 58d8e847f198c29a2a2ddee60fe862f8973794d1 | |
parent | f3d46b2e6fa57547f9884330798792afc83f4b04 (diff) |
perf: Provide better condition for event rotation
Try to avoid useless rotation and PMU disables.
[ Could be improved by keeping a nr_runnable count to better account
for the < PERF_STAT_INACTIVE counters ]
Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Arnaldo Carvalho de Melo <acme@infradead.org>
Cc: paulus@samba.org
Cc: eranian@google.com
Cc: robert.richter@amd.com
Cc: fweisbec@gmail.com
LKML-Reference: <new-submission>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
-rw-r--r-- | kernel/perf_event.c | 21 |
1 files changed, 15 insertions, 6 deletions
diff --git a/kernel/perf_event.c b/kernel/perf_event.c index d8108465397d..52c69a34d697 100644 --- a/kernel/perf_event.c +++ b/kernel/perf_event.c | |||
@@ -1524,12 +1524,15 @@ static void perf_ctx_adjust_freq(struct perf_event_context *ctx) | |||
1524 | */ | 1524 | */ |
1525 | if (interrupts == MAX_INTERRUPTS) { | 1525 | if (interrupts == MAX_INTERRUPTS) { |
1526 | perf_log_throttle(event, 1); | 1526 | perf_log_throttle(event, 1); |
1527 | perf_disable(); | ||
1527 | event->pmu->unthrottle(event); | 1528 | event->pmu->unthrottle(event); |
1529 | perf_enable(); | ||
1528 | } | 1530 | } |
1529 | 1531 | ||
1530 | if (!event->attr.freq || !event->attr.sample_freq) | 1532 | if (!event->attr.freq || !event->attr.sample_freq) |
1531 | continue; | 1533 | continue; |
1532 | 1534 | ||
1535 | perf_disable(); | ||
1533 | event->pmu->read(event); | 1536 | event->pmu->read(event); |
1534 | now = atomic64_read(&event->count); | 1537 | now = atomic64_read(&event->count); |
1535 | delta = now - hwc->freq_count_stamp; | 1538 | delta = now - hwc->freq_count_stamp; |
@@ -1537,6 +1540,7 @@ static void perf_ctx_adjust_freq(struct perf_event_context *ctx) | |||
1537 | 1540 | ||
1538 | if (delta > 0) | 1541 | if (delta > 0) |
1539 | perf_adjust_period(event, TICK_NSEC, delta); | 1542 | perf_adjust_period(event, TICK_NSEC, delta); |
1543 | perf_enable(); | ||
1540 | } | 1544 | } |
1541 | raw_spin_unlock(&ctx->lock); | 1545 | raw_spin_unlock(&ctx->lock); |
1542 | } | 1546 | } |
@@ -1546,9 +1550,6 @@ static void perf_ctx_adjust_freq(struct perf_event_context *ctx) | |||
1546 | */ | 1550 | */ |
1547 | static void rotate_ctx(struct perf_event_context *ctx) | 1551 | static void rotate_ctx(struct perf_event_context *ctx) |
1548 | { | 1552 | { |
1549 | if (!ctx->nr_events) | ||
1550 | return; | ||
1551 | |||
1552 | raw_spin_lock(&ctx->lock); | 1553 | raw_spin_lock(&ctx->lock); |
1553 | 1554 | ||
1554 | /* Rotate the first entry last of non-pinned groups */ | 1555 | /* Rotate the first entry last of non-pinned groups */ |
@@ -1561,19 +1562,28 @@ void perf_event_task_tick(struct task_struct *curr) | |||
1561 | { | 1562 | { |
1562 | struct perf_cpu_context *cpuctx; | 1563 | struct perf_cpu_context *cpuctx; |
1563 | struct perf_event_context *ctx; | 1564 | struct perf_event_context *ctx; |
1565 | int rotate = 0; | ||
1564 | 1566 | ||
1565 | if (!atomic_read(&nr_events)) | 1567 | if (!atomic_read(&nr_events)) |
1566 | return; | 1568 | return; |
1567 | 1569 | ||
1568 | cpuctx = &__get_cpu_var(perf_cpu_context); | 1570 | cpuctx = &__get_cpu_var(perf_cpu_context); |
1569 | ctx = curr->perf_event_ctxp; | 1571 | if (cpuctx->ctx.nr_events && |
1572 | cpuctx->ctx.nr_events != cpuctx->ctx.nr_active) | ||
1573 | rotate = 1; | ||
1570 | 1574 | ||
1571 | perf_disable(); | 1575 | ctx = curr->perf_event_ctxp; |
1576 | if (ctx && ctx->nr_events && ctx->nr_events != ctx->nr_active) | ||
1577 | rotate = 1; | ||
1572 | 1578 | ||
1573 | perf_ctx_adjust_freq(&cpuctx->ctx); | 1579 | perf_ctx_adjust_freq(&cpuctx->ctx); |
1574 | if (ctx) | 1580 | if (ctx) |
1575 | perf_ctx_adjust_freq(ctx); | 1581 | perf_ctx_adjust_freq(ctx); |
1576 | 1582 | ||
1583 | if (!rotate) | ||
1584 | return; | ||
1585 | |||
1586 | perf_disable(); | ||
1577 | cpu_ctx_sched_out(cpuctx, EVENT_FLEXIBLE); | 1587 | cpu_ctx_sched_out(cpuctx, EVENT_FLEXIBLE); |
1578 | if (ctx) | 1588 | if (ctx) |
1579 | task_ctx_sched_out(ctx, EVENT_FLEXIBLE); | 1589 | task_ctx_sched_out(ctx, EVENT_FLEXIBLE); |
@@ -1585,7 +1595,6 @@ void perf_event_task_tick(struct task_struct *curr) | |||
1585 | cpu_ctx_sched_in(cpuctx, EVENT_FLEXIBLE); | 1595 | cpu_ctx_sched_in(cpuctx, EVENT_FLEXIBLE); |
1586 | if (ctx) | 1596 | if (ctx) |
1587 | task_ctx_sched_in(curr, EVENT_FLEXIBLE); | 1597 | task_ctx_sched_in(curr, EVENT_FLEXIBLE); |
1588 | |||
1589 | perf_enable(); | 1598 | perf_enable(); |
1590 | } | 1599 | } |
1591 | 1600 | ||