aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorPeter Zijlstra <a.p.zijlstra@chello.nl>2009-09-04 09:36:08 -0400
committerIngo Molnar <mingo@elte.hu>2009-09-04 10:33:08 -0400
commit9e9772c458d50dabdb5327821da3803254638cd1 (patch)
tree98e714214b30aae145f023209e843c4ae0548c52
parent506d4bc8d5dab20d84624aa07cdc6dcd77915d52 (diff)
perf stat: Remove the limit on repeat
Since we don't need all the individual samples to calculate the error remove both the limit and the storage overhead associated with that. Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> LKML-Reference: <new-submission> Signed-off-by: Ingo Molnar <mingo@elte.hu>
-rw-r--r--tools/perf/builtin-stat.c84
1 files changed, 27 insertions, 57 deletions
diff --git a/tools/perf/builtin-stat.c b/tools/perf/builtin-stat.c
index 31ffc4d3ba60..9c6377f7152f 100644
--- a/tools/perf/builtin-stat.c
+++ b/tools/perf/builtin-stat.c
@@ -62,8 +62,6 @@ static struct perf_counter_attr default_attrs[] = {
62 62
63}; 63};
64 64
65#define MAX_RUN 100
66
67static int system_wide = 0; 65static int system_wide = 0;
68static unsigned int nr_cpus = 0; 66static unsigned int nr_cpus = 0;
69static int run_idx = 0; 67static int run_idx = 0;
@@ -76,12 +74,8 @@ static int null_run = 0;
76 74
77static int fd[MAX_NR_CPUS][MAX_COUNTERS]; 75static int fd[MAX_NR_CPUS][MAX_COUNTERS];
78 76
79static u64 runtime_nsecs[MAX_RUN]; 77static u64 event_res[MAX_COUNTERS][3];
80static u64 walltime_nsecs[MAX_RUN]; 78static u64 event_scaled[MAX_COUNTERS];
81static u64 runtime_cycles[MAX_RUN];
82
83static u64 event_res[MAX_RUN][MAX_COUNTERS][3];
84static u64 event_scaled[MAX_RUN][MAX_COUNTERS];
85 79
86struct stats 80struct stats
87{ 81{
@@ -89,6 +83,14 @@ struct stats
89 double sum_sq; 83 double sum_sq;
90}; 84};
91 85
86static void update_stats(struct stats *stats, u64 val)
87{
88 double sq = val;
89
90 stats->sum += val;
91 stats->sum_sq += sq * sq;
92}
93
92static double avg_stats(struct stats *stats) 94static double avg_stats(struct stats *stats)
93{ 95{
94 return stats->sum / run_count; 96 return stats->sum / run_count;
@@ -167,8 +169,9 @@ static void read_counter(int counter)
167 unsigned int cpu; 169 unsigned int cpu;
168 size_t res, nv; 170 size_t res, nv;
169 int scaled; 171 int scaled;
172 int i;
170 173
171 count = event_res[run_idx][counter]; 174 count = event_res[counter];
172 175
173 count[0] = count[1] = count[2] = 0; 176 count[0] = count[1] = count[2] = 0;
174 177
@@ -193,24 +196,33 @@ static void read_counter(int counter)
193 scaled = 0; 196 scaled = 0;
194 if (scale) { 197 if (scale) {
195 if (count[2] == 0) { 198 if (count[2] == 0) {
196 event_scaled[run_idx][counter] = -1; 199 event_scaled[counter] = -1;
197 count[0] = 0; 200 count[0] = 0;
198 return; 201 return;
199 } 202 }
200 203
201 if (count[2] < count[1]) { 204 if (count[2] < count[1]) {
202 event_scaled[run_idx][counter] = 1; 205 event_scaled[counter] = 1;
203 count[0] = (unsigned long long) 206 count[0] = (unsigned long long)
204 ((double)count[0] * count[1] / count[2] + 0.5); 207 ((double)count[0] * count[1] / count[2] + 0.5);
205 } 208 }
206 } 209 }
210
211 for (i = 0; i < 3; i++)
212 update_stats(&event_res_stats[counter][i], count[i]);
213
214 if (verbose) {
215 fprintf(stderr, "%s: %Ld %Ld %Ld\n", event_name(counter),
216 count[0], count[1], count[2]);
217 }
218
207 /* 219 /*
208 * Save the full runtime - to allow normalization during printout: 220 * Save the full runtime - to allow normalization during printout:
209 */ 221 */
210 if (MATCH_EVENT(SOFTWARE, SW_TASK_CLOCK, counter)) 222 if (MATCH_EVENT(SOFTWARE, SW_TASK_CLOCK, counter))
211 runtime_nsecs[run_idx] = count[0]; 223 update_stats(&runtime_nsecs_stats, count[0]);
212 if (MATCH_EVENT(HARDWARE, HW_CPU_CYCLES, counter)) 224 if (MATCH_EVENT(HARDWARE, HW_CPU_CYCLES, counter))
213 runtime_cycles[run_idx] = count[0]; 225 update_stats(&runtime_cycles_stats, count[0]);
214} 226}
215 227
216static int run_perf_stat(int argc __used, const char **argv) 228static int run_perf_stat(int argc __used, const char **argv)
@@ -284,7 +296,7 @@ static int run_perf_stat(int argc __used, const char **argv)
284 296
285 t1 = rdclock(); 297 t1 = rdclock();
286 298
287 walltime_nsecs[run_idx] = t1 - t0; 299 update_stats(&walltime_nsecs_stats, t1 - t0);
288 300
289 for (counter = 0; counter < nr_counters; counter++) 301 for (counter = 0; counter < nr_counters; counter++)
290 read_counter(counter); 302 read_counter(counter);
@@ -361,52 +373,10 @@ static void print_counter(int counter)
361 fprintf(stderr, "\n"); 373 fprintf(stderr, "\n");
362} 374}
363 375
364static void update_stats(const char *name, int idx, struct stats *stats, u64 *val)
365{
366 double sq = *val;
367
368 stats->sum += *val;
369 stats->sum_sq += sq * sq;
370
371 if (verbose > 1)
372 fprintf(stderr, "debug: %20s[%d]: %Ld\n", name, idx, *val);
373}
374
375/*
376 * Calculate the averages and noises:
377 */
378static void calc_avg(void)
379{
380 int i, j;
381
382 if (verbose > 1)
383 fprintf(stderr, "\n");
384
385 for (i = 0; i < run_count; i++) {
386 update_stats("runtime", 0, &runtime_nsecs_stats, runtime_nsecs + i);
387 update_stats("walltime", 0, &walltime_nsecs_stats, walltime_nsecs + i);
388 update_stats("runtime_cycles", 0, &runtime_cycles_stats, runtime_cycles + i);
389
390 for (j = 0; j < nr_counters; j++) {
391 update_stats("counter/0", j,
392 event_res_stats[j]+0, event_res[i][j]+0);
393 update_stats("counter/1", j,
394 event_res_stats[j]+1, event_res[i][j]+1);
395 update_stats("counter/2", j,
396 event_res_stats[j]+2, event_res[i][j]+2);
397 if (event_scaled[i][j] != (u64)-1)
398 update_stats("scaled", j,
399 event_scaled_stats + j, event_scaled[i]+j);
400 }
401 }
402}
403
404static void print_stat(int argc, const char **argv) 376static void print_stat(int argc, const char **argv)
405{ 377{
406 int i, counter; 378 int i, counter;
407 379
408 calc_avg();
409
410 fflush(stdout); 380 fflush(stdout);
411 381
412 fprintf(stderr, "\n"); 382 fprintf(stderr, "\n");
@@ -484,7 +454,7 @@ int cmd_stat(int argc, const char **argv, const char *prefix __used)
484 PARSE_OPT_STOP_AT_NON_OPTION); 454 PARSE_OPT_STOP_AT_NON_OPTION);
485 if (!argc) 455 if (!argc)
486 usage_with_options(stat_usage, options); 456 usage_with_options(stat_usage, options);
487 if (run_count <= 0 || run_count > MAX_RUN) 457 if (run_count <= 0)
488 usage_with_options(stat_usage, options); 458 usage_with_options(stat_usage, options);
489 459
490 /* Set attrs and nr_counters if no event is selected and !null_run */ 460 /* Set attrs and nr_counters if no event is selected and !null_run */