blob: a89fc0835367c5dd655c827365bcda3b8b94e39f [file] [log] [blame]
/*
 * builtin-stat.c
 *
 * Builtin stat command: Give a precise performance counters summary
 * overview about any workload, CPU or specific PID.
 *
 * Sample output:

   $ perf stat ./hackbench 10

  Time: 0.118

  Performance counter stats for './hackbench 10':

       1708.761321 task-clock                #   11.037 CPUs utilized
            41,190 context-switches          #    0.024 M/sec
             6,735 CPU-migrations            #    0.004 M/sec
            17,318 page-faults               #    0.010 M/sec
     5,205,202,243 cycles                    #    3.046 GHz
     3,856,436,920 stalled-cycles-frontend   #   74.09% frontend cycles idle
     1,600,790,871 stalled-cycles-backend    #   30.75% backend cycles idle
     2,603,501,247 instructions              #    0.50  insns per cycle
                                             #    1.48  stalled cycles per insn
       484,357,498 branches                  #  283.455 M/sec
         6,388,934 branch-misses             #    1.32% of all branches

        0.154822978  seconds time elapsed

 *
 * Copyright (C) 2008-2011, Red Hat Inc, Ingo Molnar <mingo@redhat.com>
 *
 * Improvements and fixes by:
 *
 *   Arjan van de Ven <arjan@linux.intel.com>
 *   Yanmin Zhang <yanmin.zhang@intel.com>
 *   Wu Fengguang <fengguang.wu@intel.com>
 *   Mike Galbraith <efault@gmx.de>
 *   Paul Mackerras <paulus@samba.org>
 *   Jaswinder Singh Rajput <jaswinder@kernel.org>
 *
 * Released under the GPL v2. (and only v2, not any later version)
 */
43
Peter Zijlstra1a482f32009-05-23 18:28:58 +020044#include "perf.h"
Ingo Molnar16f762a2009-05-27 09:10:38 +020045#include "builtin.h"
Ingo Molnar148be2c2009-04-27 08:02:14 +020046#include "util/util.h"
Ingo Molnar52425192009-05-26 09:17:18 +020047#include "util/parse-options.h"
48#include "util/parse-events.h"
Frederic Weisbecker8f288272009-08-16 22:05:48 +020049#include "util/event.h"
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -020050#include "util/evlist.h"
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -020051#include "util/evsel.h"
Frederic Weisbecker8f288272009-08-16 22:05:48 +020052#include "util/debug.h"
Ingo Molnara5d243d2011-04-27 05:39:24 +020053#include "util/color.h"
Liming Wang60666c62009-12-31 16:05:50 +080054#include "util/header.h"
Paul Mackerrasa12b51c2010-03-10 20:36:09 +110055#include "util/cpumap.h"
Zhang, Yanmind6d901c2010-03-18 11:36:05 -030056#include "util/thread.h"
Arnaldo Carvalho de Melofd782602011-01-18 15:15:24 -020057#include "util/thread_map.h"
Ingo Molnarddcacfa2009-04-20 15:37:32 +020058
Ingo Molnarddcacfa2009-04-20 15:37:32 +020059#include <sys/prctl.h>
Ingo Molnar42202dd2009-06-13 14:57:28 +020060#include <math.h>
Stephane Eranian5af52b52010-05-18 15:00:01 +020061#include <locale.h>
Peter Zijlstra16c8a102009-05-05 17:50:27 +020062
Stephane Eraniand7470b62010-12-01 18:49:05 +020063#define DEFAULT_SEPARATOR " "
64
Ingo Molnarcdd6c482009-09-21 12:02:48 +020065static struct perf_event_attr default_attrs[] = {
Ingo Molnara21ca2c2009-06-06 09:58:57 +020066
Ingo Molnar56aab462009-10-19 13:27:08 +020067 { .type = PERF_TYPE_SOFTWARE, .config = PERF_COUNT_SW_TASK_CLOCK },
68 { .type = PERF_TYPE_SOFTWARE, .config = PERF_COUNT_SW_CONTEXT_SWITCHES },
69 { .type = PERF_TYPE_SOFTWARE, .config = PERF_COUNT_SW_CPU_MIGRATIONS },
70 { .type = PERF_TYPE_SOFTWARE, .config = PERF_COUNT_SW_PAGE_FAULTS },
Ingo Molnara21ca2c2009-06-06 09:58:57 +020071
Ingo Molnar56aab462009-10-19 13:27:08 +020072 { .type = PERF_TYPE_HARDWARE, .config = PERF_COUNT_HW_CPU_CYCLES },
Ingo Molnar129c04c2011-04-29 14:41:28 +020073 { .type = PERF_TYPE_HARDWARE, .config = PERF_COUNT_HW_STALLED_CYCLES_FRONTEND },
74 { .type = PERF_TYPE_HARDWARE, .config = PERF_COUNT_HW_STALLED_CYCLES_BACKEND },
Ingo Molnar56aab462009-10-19 13:27:08 +020075 { .type = PERF_TYPE_HARDWARE, .config = PERF_COUNT_HW_INSTRUCTIONS },
Ingo Molnar56aab462009-10-19 13:27:08 +020076 { .type = PERF_TYPE_HARDWARE, .config = PERF_COUNT_HW_BRANCH_INSTRUCTIONS },
77 { .type = PERF_TYPE_HARDWARE, .config = PERF_COUNT_HW_BRANCH_MISSES },
Peter Zijlstraf4dbfa82009-06-11 14:06:28 +020078
Ingo Molnara21ca2c2009-06-06 09:58:57 +020079};
80
Ingo Molnarc6264de2011-04-27 13:50:47 +020081/*
Ingo Molnar2cba3ff2011-05-19 13:30:56 +020082 * Detailed stats (-d), covering the L1 and last level data caches:
Ingo Molnarc6264de2011-04-27 13:50:47 +020083 */
84static struct perf_event_attr detailed_attrs[] = {
85
Ingo Molnarc6264de2011-04-27 13:50:47 +020086 { .type = PERF_TYPE_HW_CACHE,
87 .config =
88 PERF_COUNT_HW_CACHE_L1D << 0 |
89 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
90 (PERF_COUNT_HW_CACHE_RESULT_ACCESS << 16) },
91
92 { .type = PERF_TYPE_HW_CACHE,
93 .config =
94 PERF_COUNT_HW_CACHE_L1D << 0 |
95 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
96 (PERF_COUNT_HW_CACHE_RESULT_MISS << 16) },
97
98 { .type = PERF_TYPE_HW_CACHE,
99 .config =
100 PERF_COUNT_HW_CACHE_LL << 0 |
101 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
102 (PERF_COUNT_HW_CACHE_RESULT_ACCESS << 16) },
103
104 { .type = PERF_TYPE_HW_CACHE,
105 .config =
106 PERF_COUNT_HW_CACHE_LL << 0 |
107 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
108 (PERF_COUNT_HW_CACHE_RESULT_MISS << 16) },
109};
110
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200111/*
112 * Very detailed stats (-d -d), covering the instruction cache and the TLB caches:
113 */
114static struct perf_event_attr very_detailed_attrs[] = {
115
116 { .type = PERF_TYPE_HW_CACHE,
117 .config =
118 PERF_COUNT_HW_CACHE_L1I << 0 |
119 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
120 (PERF_COUNT_HW_CACHE_RESULT_ACCESS << 16) },
121
122 { .type = PERF_TYPE_HW_CACHE,
123 .config =
124 PERF_COUNT_HW_CACHE_L1I << 0 |
125 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
126 (PERF_COUNT_HW_CACHE_RESULT_MISS << 16) },
127
128 { .type = PERF_TYPE_HW_CACHE,
129 .config =
130 PERF_COUNT_HW_CACHE_DTLB << 0 |
131 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
132 (PERF_COUNT_HW_CACHE_RESULT_ACCESS << 16) },
133
134 { .type = PERF_TYPE_HW_CACHE,
135 .config =
136 PERF_COUNT_HW_CACHE_DTLB << 0 |
137 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
138 (PERF_COUNT_HW_CACHE_RESULT_MISS << 16) },
139
140 { .type = PERF_TYPE_HW_CACHE,
141 .config =
142 PERF_COUNT_HW_CACHE_ITLB << 0 |
143 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
144 (PERF_COUNT_HW_CACHE_RESULT_ACCESS << 16) },
145
146 { .type = PERF_TYPE_HW_CACHE,
147 .config =
148 PERF_COUNT_HW_CACHE_ITLB << 0 |
149 (PERF_COUNT_HW_CACHE_OP_READ << 8) |
150 (PERF_COUNT_HW_CACHE_RESULT_MISS << 16) },
151
152};
153
154/*
155 * Very, very detailed stats (-d -d -d), adding prefetch events:
156 */
157static struct perf_event_attr very_very_detailed_attrs[] = {
158
159 { .type = PERF_TYPE_HW_CACHE,
160 .config =
161 PERF_COUNT_HW_CACHE_L1D << 0 |
162 (PERF_COUNT_HW_CACHE_OP_PREFETCH << 8) |
163 (PERF_COUNT_HW_CACHE_RESULT_ACCESS << 16) },
164
165 { .type = PERF_TYPE_HW_CACHE,
166 .config =
167 PERF_COUNT_HW_CACHE_L1D << 0 |
168 (PERF_COUNT_HW_CACHE_OP_PREFETCH << 8) |
169 (PERF_COUNT_HW_CACHE_RESULT_MISS << 16) },
170};
171
172
173
/*
 * Event list used by the counter code in this file: its ->entries are the
 * events to open/read, ->cpus and ->threads the maps they are opened on.
 */
struct perf_evlist		*evsel_list;

/*
 * Run-time options.  Objects with static storage start out zeroed, so
 * only the non-zero defaults are spelled out.
 */
static bool			system_wide;		/* open counters per CPU instead of per thread */
static int			run_idx;

static int			run_count	= 1;	/* noise is only printed when this is not 1 */
static bool			no_inherit;		/* inverted into attr->inherit */
static bool			scale		= true;	/* request enabled/running times and scale reads */
static bool			no_aggr;		/* read and print per CPU, no aggregation */
static pid_t			target_pid	= -1;	/* -1: no pid targeted */
static pid_t			target_tid	= -1;	/* -1: no tid targeted */
static pid_t			child_pid	= -1;	/* forked workload, -1 when there is none */
static bool			null_run;
static int			detailed_run;
static bool			sync_run;
static bool			big_num		= true;	/* use the %' (grouping) number format */
static int			big_num_opt	= -1;
static const char		*cpu_list;
static const char		*csv_sep;		/* field separator used by the printers */
static bool			csv_output;		/* compact CSV-style output, no annotations */

/*
 * Polled by run_perf_stat() when no workload was forked.
 * NOTE(review): presumably set from a signal handler outside this view.
 */
static volatile int		done;
196
/*
 * Running statistics over a stream of samples, maintained incrementally
 * by update_stats().
 */
struct stats {
	double n;	/* number of samples seen so far */
	double mean;	/* running mean of the samples */
	double M2;	/* running sum of squared distances from the mean */
};
Ingo Molnar42202dd2009-06-13 14:57:28 +0200201
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200202struct perf_stat {
203 struct stats res_stats[3];
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200204};
205
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200206static int perf_evsel__alloc_stat_priv(struct perf_evsel *evsel)
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200207{
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200208 evsel->priv = zalloc(sizeof(struct perf_stat));
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200209 return evsel->priv == NULL ? -ENOMEM : 0;
210}
211
212static void perf_evsel__free_stat_priv(struct perf_evsel *evsel)
213{
214 free(evsel->priv);
215 evsel->priv = NULL;
216}
217
Peter Zijlstra9e9772c2009-09-04 15:36:08 +0200218static void update_stats(struct stats *stats, u64 val)
219{
Peter Zijlstra8a026312009-09-04 17:26:26 +0200220 double delta;
Peter Zijlstra9e9772c2009-09-04 15:36:08 +0200221
Peter Zijlstra8a026312009-09-04 17:26:26 +0200222 stats->n++;
223 delta = val - stats->mean;
224 stats->mean += delta / stats->n;
225 stats->M2 += delta*(val - stats->mean);
Peter Zijlstra9e9772c2009-09-04 15:36:08 +0200226}
227
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200228static double avg_stats(struct stats *stats)
229{
Peter Zijlstra8a026312009-09-04 17:26:26 +0200230 return stats->mean;
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200231}
Ingo Molnar42202dd2009-06-13 14:57:28 +0200232
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200233/*
Peter Zijlstra63d40de2009-09-04 17:03:13 +0200234 * http://en.wikipedia.org/wiki/Algorithms_for_calculating_variance
235 *
Peter Zijlstra8a026312009-09-04 17:26:26 +0200236 * (\Sum n_i^2) - ((\Sum n_i)^2)/n
237 * s^2 = -------------------------------
238 * n - 1
Peter Zijlstra63d40de2009-09-04 17:03:13 +0200239 *
240 * http://en.wikipedia.org/wiki/Stddev
241 *
242 * The std dev of the mean is related to the std dev by:
243 *
244 * s
245 * s_mean = -------
246 * sqrt(n)
247 *
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200248 */
249static double stddev_stats(struct stats *stats)
250{
Peter Zijlstra8a026312009-09-04 17:26:26 +0200251 double variance = stats->M2 / (stats->n - 1);
252 double variance_mean = variance / stats->n;
Ingo Molnar42202dd2009-06-13 14:57:28 +0200253
Peter Zijlstra63d40de2009-09-04 17:03:13 +0200254 return sqrt(variance_mean);
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200255}
Ingo Molnar42202dd2009-06-13 14:57:28 +0200256
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200257struct stats runtime_nsecs_stats[MAX_NR_CPUS];
258struct stats runtime_cycles_stats[MAX_NR_CPUS];
Ingo Molnard3d1e862011-04-29 13:49:08 +0200259struct stats runtime_stalled_cycles_front_stats[MAX_NR_CPUS];
260struct stats runtime_stalled_cycles_back_stats[MAX_NR_CPUS];
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200261struct stats runtime_branches_stats[MAX_NR_CPUS];
Ingo Molnard58f4c82011-04-27 03:42:18 +0200262struct stats runtime_cacherefs_stats[MAX_NR_CPUS];
Ingo Molnar8bb6c792011-04-27 13:25:24 +0200263struct stats runtime_l1_dcache_stats[MAX_NR_CPUS];
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200264struct stats walltime_nsecs_stats;
Ingo Molnarbe1ac0d2009-05-29 09:10:54 +0200265
Arnaldo Carvalho de Melo48290602011-01-03 17:48:12 -0200266static int create_perf_stat_counter(struct perf_evsel *evsel)
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200267{
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200268 struct perf_event_attr *attr = &evsel->attr;
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200269
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200270 if (scale)
Ingo Molnara21ca2c2009-06-06 09:58:57 +0200271 attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED |
272 PERF_FORMAT_TOTAL_TIME_RUNNING;
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200273
Arnaldo Carvalho de Melo48290602011-01-03 17:48:12 -0200274 attr->inherit = !no_inherit;
Arnaldo Carvalho de Melo5d2cd902011-04-14 11:20:14 -0300275
276 if (system_wide)
277 return perf_evsel__open_per_cpu(evsel, evsel_list->cpus, false);
278
Arnaldo Carvalho de Melo48290602011-01-03 17:48:12 -0200279 if (target_pid == -1 && target_tid == -1) {
280 attr->disabled = 1;
281 attr->enable_on_exec = 1;
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200282 }
Arnaldo Carvalho de Melo084ab9f2010-03-22 13:10:28 -0300283
Arnaldo Carvalho de Melo5d2cd902011-04-14 11:20:14 -0300284 return perf_evsel__open_per_thread(evsel, evsel_list->threads, false);
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200285}
286
Ingo Molnarc04f5e52009-05-29 09:10:54 +0200287/*
288 * Does the counter have nsecs as a unit?
289 */
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200290static inline int nsec_counter(struct perf_evsel *evsel)
Ingo Molnarc04f5e52009-05-29 09:10:54 +0200291{
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200292 if (perf_evsel__match(evsel, SOFTWARE, SW_CPU_CLOCK) ||
293 perf_evsel__match(evsel, SOFTWARE, SW_TASK_CLOCK))
Ingo Molnarc04f5e52009-05-29 09:10:54 +0200294 return 1;
295
296 return 0;
297}
298
299/*
Ingo Molnardcd99362011-04-27 04:36:37 +0200300 * Update various tracking values we maintain to print
301 * more semantic information such as miss/hit ratios,
302 * instruction rates, etc:
303 */
304static void update_shadow_stats(struct perf_evsel *counter, u64 *count)
305{
306 if (perf_evsel__match(counter, SOFTWARE, SW_TASK_CLOCK))
307 update_stats(&runtime_nsecs_stats[0], count[0]);
308 else if (perf_evsel__match(counter, HARDWARE, HW_CPU_CYCLES))
309 update_stats(&runtime_cycles_stats[0], count[0]);
Ingo Molnard3d1e862011-04-29 13:49:08 +0200310 else if (perf_evsel__match(counter, HARDWARE, HW_STALLED_CYCLES_FRONTEND))
311 update_stats(&runtime_stalled_cycles_front_stats[0], count[0]);
Ingo Molnar129c04c2011-04-29 14:41:28 +0200312 else if (perf_evsel__match(counter, HARDWARE, HW_STALLED_CYCLES_BACKEND))
Ingo Molnard3d1e862011-04-29 13:49:08 +0200313 update_stats(&runtime_stalled_cycles_back_stats[0], count[0]);
Ingo Molnardcd99362011-04-27 04:36:37 +0200314 else if (perf_evsel__match(counter, HARDWARE, HW_BRANCH_INSTRUCTIONS))
315 update_stats(&runtime_branches_stats[0], count[0]);
316 else if (perf_evsel__match(counter, HARDWARE, HW_CACHE_REFERENCES))
317 update_stats(&runtime_cacherefs_stats[0], count[0]);
Ingo Molnar8bb6c792011-04-27 13:25:24 +0200318 else if (perf_evsel__match(counter, HW_CACHE, HW_CACHE_L1D))
319 update_stats(&runtime_l1_dcache_stats[0], count[0]);
Ingo Molnardcd99362011-04-27 04:36:37 +0200320}
321
322/*
Ingo Molnar2996f5d2009-05-29 09:10:54 +0200323 * Read out the results of a single counter:
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200324 * aggregate counts across CPUs in system-wide mode
Ingo Molnarc04f5e52009-05-29 09:10:54 +0200325 */
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200326static int read_counter_aggr(struct perf_evsel *counter)
Ingo Molnarc04f5e52009-05-29 09:10:54 +0200327{
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200328 struct perf_stat *ps = counter->priv;
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200329 u64 *count = counter->counts->aggr.values;
330 int i;
Ingo Molnarc04f5e52009-05-29 09:10:54 +0200331
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200332 if (__perf_evsel__read(counter, evsel_list->cpus->nr,
333 evsel_list->threads->nr, scale) < 0)
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200334 return -1;
Peter Zijlstra9e9772c2009-09-04 15:36:08 +0200335
336 for (i = 0; i < 3; i++)
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200337 update_stats(&ps->res_stats[i], count[i]);
Peter Zijlstra9e9772c2009-09-04 15:36:08 +0200338
339 if (verbose) {
Arnaldo Carvalho de Melo9486aa32011-01-22 20:37:02 -0200340 fprintf(stderr, "%s: %" PRIu64 " %" PRIu64 " %" PRIu64 "\n",
341 event_name(counter), count[0], count[1], count[2]);
Peter Zijlstra9e9772c2009-09-04 15:36:08 +0200342 }
343
Ingo Molnarbe1ac0d2009-05-29 09:10:54 +0200344 /*
345 * Save the full runtime - to allow normalization during printout:
346 */
Ingo Molnardcd99362011-04-27 04:36:37 +0200347 update_shadow_stats(counter, count);
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200348
349 return 0;
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200350}
351
352/*
353 * Read out the results of a single counter:
354 * do not aggregate counts across CPUs in system-wide mode
355 */
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200356static int read_counter(struct perf_evsel *counter)
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200357{
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200358 u64 *count;
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200359 int cpu;
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200360
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200361 for (cpu = 0; cpu < evsel_list->cpus->nr; cpu++) {
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200362 if (__perf_evsel__read_on_cpu(counter, cpu, 0, scale) < 0)
363 return -1;
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200364
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200365 count = counter->counts->cpu[cpu].values;
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200366
Ingo Molnardcd99362011-04-27 04:36:37 +0200367 update_shadow_stats(counter, count);
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200368 }
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200369
370 return 0;
Ingo Molnar2996f5d2009-05-29 09:10:54 +0200371}
372
Ingo Molnarf37a2912009-07-01 12:37:06 +0200373static int run_perf_stat(int argc __used, const char **argv)
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200374{
375 unsigned long long t0, t1;
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200376 struct perf_evsel *counter;
Ingo Molnar42202dd2009-06-13 14:57:28 +0200377 int status = 0;
Paul Mackerras051ae7f2009-06-29 21:13:21 +1000378 int child_ready_pipe[2], go_pipe[2];
Zhang, Yanmin6be28502010-03-18 11:36:03 -0300379 const bool forks = (argc > 0);
Paul Mackerras051ae7f2009-06-29 21:13:21 +1000380 char buf;
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200381
Liming Wang60666c62009-12-31 16:05:50 +0800382 if (forks && (pipe(child_ready_pipe) < 0 || pipe(go_pipe) < 0)) {
Paul Mackerras051ae7f2009-06-29 21:13:21 +1000383 perror("failed to create pipes");
384 exit(1);
385 }
386
Liming Wang60666c62009-12-31 16:05:50 +0800387 if (forks) {
Zhang, Yanmin6be28502010-03-18 11:36:03 -0300388 if ((child_pid = fork()) < 0)
Liming Wang60666c62009-12-31 16:05:50 +0800389 perror("failed to fork");
Paul Mackerras051ae7f2009-06-29 21:13:21 +1000390
Zhang, Yanmin6be28502010-03-18 11:36:03 -0300391 if (!child_pid) {
Liming Wang60666c62009-12-31 16:05:50 +0800392 close(child_ready_pipe[0]);
393 close(go_pipe[1]);
394 fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC);
395
396 /*
397 * Do a dummy execvp to get the PLT entry resolved,
398 * so we avoid the resolver overhead on the real
399 * execvp call.
400 */
401 execvp("", (char **)argv);
402
403 /*
404 * Tell the parent we're ready to go
405 */
406 close(child_ready_pipe[1]);
407
408 /*
409 * Wait until the parent tells us to go.
410 */
411 if (read(go_pipe[0], &buf, 1) == -1)
412 perror("unable to read pipe");
413
414 execvp(argv[0], (char **)argv);
415
416 perror(argv[0]);
417 exit(-1);
418 }
419
Zhang, Yanmind6d901c2010-03-18 11:36:05 -0300420 if (target_tid == -1 && target_pid == -1 && !system_wide)
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200421 evsel_list->threads->map[0] = child_pid;
Zhang, Yanmind6d901c2010-03-18 11:36:05 -0300422
Paul Mackerras051ae7f2009-06-29 21:13:21 +1000423 /*
Liming Wang60666c62009-12-31 16:05:50 +0800424 * Wait for the child to be ready to exec.
Paul Mackerras051ae7f2009-06-29 21:13:21 +1000425 */
426 close(child_ready_pipe[1]);
Liming Wang60666c62009-12-31 16:05:50 +0800427 close(go_pipe[0]);
428 if (read(child_ready_pipe[0], &buf, 1) == -1)
Frederic Weisbeckera92bef02009-07-01 21:02:10 +0200429 perror("unable to read pipe");
Liming Wang60666c62009-12-31 16:05:50 +0800430 close(child_ready_pipe[0]);
Paul Mackerras051ae7f2009-06-29 21:13:21 +1000431 }
432
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -0200433 list_for_each_entry(counter, &evsel_list->entries, node) {
Arnaldo Carvalho de Melo48290602011-01-03 17:48:12 -0200434 if (create_perf_stat_counter(counter) < 0) {
David Ahernc63ca0c2011-04-29 16:04:15 -0600435 if (errno == EINVAL || errno == ENOSYS || errno == ENOENT) {
436 if (verbose)
437 ui__warning("%s event is not supported by the kernel.\n",
438 event_name(counter));
Ingo Molnarede70292011-04-28 08:48:42 +0200439 continue;
David Ahernc63ca0c2011-04-29 16:04:15 -0600440 }
Ingo Molnarede70292011-04-28 08:48:42 +0200441
442 if (errno == EPERM || errno == EACCES) {
Arnaldo Carvalho de Melo48290602011-01-03 17:48:12 -0200443 error("You may not have permission to collect %sstats.\n"
444 "\t Consider tweaking"
445 " /proc/sys/kernel/perf_event_paranoid or running as root.",
446 system_wide ? "system-wide " : "");
447 } else {
448 error("open_counter returned with %d (%s). "
449 "/bin/dmesg may provide additional information.\n",
450 errno, strerror(errno));
451 }
452 if (child_pid != -1)
453 kill(child_pid, SIGTERM);
454 die("Not all events could be opened.\n");
455 return -1;
456 }
Arnaldo Carvalho de Melo084ab9f2010-03-22 13:10:28 -0300457 }
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200458
Frederic Weisbeckercfd748a2011-03-14 16:40:30 +0100459 if (perf_evlist__set_filters(evsel_list)) {
460 error("failed to set filter with %d (%s)\n", errno,
461 strerror(errno));
462 return -1;
463 }
464
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200465 /*
466 * Enable counters and exec the command:
467 */
468 t0 = rdclock();
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200469
Liming Wang60666c62009-12-31 16:05:50 +0800470 if (forks) {
471 close(go_pipe[1]);
472 wait(&status);
473 } else {
Zhang, Yanmin6be28502010-03-18 11:36:03 -0300474 while(!done) sleep(1);
Liming Wang60666c62009-12-31 16:05:50 +0800475 }
Ingo Molnar44db76c2009-06-03 19:36:07 +0200476
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200477 t1 = rdclock();
478
Peter Zijlstra9e9772c2009-09-04 15:36:08 +0200479 update_stats(&walltime_nsecs_stats, t1 - t0);
Ingo Molnar42202dd2009-06-13 14:57:28 +0200480
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200481 if (no_aggr) {
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -0200482 list_for_each_entry(counter, &evsel_list->entries, node) {
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200483 read_counter(counter);
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200484 perf_evsel__close_fd(counter, evsel_list->cpus->nr, 1);
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200485 }
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200486 } else {
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -0200487 list_for_each_entry(counter, &evsel_list->entries, node) {
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200488 read_counter_aggr(counter);
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200489 perf_evsel__close_fd(counter, evsel_list->cpus->nr,
490 evsel_list->threads->nr);
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200491 }
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200492 }
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200493
Ingo Molnar42202dd2009-06-13 14:57:28 +0200494 return WEXITSTATUS(status);
495}
496
/*
 * Print @total as a percentage of @avg in the "( +-xx.xx% )" form.
 * A zero @avg prints 0.00% instead of dividing by zero.
 */
static void print_noise_pct(double total, double avg)
{
	const double pct = avg ? 100.0*total/avg : 0.0;

	fprintf(stderr, " ( +-%6.2f%% )", pct);
}
506
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200507static void print_noise(struct perf_evsel *evsel, double avg)
Ingo Molnar42202dd2009-06-13 14:57:28 +0200508{
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200509 struct perf_stat *ps;
510
Peter Zijlstra849abde2009-09-04 18:23:38 +0200511 if (run_count == 1)
512 return;
513
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200514 ps = evsel->priv;
Ingo Molnarf99844c2011-04-27 05:35:39 +0200515 print_noise_pct(stddev_stats(&ps->res_stats[0]), avg);
Ingo Molnar42202dd2009-06-13 14:57:28 +0200516}
517
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200518static void nsec_printout(int cpu, struct perf_evsel *evsel, double avg)
Ingo Molnar42202dd2009-06-13 14:57:28 +0200519{
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200520 double msecs = avg / 1e6;
Stephane Eraniand7470b62010-12-01 18:49:05 +0200521 char cpustr[16] = { '\0', };
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200522 const char *fmt = csv_output ? "%s%.6f%s%s" : "%s%18.6f%s%-25s";
Ingo Molnar42202dd2009-06-13 14:57:28 +0200523
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200524 if (no_aggr)
Stephane Eraniand7470b62010-12-01 18:49:05 +0200525 sprintf(cpustr, "CPU%*d%s",
526 csv_output ? 0 : -4,
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200527 evsel_list->cpus->map[cpu], csv_sep);
Stephane Eraniand7470b62010-12-01 18:49:05 +0200528
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200529 fprintf(stderr, fmt, cpustr, msecs, csv_sep, event_name(evsel));
Stephane Eraniand7470b62010-12-01 18:49:05 +0200530
Stephane Eranian023695d2011-02-14 11:20:01 +0200531 if (evsel->cgrp)
532 fprintf(stderr, "%s%s", csv_sep, evsel->cgrp->name);
533
Stephane Eraniand7470b62010-12-01 18:49:05 +0200534 if (csv_output)
535 return;
Ingo Molnar42202dd2009-06-13 14:57:28 +0200536
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200537 if (perf_evsel__match(evsel, SOFTWARE, SW_TASK_CLOCK))
Ingo Molnar481f9882011-04-27 04:34:16 +0200538 fprintf(stderr, " # %8.3f CPUs utilized ", avg / avg_stats(&walltime_nsecs_stats));
Ingo Molnar42202dd2009-06-13 14:57:28 +0200539}
540
Ingo Molnard3d1e862011-04-29 13:49:08 +0200541static void print_stalled_cycles_frontend(int cpu, struct perf_evsel *evsel __used, double avg)
542{
543 double total, ratio = 0.0;
544 const char *color;
545
546 total = avg_stats(&runtime_cycles_stats[cpu]);
547
548 if (total)
549 ratio = avg / total * 100.0;
550
551 color = PERF_COLOR_NORMAL;
Ingo Molnar2b427e12011-04-29 14:16:18 +0200552 if (ratio > 50.0)
Ingo Molnard3d1e862011-04-29 13:49:08 +0200553 color = PERF_COLOR_RED;
Ingo Molnar2b427e12011-04-29 14:16:18 +0200554 else if (ratio > 30.0)
Ingo Molnard3d1e862011-04-29 13:49:08 +0200555 color = PERF_COLOR_MAGENTA;
Ingo Molnar2b427e12011-04-29 14:16:18 +0200556 else if (ratio > 10.0)
Ingo Molnard3d1e862011-04-29 13:49:08 +0200557 color = PERF_COLOR_YELLOW;
558
Ingo Molnarfce3c782011-04-30 09:03:15 +0200559 fprintf(stderr, " # ");
560 color_fprintf(stderr, color, "%6.2f%%", ratio);
Ingo Molnard3d1e862011-04-29 13:49:08 +0200561 fprintf(stderr, " frontend cycles idle ");
562}
563
564static void print_stalled_cycles_backend(int cpu, struct perf_evsel *evsel __used, double avg)
Ingo Molnara5d243d2011-04-27 05:39:24 +0200565{
566 double total, ratio = 0.0;
567 const char *color;
568
569 total = avg_stats(&runtime_cycles_stats[cpu]);
570
571 if (total)
572 ratio = avg / total * 100.0;
573
574 color = PERF_COLOR_NORMAL;
575 if (ratio > 75.0)
576 color = PERF_COLOR_RED;
577 else if (ratio > 50.0)
578 color = PERF_COLOR_MAGENTA;
Ingo Molnar2b427e12011-04-29 14:16:18 +0200579 else if (ratio > 20.0)
Ingo Molnara5d243d2011-04-27 05:39:24 +0200580 color = PERF_COLOR_YELLOW;
581
Ingo Molnarfce3c782011-04-30 09:03:15 +0200582 fprintf(stderr, " # ");
583 color_fprintf(stderr, color, "%6.2f%%", ratio);
584 fprintf(stderr, " backend cycles idle ");
Ingo Molnara5d243d2011-04-27 05:39:24 +0200585}
586
Ingo Molnarc78df6c2011-04-27 12:16:10 +0200587static void print_branch_misses(int cpu, struct perf_evsel *evsel __used, double avg)
588{
589 double total, ratio = 0.0;
590 const char *color;
591
592 total = avg_stats(&runtime_branches_stats[cpu]);
593
594 if (total)
595 ratio = avg / total * 100.0;
596
597 color = PERF_COLOR_NORMAL;
598 if (ratio > 20.0)
599 color = PERF_COLOR_RED;
600 else if (ratio > 10.0)
601 color = PERF_COLOR_MAGENTA;
602 else if (ratio > 5.0)
603 color = PERF_COLOR_YELLOW;
604
Ingo Molnarfce3c782011-04-30 09:03:15 +0200605 fprintf(stderr, " # ");
606 color_fprintf(stderr, color, "%6.2f%%", ratio);
Ingo Molnarc78df6c2011-04-27 12:16:10 +0200607 fprintf(stderr, " of all branches ");
608}
609
Ingo Molnar8bb6c792011-04-27 13:25:24 +0200610static void print_l1_dcache_misses(int cpu, struct perf_evsel *evsel __used, double avg)
611{
612 double total, ratio = 0.0;
613 const char *color;
614
615 total = avg_stats(&runtime_l1_dcache_stats[cpu]);
616
617 if (total)
618 ratio = avg / total * 100.0;
619
620 color = PERF_COLOR_NORMAL;
621 if (ratio > 20.0)
622 color = PERF_COLOR_RED;
623 else if (ratio > 10.0)
624 color = PERF_COLOR_MAGENTA;
625 else if (ratio > 5.0)
626 color = PERF_COLOR_YELLOW;
627
Ingo Molnarfce3c782011-04-30 09:03:15 +0200628 fprintf(stderr, " # ");
629 color_fprintf(stderr, color, "%6.2f%%", ratio);
Ingo Molnar8bb6c792011-04-27 13:25:24 +0200630 fprintf(stderr, " of all L1-dcache hits ");
631}
632
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200633static void abs_printout(int cpu, struct perf_evsel *evsel, double avg)
Ingo Molnar42202dd2009-06-13 14:57:28 +0200634{
Ingo Molnarc7f7fea2009-09-22 14:53:51 +0200635 double total, ratio = 0.0;
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200636 char cpustr[16] = { '\0', };
Stephane Eraniand7470b62010-12-01 18:49:05 +0200637 const char *fmt;
638
639 if (csv_output)
640 fmt = "%s%.0f%s%s";
641 else if (big_num)
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200642 fmt = "%s%'18.0f%s%-25s";
Stephane Eraniand7470b62010-12-01 18:49:05 +0200643 else
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200644 fmt = "%s%18.0f%s%-25s";
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200645
646 if (no_aggr)
Stephane Eraniand7470b62010-12-01 18:49:05 +0200647 sprintf(cpustr, "CPU%*d%s",
648 csv_output ? 0 : -4,
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200649 evsel_list->cpus->map[cpu], csv_sep);
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200650 else
651 cpu = 0;
Ingo Molnarc7f7fea2009-09-22 14:53:51 +0200652
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200653 fprintf(stderr, fmt, cpustr, avg, csv_sep, event_name(evsel));
Stephane Eraniand7470b62010-12-01 18:49:05 +0200654
Stephane Eranian023695d2011-02-14 11:20:01 +0200655 if (evsel->cgrp)
656 fprintf(stderr, "%s%s", csv_sep, evsel->cgrp->name);
657
Stephane Eraniand7470b62010-12-01 18:49:05 +0200658 if (csv_output)
659 return;
Ingo Molnar42202dd2009-06-13 14:57:28 +0200660
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200661 if (perf_evsel__match(evsel, HARDWARE, HW_INSTRUCTIONS)) {
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200662 total = avg_stats(&runtime_cycles_stats[cpu]);
Ingo Molnarc7f7fea2009-09-22 14:53:51 +0200663
664 if (total)
665 ratio = avg / total;
666
Ingo Molnarfce3c782011-04-30 09:03:15 +0200667 fprintf(stderr, " # %5.2f insns per cycle ", ratio);
Ingo Molnar481f9882011-04-27 04:34:16 +0200668
Ingo Molnard3d1e862011-04-29 13:49:08 +0200669 total = avg_stats(&runtime_stalled_cycles_front_stats[cpu]);
670 total = max(total, avg_stats(&runtime_stalled_cycles_back_stats[cpu]));
Ingo Molnar481f9882011-04-27 04:34:16 +0200671
672 if (total && avg) {
673 ratio = total / avg;
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200674 fprintf(stderr, "\n # %5.2f stalled cycles per insn", ratio);
Ingo Molnar481f9882011-04-27 04:34:16 +0200675 }
676
Arnaldo Carvalho de Melodaec78a2011-01-03 16:49:44 -0200677 } else if (perf_evsel__match(evsel, HARDWARE, HW_BRANCH_MISSES) &&
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200678 runtime_branches_stats[cpu].n != 0) {
Ingo Molnarc78df6c2011-04-27 12:16:10 +0200679 print_branch_misses(cpu, evsel, avg);
Ingo Molnar8bb6c792011-04-27 13:25:24 +0200680 } else if (
681 evsel->attr.type == PERF_TYPE_HW_CACHE &&
682 evsel->attr.config == ( PERF_COUNT_HW_CACHE_L1D |
683 ((PERF_COUNT_HW_CACHE_OP_READ) << 8) |
684 ((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16)) &&
Ingo Molnarc6264de2011-04-27 13:50:47 +0200685 runtime_l1_dcache_stats[cpu].n != 0) {
Ingo Molnar8bb6c792011-04-27 13:25:24 +0200686 print_l1_dcache_misses(cpu, evsel, avg);
Ingo Molnard58f4c82011-04-27 03:42:18 +0200687 } else if (perf_evsel__match(evsel, HARDWARE, HW_CACHE_MISSES) &&
688 runtime_cacherefs_stats[cpu].n != 0) {
689 total = avg_stats(&runtime_cacherefs_stats[cpu]);
690
691 if (total)
692 ratio = avg * 100 / total;
693
Ingo Molnar481f9882011-04-27 04:34:16 +0200694 fprintf(stderr, " # %8.3f %% of all cache refs ", ratio);
Ingo Molnard58f4c82011-04-27 03:42:18 +0200695
Ingo Molnard3d1e862011-04-29 13:49:08 +0200696 } else if (perf_evsel__match(evsel, HARDWARE, HW_STALLED_CYCLES_FRONTEND)) {
697 print_stalled_cycles_frontend(cpu, evsel, avg);
Ingo Molnar129c04c2011-04-29 14:41:28 +0200698 } else if (perf_evsel__match(evsel, HARDWARE, HW_STALLED_CYCLES_BACKEND)) {
Ingo Molnard3d1e862011-04-29 13:49:08 +0200699 print_stalled_cycles_backend(cpu, evsel, avg);
Ingo Molnar481f9882011-04-27 04:34:16 +0200700 } else if (perf_evsel__match(evsel, HARDWARE, HW_CPU_CYCLES)) {
701 total = avg_stats(&runtime_nsecs_stats[cpu]);
702
703 if (total)
704 ratio = 1.0 * avg / total;
705
706 fprintf(stderr, " # %8.3f GHz ", ratio);
707 } else if (runtime_nsecs_stats[cpu].n != 0) {
708 total = avg_stats(&runtime_nsecs_stats[cpu]);
709
710 if (total)
711 ratio = 1000.0 * avg / total;
712
713 fprintf(stderr, " # %8.3f M/sec ", ratio);
Ingo Molnara5d243d2011-04-27 05:39:24 +0200714 } else {
715 fprintf(stderr, " ");
Ingo Molnar42202dd2009-06-13 14:57:28 +0200716 }
Ingo Molnar42202dd2009-06-13 14:57:28 +0200717}
718
719/*
720 * Print out the results of a single counter:
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200721 * aggregated counts in system-wide mode
Ingo Molnar42202dd2009-06-13 14:57:28 +0200722 */
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200723static void print_counter_aggr(struct perf_evsel *counter)
Ingo Molnar42202dd2009-06-13 14:57:28 +0200724{
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200725 struct perf_stat *ps = counter->priv;
726 double avg = avg_stats(&ps->res_stats[0]);
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200727 int scaled = counter->counts->scaled;
Ingo Molnar42202dd2009-06-13 14:57:28 +0200728
Ingo Molnar42202dd2009-06-13 14:57:28 +0200729 if (scaled == -1) {
Stephane Eranian023695d2011-02-14 11:20:01 +0200730 fprintf(stderr, "%*s%s%*s",
Stephane Eraniand7470b62010-12-01 18:49:05 +0200731 csv_output ? 0 : 18,
Stephane Eranian023695d2011-02-14 11:20:01 +0200732 "<not counted>",
733 csv_sep,
734 csv_output ? 0 : -24,
735 event_name(counter));
736
737 if (counter->cgrp)
738 fprintf(stderr, "%s%s", csv_sep, counter->cgrp->name);
739
740 fputc('\n', stderr);
Ingo Molnar42202dd2009-06-13 14:57:28 +0200741 return;
742 }
743
744 if (nsec_counter(counter))
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200745 nsec_printout(-1, counter, avg);
Ingo Molnar42202dd2009-06-13 14:57:28 +0200746 else
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200747 abs_printout(-1, counter, avg);
Peter Zijlstra849abde2009-09-04 18:23:38 +0200748
Stephane Eraniand7470b62010-12-01 18:49:05 +0200749 if (csv_output) {
750 fputc('\n', stderr);
751 return;
752 }
753
Peter Zijlstra849abde2009-09-04 18:23:38 +0200754 print_noise(counter, avg);
Ingo Molnar42202dd2009-06-13 14:57:28 +0200755
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200756 if (scaled) {
757 double avg_enabled, avg_running;
758
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200759 avg_enabled = avg_stats(&ps->res_stats[1]);
760 avg_running = avg_stats(&ps->res_stats[2]);
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200761
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200762 fprintf(stderr, " [%5.2f%%]", 100 * avg_running / avg_enabled);
Peter Zijlstra506d4bc2009-09-04 15:36:12 +0200763 }
Ingo Molnar42202dd2009-06-13 14:57:28 +0200764 fprintf(stderr, "\n");
765}
766
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200767/*
768 * Print out the results of a single counter:
769 * does not use aggregated count in system-wide
770 */
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200771static void print_counter(struct perf_evsel *counter)
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200772{
773 u64 ena, run, val;
774 int cpu;
775
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200776 for (cpu = 0; cpu < evsel_list->cpus->nr; cpu++) {
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -0200777 val = counter->counts->cpu[cpu].val;
778 ena = counter->counts->cpu[cpu].ena;
779 run = counter->counts->cpu[cpu].run;
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200780 if (run == 0 || ena == 0) {
Stephane Eranian023695d2011-02-14 11:20:01 +0200781 fprintf(stderr, "CPU%*d%s%*s%s%*s",
Stephane Eraniand7470b62010-12-01 18:49:05 +0200782 csv_output ? 0 : -4,
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -0200783 evsel_list->cpus->map[cpu], csv_sep,
Stephane Eraniand7470b62010-12-01 18:49:05 +0200784 csv_output ? 0 : 18,
785 "<not counted>", csv_sep,
Stephane Eranian023695d2011-02-14 11:20:01 +0200786 csv_output ? 0 : -24,
Stephane Eraniand7470b62010-12-01 18:49:05 +0200787 event_name(counter));
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200788
Stephane Eranian023695d2011-02-14 11:20:01 +0200789 if (counter->cgrp)
790 fprintf(stderr, "%s%s", csv_sep, counter->cgrp->name);
791
792 fputc('\n', stderr);
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200793 continue;
794 }
795
796 if (nsec_counter(counter))
797 nsec_printout(cpu, counter, val);
798 else
799 abs_printout(cpu, counter, val);
800
Stephane Eraniand7470b62010-12-01 18:49:05 +0200801 if (!csv_output) {
802 print_noise(counter, 1.0);
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200803
Ingo Molnarc6264de2011-04-27 13:50:47 +0200804 if (run != ena)
805 fprintf(stderr, " (%.2f%%)", 100.0 * run / ena);
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200806 }
Stephane Eranian023695d2011-02-14 11:20:01 +0200807 fputc('\n', stderr);
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200808 }
809}
810
Ingo Molnar42202dd2009-06-13 14:57:28 +0200811static void print_stat(int argc, const char **argv)
812{
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200813 struct perf_evsel *counter;
814 int i;
Ingo Molnar42202dd2009-06-13 14:57:28 +0200815
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200816 fflush(stdout);
817
Stephane Eraniand7470b62010-12-01 18:49:05 +0200818 if (!csv_output) {
819 fprintf(stderr, "\n");
820 fprintf(stderr, " Performance counter stats for ");
821 if(target_pid == -1 && target_tid == -1) {
822 fprintf(stderr, "\'%s", argv[0]);
823 for (i = 1; i < argc; i++)
824 fprintf(stderr, " %s", argv[i]);
825 } else if (target_pid != -1)
826 fprintf(stderr, "process id \'%d", target_pid);
827 else
828 fprintf(stderr, "thread id \'%d", target_tid);
Ingo Molnar44db76c2009-06-03 19:36:07 +0200829
Stephane Eraniand7470b62010-12-01 18:49:05 +0200830 fprintf(stderr, "\'");
831 if (run_count > 1)
832 fprintf(stderr, " (%d runs)", run_count);
833 fprintf(stderr, ":\n\n");
834 }
Ingo Molnar2996f5d2009-05-29 09:10:54 +0200835
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200836 if (no_aggr) {
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -0200837 list_for_each_entry(counter, &evsel_list->entries, node)
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200838 print_counter(counter);
839 } else {
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -0200840 list_for_each_entry(counter, &evsel_list->entries, node)
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200841 print_counter_aggr(counter);
842 }
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200843
Stephane Eraniand7470b62010-12-01 18:49:05 +0200844 if (!csv_output) {
845 fprintf(stderr, "\n");
846 fprintf(stderr, " %18.9f seconds time elapsed",
847 avg_stats(&walltime_nsecs_stats)/1e9);
848 if (run_count > 1) {
Ingo Molnarf99844c2011-04-27 05:35:39 +0200849 print_noise_pct(stddev_stats(&walltime_nsecs_stats),
850 avg_stats(&walltime_nsecs_stats));
Stephane Eraniand7470b62010-12-01 18:49:05 +0200851 }
852 fprintf(stderr, "\n\n");
Ingo Molnar566747e2009-06-27 06:24:32 +0200853 }
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200854}
855
Peter Zijlstraf7b7c262009-06-10 15:55:59 +0200856static volatile int signr = -1;
857
Ingo Molnar52425192009-05-26 09:17:18 +0200858static void skip_signal(int signo)
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200859{
Zhang, Yanmin6be28502010-03-18 11:36:03 -0300860 if(child_pid == -1)
Liming Wang60666c62009-12-31 16:05:50 +0800861 done = 1;
862
Peter Zijlstraf7b7c262009-06-10 15:55:59 +0200863 signr = signo;
864}
865
866static void sig_atexit(void)
867{
Chris Wilson933da832009-10-04 01:35:01 +0100868 if (child_pid != -1)
869 kill(child_pid, SIGTERM);
870
Peter Zijlstraf7b7c262009-06-10 15:55:59 +0200871 if (signr == -1)
872 return;
873
874 signal(signr, SIG_DFL);
875 kill(getpid(), signr);
Ingo Molnar52425192009-05-26 09:17:18 +0200876}
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200877
/* NULL-terminated usage synopsis handed to the option parser. */
static const char * const stat_usage[] = { "perf stat [<options>] [<command>]", NULL };
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200882
Stephane Eraniand7470b62010-12-01 18:49:05 +0200883static int stat__set_big_num(const struct option *opt __used,
884 const char *s __used, int unset)
885{
886 big_num_opt = unset ? 0 : 1;
887 return 0;
888}
889
Ingo Molnar52425192009-05-26 09:17:18 +0200890static const struct option options[] = {
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -0200891 OPT_CALLBACK('e', "event", &evsel_list, "event",
Thomas Gleixner86847b62009-06-06 12:24:17 +0200892 "event selector. use 'perf list' to list available events",
893 parse_events),
Frederic Weisbeckercfd748a2011-03-14 16:40:30 +0100894 OPT_CALLBACK(0, "filter", &evsel_list, "filter",
895 "event filter", parse_filter),
Stephane Eranian2e6cdf92010-05-12 10:40:01 +0200896 OPT_BOOLEAN('i', "no-inherit", &no_inherit,
897 "child tasks do not inherit counters"),
Ingo Molnar52425192009-05-26 09:17:18 +0200898 OPT_INTEGER('p', "pid", &target_pid,
Zhang, Yanmind6d901c2010-03-18 11:36:05 -0300899 "stat events on existing process id"),
900 OPT_INTEGER('t', "tid", &target_tid,
901 "stat events on existing thread id"),
Ingo Molnar52425192009-05-26 09:17:18 +0200902 OPT_BOOLEAN('a', "all-cpus", &system_wide,
Jaswinder Singh Rajput3d632592009-06-24 18:19:34 +0530903 "system-wide collection from all CPUs"),
Brice Goglinb26bc5a2009-08-07 10:18:39 +0200904 OPT_BOOLEAN('c', "scale", &scale,
Jaswinder Singh Rajput3d632592009-06-24 18:19:34 +0530905 "scale/normalize counters"),
Ian Munsiec0555642010-04-13 18:37:33 +1000906 OPT_INCR('v', "verbose", &verbose,
Ingo Molnar743ee1f2009-06-07 17:06:46 +0200907 "be more verbose (show counter open errors, etc)"),
Ingo Molnar42202dd2009-06-13 14:57:28 +0200908 OPT_INTEGER('r', "repeat", &run_count,
909 "repeat command and print average + stddev (max: 100)"),
Ingo Molnar0cfb7a12009-06-27 06:10:30 +0200910 OPT_BOOLEAN('n', "null", &null_run,
911 "null run - dont start any counters"),
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200912 OPT_INCR('d', "detailed", &detailed_run,
Ingo Molnarc6264de2011-04-27 13:50:47 +0200913 "detailed run - start a lot of events"),
Ingo Molnarf9cef0a2011-04-28 18:17:11 +0200914 OPT_BOOLEAN('S', "sync", &sync_run,
915 "call sync() before starting a run"),
Stephane Eraniand7470b62010-12-01 18:49:05 +0200916 OPT_CALLBACK_NOOPT('B', "big-num", NULL, NULL,
917 "print large numbers with thousands\' separators",
918 stat__set_big_num),
Stephane Eranianc45c6ea2010-05-28 12:00:01 +0200919 OPT_STRING('C', "cpu", &cpu_list, "cpu",
920 "list of cpus to monitor in system-wide"),
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +0200921 OPT_BOOLEAN('A', "no-aggr", &no_aggr,
922 "disable CPU count aggregation"),
Stephane Eraniand7470b62010-12-01 18:49:05 +0200923 OPT_STRING('x', "field-separator", &csv_sep, "separator",
924 "print counts with custom separator"),
Stephane Eranian023695d2011-02-14 11:20:01 +0200925 OPT_CALLBACK('G', "cgroup", &evsel_list, "name",
926 "monitor event in cgroup name only",
927 parse_cgroups),
Ingo Molnar52425192009-05-26 09:17:18 +0200928 OPT_END()
929};
Ingo Molnarddcacfa2009-04-20 15:37:32 +0200930
Ingo Molnar2cba3ff2011-05-19 13:30:56 +0200931/*
932 * Add default attributes, if there were no attributes specified or
933 * if -d/--detailed, -d -d or -d -d -d is used:
934 */
935static int add_default_attributes(void)
936{
937 struct perf_evsel *pos;
938 size_t attr_nr = 0;
939 size_t c;
940
941 /* Set attrs if no event is selected and !null_run: */
942 if (null_run)
943 return 0;
944
945 if (!evsel_list->nr_entries) {
946 for (c = 0; c < ARRAY_SIZE(default_attrs); c++) {
947 pos = perf_evsel__new(default_attrs + c, c + attr_nr);
948 if (pos == NULL)
949 return -1;
950 perf_evlist__add(evsel_list, pos);
951 }
952 attr_nr += c;
953 }
954
955 /* Detailed events get appended to the event list: */
956
957 if (detailed_run < 1)
958 return 0;
959
960 /* Append detailed run extra attributes: */
961 for (c = 0; c < ARRAY_SIZE(detailed_attrs); c++) {
962 pos = perf_evsel__new(detailed_attrs + c, c + attr_nr);
963 if (pos == NULL)
964 return -1;
965 perf_evlist__add(evsel_list, pos);
966 }
967 attr_nr += c;
968
969 if (detailed_run < 2)
970 return 0;
971
972 /* Append very detailed run extra attributes: */
973 for (c = 0; c < ARRAY_SIZE(very_detailed_attrs); c++) {
974 pos = perf_evsel__new(very_detailed_attrs + c, c + attr_nr);
975 if (pos == NULL)
976 return -1;
977 perf_evlist__add(evsel_list, pos);
978 }
979
980 if (detailed_run < 3)
981 return 0;
982
983 /* Append very, very detailed run extra attributes: */
984 for (c = 0; c < ARRAY_SIZE(very_very_detailed_attrs); c++) {
985 pos = perf_evsel__new(very_very_detailed_attrs + c, c + attr_nr);
986 if (pos == NULL)
987 return -1;
988 perf_evlist__add(evsel_list, pos);
989 }
990
991
992 return 0;
993}
994
Ingo Molnarf37a2912009-07-01 12:37:06 +0200995int cmd_stat(int argc, const char **argv, const char *prefix __used)
Ingo Molnar52425192009-05-26 09:17:18 +0200996{
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -0200997 struct perf_evsel *pos;
998 int status = -ENOMEM;
Ingo Molnar42202dd2009-06-13 14:57:28 +0200999
Stephane Eranian5af52b52010-05-18 15:00:01 +02001000 setlocale(LC_ALL, "");
1001
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -02001002 evsel_list = perf_evlist__new(NULL, NULL);
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -02001003 if (evsel_list == NULL)
1004 return -ENOMEM;
1005
Anton Blancharda0541232009-07-22 23:04:12 +10001006 argc = parse_options(argc, argv, options, stat_usage,
1007 PARSE_OPT_STOP_AT_NON_OPTION);
Stephane Eraniand7470b62010-12-01 18:49:05 +02001008
1009 if (csv_sep)
1010 csv_output = true;
1011 else
1012 csv_sep = DEFAULT_SEPARATOR;
1013
1014 /*
1015 * let the spreadsheet do the pretty-printing
1016 */
1017 if (csv_output) {
1018 /* User explicitely passed -B? */
1019 if (big_num_opt == 1) {
1020 fprintf(stderr, "-B option not supported with -x\n");
1021 usage_with_options(stat_usage, options);
1022 } else /* Nope, so disable big number formatting */
1023 big_num = false;
1024 } else if (big_num_opt == 0) /* User passed --no-big-num */
1025 big_num = false;
1026
Zhang, Yanmind6d901c2010-03-18 11:36:05 -03001027 if (!argc && target_pid == -1 && target_tid == -1)
Ingo Molnar52425192009-05-26 09:17:18 +02001028 usage_with_options(stat_usage, options);
Peter Zijlstra9e9772c2009-09-04 15:36:08 +02001029 if (run_count <= 0)
Ingo Molnar42202dd2009-06-13 14:57:28 +02001030 usage_with_options(stat_usage, options);
Ingo Molnarddcacfa2009-04-20 15:37:32 +02001031
Stephane Eranian023695d2011-02-14 11:20:01 +02001032 /* no_aggr, cgroup are for system-wide only */
1033 if ((no_aggr || nr_cgroups) && !system_wide) {
1034 fprintf(stderr, "both cgroup and no-aggregation "
1035 "modes only available in system-wide mode\n");
1036
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +02001037 usage_with_options(stat_usage, options);
Stephane Eranian023695d2011-02-14 11:20:01 +02001038 }
Stephane Eranianf5b4a9c32010-11-16 11:05:01 +02001039
Ingo Molnar2cba3ff2011-05-19 13:30:56 +02001040 if (add_default_attributes())
1041 goto out;
Ingo Molnarddcacfa2009-04-20 15:37:32 +02001042
Arnaldo Carvalho de Melo5c98d4662011-01-03 17:53:33 -02001043 if (target_pid != -1)
1044 target_tid = target_pid;
1045
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -02001046 evsel_list->threads = thread_map__new(target_pid, target_tid);
1047 if (evsel_list->threads == NULL) {
Arnaldo Carvalho de Melo5c98d4662011-01-03 17:53:33 -02001048 pr_err("Problems finding threads of monitor\n");
1049 usage_with_options(stat_usage, options);
1050 }
1051
Paul Mackerrasa12b51c2010-03-10 20:36:09 +11001052 if (system_wide)
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -02001053 evsel_list->cpus = cpu_map__new(cpu_list);
Paul Mackerrasa12b51c2010-03-10 20:36:09 +11001054 else
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -02001055 evsel_list->cpus = cpu_map__dummy_new();
Ingo Molnarddcacfa2009-04-20 15:37:32 +02001056
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -02001057 if (evsel_list->cpus == NULL) {
Arnaldo Carvalho de Melo60d567e2011-01-03 17:49:48 -02001058 perror("failed to parse CPUs map");
Stephane Eranianc45c6ea2010-05-28 12:00:01 +02001059 usage_with_options(stat_usage, options);
Arnaldo Carvalho de Melo60d567e2011-01-03 17:49:48 -02001060 return -1;
1061 }
Stephane Eranianc45c6ea2010-05-28 12:00:01 +02001062
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -02001063 list_for_each_entry(pos, &evsel_list->entries, node) {
Arnaldo Carvalho de Meloc52b12e2011-01-03 17:45:52 -02001064 if (perf_evsel__alloc_stat_priv(pos) < 0 ||
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -02001065 perf_evsel__alloc_counts(pos, evsel_list->cpus->nr) < 0 ||
1066 perf_evsel__alloc_fd(pos, evsel_list->cpus->nr, evsel_list->threads->nr) < 0)
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -02001067 goto out_free_fd;
Zhang, Yanmind6d901c2010-03-18 11:36:05 -03001068 }
1069
Ingo Molnar58d7e992009-05-15 11:03:23 +02001070 /*
1071 * We dont want to block the signals - that would cause
1072 * child tasks to inherit that and Ctrl-C would not work.
1073 * What we want is for Ctrl-C to work in the exec()-ed
1074 * task, but being ignored by perf stat itself:
1075 */
Peter Zijlstraf7b7c262009-06-10 15:55:59 +02001076 atexit(sig_atexit);
Ingo Molnar58d7e992009-05-15 11:03:23 +02001077 signal(SIGINT, skip_signal);
1078 signal(SIGALRM, skip_signal);
1079 signal(SIGABRT, skip_signal);
1080
Ingo Molnar42202dd2009-06-13 14:57:28 +02001081 status = 0;
1082 for (run_idx = 0; run_idx < run_count; run_idx++) {
1083 if (run_count != 1 && verbose)
Jaswinder Singh Rajput3d632592009-06-24 18:19:34 +05301084 fprintf(stderr, "[ perf stat: executing run #%d ... ]\n", run_idx + 1);
Ingo Molnarf9cef0a2011-04-28 18:17:11 +02001085
1086 if (sync_run)
1087 sync();
1088
Ingo Molnar42202dd2009-06-13 14:57:28 +02001089 status = run_perf_stat(argc, argv);
1090 }
1091
Arnaldo Carvalho de Melo084ab9f2010-03-22 13:10:28 -03001092 if (status != -1)
1093 print_stat(argc, argv);
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -02001094out_free_fd:
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -02001095 list_for_each_entry(pos, &evsel_list->entries, node)
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -02001096 perf_evsel__free_stat_priv(pos);
Arnaldo Carvalho de Melo7e2ed092011-01-30 11:59:43 -02001097 perf_evlist__delete_maps(evsel_list);
Arnaldo Carvalho de Melo0015e2e2011-02-01 16:18:10 -02001098out:
1099 perf_evlist__delete(evsel_list);
Ingo Molnar42202dd2009-06-13 14:57:28 +02001100 return status;
Ingo Molnarddcacfa2009-04-20 15:37:32 +02001101}