Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
Arnaldo Carvalho de Melo | a43783a | 2017-04-18 10:46:11 -0300 | [diff] [blame] | 2 | #include <errno.h> |
Arnaldo Carvalho de Melo | fd20e81 | 2017-04-17 15:23:08 -0300 | [diff] [blame] | 3 | #include <inttypes.h> |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 4 | #include <math.h> |
Arnaldo Carvalho de Melo | f2a39fe | 2019-08-30 14:45:20 -0300 | [diff] [blame] | 5 | #include <string.h> |
Arnaldo Carvalho de Melo | bfc4918 | 2019-08-21 14:02:05 -0300 | [diff] [blame] | 6 | #include "counts.h" |
Arnaldo Carvalho de Melo | 87ffb6c | 2019-09-10 16:29:02 +0100 | [diff] [blame] | 7 | #include "cpumap.h" |
Arnaldo Carvalho de Melo | b420902 | 2019-08-29 15:56:40 -0300 | [diff] [blame] | 8 | #include "debug.h" |
Arnaldo Carvalho de Melo | f2a39fe | 2019-08-30 14:45:20 -0300 | [diff] [blame] | 9 | #include "header.h" |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 10 | #include "stat.h" |
Arnaldo Carvalho de Melo | f2a39fe | 2019-08-30 14:45:20 -0300 | [diff] [blame] | 11 | #include "session.h" |
Arnaldo Carvalho de Melo | aeb00b1 | 2019-08-22 15:40:29 -0300 | [diff] [blame] | 12 | #include "target.h" |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 13 | #include "evlist.h" |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 14 | #include "evsel.h" |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 15 | #include "thread_map.h" |
Arnaldo Carvalho de Melo | 7f7c536 | 2019-07-04 11:32:27 -0300 | [diff] [blame] | 16 | #include <linux/zalloc.h> |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 17 | |
| 18 | void update_stats(struct stats *stats, u64 val) |
| 19 | { |
| 20 | double delta; |
| 21 | |
| 22 | stats->n++; |
| 23 | delta = val - stats->mean; |
| 24 | stats->mean += delta / stats->n; |
| 25 | stats->M2 += delta*(val - stats->mean); |
David Ahern | ffe4f3c | 2013-08-02 14:05:40 -0600 | [diff] [blame] | 26 | |
| 27 | if (val > stats->max) |
| 28 | stats->max = val; |
| 29 | |
| 30 | if (val < stats->min) |
| 31 | stats->min = val; |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 32 | } |
| 33 | |
| 34 | double avg_stats(struct stats *stats) |
| 35 | { |
| 36 | return stats->mean; |
| 37 | } |
| 38 | |
| 39 | /* |
| 40 | * http://en.wikipedia.org/wiki/Algorithms_for_calculating_variance |
| 41 | * |
| 42 | * (\Sum n_i^2) - ((\Sum n_i)^2)/n |
| 43 | * s^2 = ------------------------------- |
| 44 | * n - 1 |
| 45 | * |
| 46 | * http://en.wikipedia.org/wiki/Stddev |
| 47 | * |
| 48 | * The std dev of the mean is related to the std dev by: |
| 49 | * |
| 50 | * s |
| 51 | * s_mean = ------- |
| 52 | * sqrt(n) |
| 53 | * |
| 54 | */ |
| 55 | double stddev_stats(struct stats *stats) |
| 56 | { |
| 57 | double variance, variance_mean; |
| 58 | |
David Ahern | 45528f7 | 2013-05-25 18:24:48 -0600 | [diff] [blame] | 59 | if (stats->n < 2) |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 60 | return 0.0; |
| 61 | |
| 62 | variance = stats->M2 / (stats->n - 1); |
| 63 | variance_mean = variance / stats->n; |
| 64 | |
| 65 | return sqrt(variance_mean); |
| 66 | } |
| 67 | |
/*
 * Express @stddev as a percentage of @avg.
 *
 * Returns 0.0 when @avg is zero so that no division by zero takes place.
 */
double rel_stddev_stats(double stddev, double avg)
{
	if (!avg)
		return 0.0;

	return 100.0 * stddev / avg;
}
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 77 | |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 78 | bool __perf_evsel_stat__is(struct evsel *evsel, |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 79 | enum perf_stat_evsel_id id) |
| 80 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 81 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 82 | |
| 83 | return ps->id == id; |
| 84 | } |
| 85 | |
| 86 | #define ID(id, name) [PERF_STAT_EVSEL_ID__##id] = #name |
| 87 | static const char *id_str[PERF_STAT_EVSEL_ID__MAX] = { |
Jiri Olsa | 4c358d5 | 2015-06-03 16:25:52 +0200 | [diff] [blame] | 88 | ID(NONE, x), |
| 89 | ID(CYCLES_IN_TX, cpu/cycles-t/), |
| 90 | ID(TRANSACTION_START, cpu/tx-start/), |
| 91 | ID(ELISION_START, cpu/el-start/), |
| 92 | ID(CYCLES_IN_TX_CP, cpu/cycles-ct/), |
Andi Kleen | 239bd47 | 2016-05-24 12:52:37 -0700 | [diff] [blame] | 93 | ID(TOPDOWN_TOTAL_SLOTS, topdown-total-slots), |
| 94 | ID(TOPDOWN_SLOTS_ISSUED, topdown-slots-issued), |
| 95 | ID(TOPDOWN_SLOTS_RETIRED, topdown-slots-retired), |
| 96 | ID(TOPDOWN_FETCH_BUBBLES, topdown-fetch-bubbles), |
| 97 | ID(TOPDOWN_RECOVERY_BUBBLES, topdown-recovery-bubbles), |
Andi Kleen | 55c36a9 | 2020-09-11 07:48:07 -0700 | [diff] [blame] | 98 | ID(TOPDOWN_RETIRING, topdown-retiring), |
| 99 | ID(TOPDOWN_BAD_SPEC, topdown-bad-spec), |
| 100 | ID(TOPDOWN_FE_BOUND, topdown-fe-bound), |
| 101 | ID(TOPDOWN_BE_BOUND, topdown-be-bound), |
Kan Liang | daefd0b | 2017-05-26 12:05:38 -0700 | [diff] [blame] | 102 | ID(SMI_NUM, msr/smi/), |
| 103 | ID(APERF, msr/aperf/), |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 104 | }; |
| 105 | #undef ID |
| 106 | |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 107 | static void perf_stat_evsel_id_init(struct evsel *evsel) |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 108 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 109 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 110 | int i; |
| 111 | |
| 112 | /* ps->id is 0 hence PERF_STAT_EVSEL_ID__NONE by default */ |
| 113 | |
| 114 | for (i = 0; i < PERF_STAT_EVSEL_ID__MAX; i++) { |
Arnaldo Carvalho de Melo | 8ab2e96 | 2020-04-29 16:07:09 -0300 | [diff] [blame] | 115 | if (!strcmp(evsel__name(evsel), id_str[i])) { |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 116 | ps->id = i; |
| 117 | break; |
| 118 | } |
| 119 | } |
| 120 | } |
Jiri Olsa | a9a3a4d | 2015-06-14 10:19:26 +0200 | [diff] [blame] | 121 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 122 | static void evsel__reset_stat_priv(struct evsel *evsel) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 123 | { |
| 124 | int i; |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 125 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 126 | |
| 127 | for (i = 0; i < 3; i++) |
| 128 | init_stats(&ps->res_stats[i]); |
| 129 | |
| 130 | perf_stat_evsel_id_init(evsel); |
| 131 | } |
| 132 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 133 | static int evsel__alloc_stat_priv(struct evsel *evsel) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 134 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 135 | evsel->stats = zalloc(sizeof(struct perf_stat_evsel)); |
| 136 | if (evsel->stats == NULL) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 137 | return -ENOMEM; |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 138 | evsel__reset_stat_priv(evsel); |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 139 | return 0; |
| 140 | } |
| 141 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 142 | static void evsel__free_stat_priv(struct evsel *evsel) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 143 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 144 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | f7794d5 | 2017-07-26 14:02:05 +0200 | [diff] [blame] | 145 | |
| 146 | if (ps) |
Arnaldo Carvalho de Melo | d8f9da2 | 2019-07-04 12:06:20 -0300 | [diff] [blame] | 147 | zfree(&ps->group_data); |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 148 | zfree(&evsel->stats); |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 149 | } |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 150 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 151 | static int evsel__alloc_prev_raw_counts(struct evsel *evsel, int ncpus, int nthreads) |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 152 | { |
| 153 | struct perf_counts *counts; |
| 154 | |
| 155 | counts = perf_counts__new(ncpus, nthreads); |
| 156 | if (counts) |
| 157 | evsel->prev_raw_counts = counts; |
| 158 | |
| 159 | return counts ? 0 : -ENOMEM; |
| 160 | } |
| 161 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 162 | static void evsel__free_prev_raw_counts(struct evsel *evsel) |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 163 | { |
| 164 | perf_counts__delete(evsel->prev_raw_counts); |
| 165 | evsel->prev_raw_counts = NULL; |
| 166 | } |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 167 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 168 | static void evsel__reset_prev_raw_counts(struct evsel *evsel) |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 169 | { |
Jin Yao | cf4d9bd | 2020-05-20 12:27:34 +0800 | [diff] [blame] | 170 | if (evsel->prev_raw_counts) |
| 171 | perf_counts__reset(evsel->prev_raw_counts); |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 172 | } |
| 173 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 174 | static int evsel__alloc_stats(struct evsel *evsel, bool alloc_raw) |
Jiri Olsa | a7d0a10 | 2015-06-26 11:29:17 +0200 | [diff] [blame] | 175 | { |
Arnaldo Carvalho de Melo | 5eb88f0 | 2020-04-29 15:45:09 -0300 | [diff] [blame] | 176 | int ncpus = evsel__nr_cpus(evsel); |
Jiri Olsa | a2f354e | 2019-08-22 13:11:41 +0200 | [diff] [blame] | 177 | int nthreads = perf_thread_map__nr(evsel->core.threads); |
Jiri Olsa | a7d0a10 | 2015-06-26 11:29:17 +0200 | [diff] [blame] | 178 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 179 | if (evsel__alloc_stat_priv(evsel) < 0 || |
| 180 | evsel__alloc_counts(evsel, ncpus, nthreads) < 0 || |
| 181 | (alloc_raw && evsel__alloc_prev_raw_counts(evsel, ncpus, nthreads) < 0)) |
Jiri Olsa | a7d0a10 | 2015-06-26 11:29:17 +0200 | [diff] [blame] | 182 | return -ENOMEM; |
| 183 | |
| 184 | return 0; |
| 185 | } |
| 186 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 187 | int evlist__alloc_stats(struct evlist *evlist, bool alloc_raw) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 188 | { |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 189 | struct evsel *evsel; |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 190 | |
Arnaldo Carvalho de Melo | e5cadb9 | 2016-06-23 11:26:15 -0300 | [diff] [blame] | 191 | evlist__for_each_entry(evlist, evsel) { |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 192 | if (evsel__alloc_stats(evsel, alloc_raw)) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 193 | goto out_free; |
| 194 | } |
| 195 | |
| 196 | return 0; |
| 197 | |
| 198 | out_free: |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 199 | evlist__free_stats(evlist); |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 200 | return -1; |
| 201 | } |
| 202 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 203 | void evlist__free_stats(struct evlist *evlist) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 204 | { |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 205 | struct evsel *evsel; |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 206 | |
Arnaldo Carvalho de Melo | e5cadb9 | 2016-06-23 11:26:15 -0300 | [diff] [blame] | 207 | evlist__for_each_entry(evlist, evsel) { |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 208 | evsel__free_stat_priv(evsel); |
| 209 | evsel__free_counts(evsel); |
| 210 | evsel__free_prev_raw_counts(evsel); |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 211 | } |
| 212 | } |
| 213 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 214 | void evlist__reset_stats(struct evlist *evlist) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 215 | { |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 216 | struct evsel *evsel; |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 217 | |
Arnaldo Carvalho de Melo | e5cadb9 | 2016-06-23 11:26:15 -0300 | [diff] [blame] | 218 | evlist__for_each_entry(evlist, evsel) { |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 219 | evsel__reset_stat_priv(evsel); |
| 220 | evsel__reset_counts(evsel); |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 221 | } |
| 222 | } |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 223 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 224 | void evlist__reset_prev_raw_counts(struct evlist *evlist) |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 225 | { |
| 226 | struct evsel *evsel; |
| 227 | |
| 228 | evlist__for_each_entry(evlist, evsel) |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 229 | evsel__reset_prev_raw_counts(evsel); |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 230 | } |
| 231 | |
Arnaldo Carvalho de Melo | 5693302 | 2020-11-30 09:08:24 -0300 | [diff] [blame] | 232 | static void evsel__copy_prev_raw_counts(struct evsel *evsel) |
Jin Yao | 297767a | 2020-05-20 12:27:35 +0800 | [diff] [blame] | 233 | { |
| 234 | int ncpus = evsel__nr_cpus(evsel); |
| 235 | int nthreads = perf_thread_map__nr(evsel->core.threads); |
| 236 | |
| 237 | for (int thread = 0; thread < nthreads; thread++) { |
| 238 | for (int cpu = 0; cpu < ncpus; cpu++) { |
| 239 | *perf_counts(evsel->counts, cpu, thread) = |
| 240 | *perf_counts(evsel->prev_raw_counts, cpu, |
| 241 | thread); |
| 242 | } |
| 243 | } |
| 244 | |
| 245 | evsel->counts->aggr = evsel->prev_raw_counts->aggr; |
| 246 | } |
| 247 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 248 | void evlist__copy_prev_raw_counts(struct evlist *evlist) |
Jin Yao | 297767a | 2020-05-20 12:27:35 +0800 | [diff] [blame] | 249 | { |
| 250 | struct evsel *evsel; |
| 251 | |
| 252 | evlist__for_each_entry(evlist, evsel) |
Arnaldo Carvalho de Melo | 5693302 | 2020-11-30 09:08:24 -0300 | [diff] [blame] | 253 | evsel__copy_prev_raw_counts(evsel); |
Jin Yao | 297767a | 2020-05-20 12:27:35 +0800 | [diff] [blame] | 254 | } |
| 255 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 256 | void evlist__save_aggr_prev_raw_counts(struct evlist *evlist) |
Jin Yao | 905365f | 2020-05-20 12:27:36 +0800 | [diff] [blame] | 257 | { |
| 258 | struct evsel *evsel; |
| 259 | |
| 260 | /* |
| 261 | * To collect the overall statistics for interval mode, |
| 262 | * we copy the counts from evsel->prev_raw_counts to |
| 263 | * evsel->counts. The perf_stat_process_counter creates |
| 264 | * aggr values from per cpu values, but the per cpu values |
| 265 | * are 0 for AGGR_GLOBAL. So we use a trick that saves the |
| 266 | * previous aggr value to the first member of perf_counts, |
| 267 | * then aggr calculation in process_counter_values can work |
| 268 | * correctly. |
| 269 | */ |
| 270 | evlist__for_each_entry(evlist, evsel) { |
| 271 | *perf_counts(evsel->prev_raw_counts, 0, 0) = |
| 272 | evsel->prev_raw_counts->aggr; |
| 273 | } |
| 274 | } |
| 275 | |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 276 | static void zero_per_pkg(struct evsel *counter) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 277 | { |
| 278 | if (counter->per_pkg_mask) |
Kyle Meyer | 92b5a15 | 2019-08-27 16:43:48 -0500 | [diff] [blame] | 279 | memset(counter->per_pkg_mask, 0, cpu__max_cpu()); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 280 | } |
| 281 | |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 282 | static int check_per_pkg(struct evsel *counter, |
Stephane Eranian | 02d8dab | 2015-09-03 15:23:40 +0200 | [diff] [blame] | 283 | struct perf_counts_values *vals, int cpu, bool *skip) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 284 | { |
| 285 | unsigned long *mask = counter->per_pkg_mask; |
Jiri Olsa | b49aca3 | 2019-07-21 13:24:05 +0200 | [diff] [blame] | 286 | struct perf_cpu_map *cpus = evsel__cpus(counter); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 287 | int s; |
| 288 | |
| 289 | *skip = false; |
| 290 | |
| 291 | if (!counter->per_pkg) |
| 292 | return 0; |
| 293 | |
Jiri Olsa | 315c0a1 | 2019-08-22 13:11:39 +0200 | [diff] [blame] | 294 | if (perf_cpu_map__empty(cpus)) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 295 | return 0; |
| 296 | |
| 297 | if (!mask) { |
Kyle Meyer | 92b5a15 | 2019-08-27 16:43:48 -0500 | [diff] [blame] | 298 | mask = zalloc(cpu__max_cpu()); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 299 | if (!mask) |
| 300 | return -ENOMEM; |
| 301 | |
| 302 | counter->per_pkg_mask = mask; |
| 303 | } |
| 304 | |
Stephane Eranian | 02d8dab | 2015-09-03 15:23:40 +0200 | [diff] [blame] | 305 | /* |
| 306 | * we do not consider an event that has not run as a good |
| 307 | * instance to mark a package as used (skip=1). Otherwise |
| 308 | * we may run into a situation where the first CPU in a package |
| 309 | * is not running anything, yet the second is, and this function |
| 310 | * would mark the package as used after the first CPU and would |
| 311 | * not read the values from the second CPU. |
| 312 | */ |
| 313 | if (!(vals->run && vals->ena)) |
| 314 | return 0; |
| 315 | |
James Clark | 1a270cb | 2020-11-26 16:13:25 +0200 | [diff] [blame^] | 316 | s = cpu_map__get_socket(cpus, cpu, NULL).socket; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 317 | if (s < 0) |
| 318 | return -1; |
| 319 | |
| 320 | *skip = test_and_set_bit(s, mask) == 1; |
| 321 | return 0; |
| 322 | } |
| 323 | |
| 324 | static int |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 325 | process_counter_values(struct perf_stat_config *config, struct evsel *evsel, |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 326 | int cpu, int thread, |
| 327 | struct perf_counts_values *count) |
| 328 | { |
| 329 | struct perf_counts_values *aggr = &evsel->counts->aggr; |
| 330 | static struct perf_counts_values zero; |
| 331 | bool skip = false; |
| 332 | |
Stephane Eranian | 02d8dab | 2015-09-03 15:23:40 +0200 | [diff] [blame] | 333 | if (check_per_pkg(evsel, count, cpu, &skip)) { |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 334 | pr_err("failed to read per-pkg counter\n"); |
| 335 | return -1; |
| 336 | } |
| 337 | |
| 338 | if (skip) |
| 339 | count = &zero; |
| 340 | |
| 341 | switch (config->aggr_mode) { |
| 342 | case AGGR_THREAD: |
| 343 | case AGGR_CORE: |
Kan Liang | db5742b | 2019-06-04 15:50:42 -0700 | [diff] [blame] | 344 | case AGGR_DIE: |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 345 | case AGGR_SOCKET: |
Jiri Olsa | 86895b4 | 2019-08-28 10:17:43 +0200 | [diff] [blame] | 346 | case AGGR_NODE: |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 347 | case AGGR_NONE: |
| 348 | if (!evsel->snapshot) |
Arnaldo Carvalho de Melo | 12f5261 | 2020-04-29 15:47:38 -0300 | [diff] [blame] | 349 | evsel__compute_deltas(evsel, cpu, thread, count); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 350 | perf_counts_values__scale(count, config->scale, NULL); |
Jin Yao | 4fc4d8d | 2019-04-12 21:59:49 +0800 | [diff] [blame] | 351 | if ((config->aggr_mode == AGGR_NONE) && (!evsel->percore)) { |
| 352 | perf_stat__update_shadow_stats(evsel, count->val, |
| 353 | cpu, &rt_stat); |
| 354 | } |
| 355 | |
Jin Yao | 14e72a2 | 2017-12-05 22:03:08 +0800 | [diff] [blame] | 356 | if (config->aggr_mode == AGGR_THREAD) { |
| 357 | if (config->stats) |
| 358 | perf_stat__update_shadow_stats(evsel, |
| 359 | count->val, 0, &config->stats[thread]); |
| 360 | else |
| 361 | perf_stat__update_shadow_stats(evsel, |
| 362 | count->val, 0, &rt_stat); |
| 363 | } |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 364 | break; |
| 365 | case AGGR_GLOBAL: |
| 366 | aggr->val += count->val; |
Andi Kleen | 75998bb | 2019-03-14 15:50:01 -0700 | [diff] [blame] | 367 | aggr->ena += count->ena; |
| 368 | aggr->run += count->run; |
Jiri Olsa | 208df99 | 2015-10-16 12:41:04 +0200 | [diff] [blame] | 369 | case AGGR_UNSET: |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 370 | default: |
| 371 | break; |
| 372 | } |
| 373 | |
| 374 | return 0; |
| 375 | } |
| 376 | |
| 377 | static int process_counter_maps(struct perf_stat_config *config, |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 378 | struct evsel *counter) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 379 | { |
Jiri Olsa | a2f354e | 2019-08-22 13:11:41 +0200 | [diff] [blame] | 380 | int nthreads = perf_thread_map__nr(counter->core.threads); |
Arnaldo Carvalho de Melo | 5eb88f0 | 2020-04-29 15:45:09 -0300 | [diff] [blame] | 381 | int ncpus = evsel__nr_cpus(counter); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 382 | int cpu, thread; |
| 383 | |
Jiri Olsa | 648b5af | 2019-08-06 11:35:19 +0200 | [diff] [blame] | 384 | if (counter->core.system_wide) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 385 | nthreads = 1; |
| 386 | |
| 387 | for (thread = 0; thread < nthreads; thread++) { |
| 388 | for (cpu = 0; cpu < ncpus; cpu++) { |
| 389 | if (process_counter_values(config, counter, cpu, thread, |
| 390 | perf_counts(counter->counts, cpu, thread))) |
| 391 | return -1; |
| 392 | } |
| 393 | } |
| 394 | |
| 395 | return 0; |
| 396 | } |
| 397 | |
| 398 | int perf_stat_process_counter(struct perf_stat_config *config, |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 399 | struct evsel *counter) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 400 | { |
| 401 | struct perf_counts_values *aggr = &counter->counts->aggr; |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 402 | struct perf_stat_evsel *ps = counter->stats; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 403 | u64 *count = counter->counts->aggr.values; |
| 404 | int i, ret; |
| 405 | |
| 406 | aggr->val = aggr->ena = aggr->run = 0; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 407 | |
Jiri Olsa | 51fd2df | 2016-02-03 08:43:56 +0100 | [diff] [blame] | 408 | /* |
| 409 | * We calculate counter's data every interval, |
| 410 | * and the display code shows ps->res_stats |
| 411 | * avg value. We need to zero the stats for |
| 412 | * interval mode, otherwise overall avg running |
| 413 | * averages will be shown for each interval. |
| 414 | */ |
Jin Yao | c7e5b32 | 2020-05-20 12:27:37 +0800 | [diff] [blame] | 415 | if (config->interval || config->summary) { |
Jin Yao | 0e0bf1e | 2020-04-09 15:07:55 +0800 | [diff] [blame] | 416 | for (i = 0; i < 3; i++) |
| 417 | init_stats(&ps->res_stats[i]); |
| 418 | } |
Jiri Olsa | 51fd2df | 2016-02-03 08:43:56 +0100 | [diff] [blame] | 419 | |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 420 | if (counter->per_pkg) |
| 421 | zero_per_pkg(counter); |
| 422 | |
| 423 | ret = process_counter_maps(config, counter); |
| 424 | if (ret) |
| 425 | return ret; |
| 426 | |
| 427 | if (config->aggr_mode != AGGR_GLOBAL) |
| 428 | return 0; |
| 429 | |
| 430 | if (!counter->snapshot) |
Arnaldo Carvalho de Melo | 12f5261 | 2020-04-29 15:47:38 -0300 | [diff] [blame] | 431 | evsel__compute_deltas(counter, -1, -1, aggr); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 432 | perf_counts_values__scale(aggr, config->scale, &counter->counts->scaled); |
| 433 | |
| 434 | for (i = 0; i < 3; i++) |
| 435 | update_stats(&ps->res_stats[i], count[i]); |
| 436 | |
Namhyung Kim | bb963e1 | 2017-02-17 17:17:38 +0900 | [diff] [blame] | 437 | if (verbose > 0) { |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 438 | fprintf(config->output, "%s: %" PRIu64 " %" PRIu64 " %" PRIu64 "\n", |
Arnaldo Carvalho de Melo | 8ab2e96 | 2020-04-29 16:07:09 -0300 | [diff] [blame] | 439 | evsel__name(counter), count[0], count[1], count[2]); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 440 | } |
| 441 | |
| 442 | /* |
| 443 | * Save the full runtime - to allow normalization during printout: |
| 444 | */ |
Jin Yao | 1fcd039 | 2017-12-05 22:03:04 +0800 | [diff] [blame] | 445 | perf_stat__update_shadow_stats(counter, *count, 0, &rt_stat); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 446 | |
| 447 | return 0; |
| 448 | } |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 449 | |
Jiri Olsa | 89f1688 | 2018-09-13 14:54:03 +0200 | [diff] [blame] | 450 | int perf_event__process_stat_event(struct perf_session *session, |
| 451 | union perf_event *event) |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 452 | { |
| 453 | struct perf_counts_values count; |
Jiri Olsa | 7293237 | 2019-08-28 15:57:16 +0200 | [diff] [blame] | 454 | struct perf_record_stat *st = &event->stat; |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 455 | struct evsel *counter; |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 456 | |
| 457 | count.val = st->val; |
| 458 | count.ena = st->ena; |
| 459 | count.run = st->run; |
| 460 | |
Arnaldo Carvalho de Melo | 3ccf8a7 | 2020-11-30 14:17:57 -0300 | [diff] [blame] | 461 | counter = evlist__id2evsel(session->evlist, st->id); |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 462 | if (!counter) { |
| 463 | pr_err("Failed to resolve counter for stat event.\n"); |
| 464 | return -EINVAL; |
| 465 | } |
| 466 | |
| 467 | *perf_counts(counter->counts, st->cpu, st->thread) = count; |
| 468 | counter->supported = true; |
| 469 | return 0; |
| 470 | } |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 471 | |
| 472 | size_t perf_event__fprintf_stat(union perf_event *event, FILE *fp) |
| 473 | { |
Jiri Olsa | 7293237 | 2019-08-28 15:57:16 +0200 | [diff] [blame] | 474 | struct perf_record_stat *st = (struct perf_record_stat *)event; |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 475 | size_t ret; |
| 476 | |
Jiri Olsa | 18a13a6 | 2019-08-28 15:57:10 +0200 | [diff] [blame] | 477 | ret = fprintf(fp, "\n... id %" PRI_lu64 ", cpu %d, thread %d\n", |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 478 | st->id, st->cpu, st->thread); |
Jiri Olsa | 18a13a6 | 2019-08-28 15:57:10 +0200 | [diff] [blame] | 479 | ret += fprintf(fp, "... value %" PRI_lu64 ", enabled %" PRI_lu64 ", running %" PRI_lu64 "\n", |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 480 | st->val, st->ena, st->run); |
| 481 | |
| 482 | return ret; |
| 483 | } |
| 484 | |
| 485 | size_t perf_event__fprintf_stat_round(union perf_event *event, FILE *fp) |
| 486 | { |
Jiri Olsa | 7293237 | 2019-08-28 15:57:16 +0200 | [diff] [blame] | 487 | struct perf_record_stat_round *rd = (struct perf_record_stat_round *)event; |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 488 | size_t ret; |
| 489 | |
Jiri Olsa | 782adbe | 2019-08-28 15:57:11 +0200 | [diff] [blame] | 490 | ret = fprintf(fp, "\n... time %" PRI_lu64 ", type %s\n", rd->time, |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 491 | rd->type == PERF_STAT_ROUND_TYPE__FINAL ? "FINAL" : "INTERVAL"); |
| 492 | |
| 493 | return ret; |
| 494 | } |
| 495 | |
| 496 | size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp) |
| 497 | { |
| 498 | struct perf_stat_config sc; |
| 499 | size_t ret; |
| 500 | |
| 501 | perf_event__read_stat_config(&sc, &event->stat_config); |
| 502 | |
| 503 | ret = fprintf(fp, "\n"); |
| 504 | ret += fprintf(fp, "... aggr_mode %d\n", sc.aggr_mode); |
| 505 | ret += fprintf(fp, "... scale %d\n", sc.scale); |
| 506 | ret += fprintf(fp, "... interval %u\n", sc.interval); |
| 507 | |
| 508 | return ret; |
| 509 | } |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 510 | |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 511 | int create_perf_stat_counter(struct evsel *evsel, |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 512 | struct perf_stat_config *config, |
Andi Kleen | 4804e01 | 2019-11-20 16:15:19 -0800 | [diff] [blame] | 513 | struct target *target, |
| 514 | int cpu) |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 515 | { |
Jiri Olsa | 1fc632c | 2019-07-21 13:24:29 +0200 | [diff] [blame] | 516 | struct perf_event_attr *attr = &evsel->core.attr; |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 517 | struct evsel *leader = evsel->leader; |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 518 | |
Andi Kleen | 75998bb | 2019-03-14 15:50:01 -0700 | [diff] [blame] | 519 | attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | |
| 520 | PERF_FORMAT_TOTAL_TIME_RUNNING; |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 521 | |
| 522 | /* |
| 523 | * The event is part of non trivial group, let's enable |
| 524 | * the group read (for leader) and ID retrieval for all |
| 525 | * members. |
| 526 | */ |
Jiri Olsa | 5643b1a | 2019-07-21 13:24:46 +0200 | [diff] [blame] | 527 | if (leader->core.nr_members > 1) |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 528 | attr->read_format |= PERF_FORMAT_ID|PERF_FORMAT_GROUP; |
| 529 | |
| 530 | attr->inherit = !config->no_inherit; |
| 531 | |
| 532 | /* |
| 533 | * Some events get initialized with sample_(period/type) set, |
| 534 | * like tracepoints. Clear it up for counting. |
| 535 | */ |
| 536 | attr->sample_period = 0; |
| 537 | |
| 538 | if (config->identifier) |
| 539 | attr->sample_type = PERF_SAMPLE_IDENTIFIER; |
| 540 | |
Jin Yao | dd07102 | 2019-10-11 13:05:45 +0800 | [diff] [blame] | 541 | if (config->all_user) { |
| 542 | attr->exclude_kernel = 1; |
| 543 | attr->exclude_user = 0; |
| 544 | } |
| 545 | |
| 546 | if (config->all_kernel) { |
| 547 | attr->exclude_kernel = 0; |
| 548 | attr->exclude_user = 1; |
| 549 | } |
| 550 | |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 551 | /* |
| 552 | * Disabling all counters initially, they will be enabled |
| 553 | * either manually by us or by kernel via enable_on_exec |
| 554 | * set later. |
| 555 | */ |
Arnaldo Carvalho de Melo | c754c38 | 2020-04-30 10:51:16 -0300 | [diff] [blame] | 556 | if (evsel__is_group_leader(evsel)) { |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 557 | attr->disabled = 1; |
| 558 | |
| 559 | /* |
| 560 | * In case of initial_delay we enable tracee |
| 561 | * events manually. |
| 562 | */ |
| 563 | if (target__none(target) && !config->initial_delay) |
| 564 | attr->enable_on_exec = 1; |
| 565 | } |
| 566 | |
| 567 | if (target__has_cpu(target) && !target__has_per_thread(target)) |
Arnaldo Carvalho de Melo | aa8c406 | 2020-04-29 16:21:03 -0300 | [diff] [blame] | 568 | return evsel__open_per_cpu(evsel, evsel__cpus(evsel), cpu); |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 569 | |
Arnaldo Carvalho de Melo | aa8c406 | 2020-04-29 16:21:03 -0300 | [diff] [blame] | 570 | return evsel__open_per_thread(evsel, evsel->core.threads); |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 571 | } |