Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
Arnaldo Carvalho de Melo | a43783a | 2017-04-18 10:46:11 -0300 | [diff] [blame] | 2 | #include <errno.h> |
Arnaldo Carvalho de Melo | fd20e81 | 2017-04-17 15:23:08 -0300 | [diff] [blame] | 3 | #include <inttypes.h> |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 4 | #include <math.h> |
Arnaldo Carvalho de Melo | f2a39fe | 2019-08-30 14:45:20 -0300 | [diff] [blame] | 5 | #include <string.h> |
Arnaldo Carvalho de Melo | bfc4918 | 2019-08-21 14:02:05 -0300 | [diff] [blame] | 6 | #include "counts.h" |
Arnaldo Carvalho de Melo | 87ffb6c | 2019-09-10 16:29:02 +0100 | [diff] [blame] | 7 | #include "cpumap.h" |
Arnaldo Carvalho de Melo | b420902 | 2019-08-29 15:56:40 -0300 | [diff] [blame] | 8 | #include "debug.h" |
Arnaldo Carvalho de Melo | f2a39fe | 2019-08-30 14:45:20 -0300 | [diff] [blame] | 9 | #include "header.h" |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 10 | #include "stat.h" |
Arnaldo Carvalho de Melo | f2a39fe | 2019-08-30 14:45:20 -0300 | [diff] [blame] | 11 | #include "session.h" |
Arnaldo Carvalho de Melo | aeb00b1 | 2019-08-22 15:40:29 -0300 | [diff] [blame] | 12 | #include "target.h" |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 13 | #include "evlist.h" |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 14 | #include "evsel.h" |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 15 | #include "thread_map.h" |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 16 | #include "hashmap.h" |
Arnaldo Carvalho de Melo | 7f7c536 | 2019-07-04 11:32:27 -0300 | [diff] [blame] | 17 | #include <linux/zalloc.h> |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 18 | |
| 19 | void update_stats(struct stats *stats, u64 val) |
| 20 | { |
| 21 | double delta; |
| 22 | |
| 23 | stats->n++; |
| 24 | delta = val - stats->mean; |
| 25 | stats->mean += delta / stats->n; |
| 26 | stats->M2 += delta*(val - stats->mean); |
David Ahern | ffe4f3c | 2013-08-02 14:05:40 -0600 | [diff] [blame] | 27 | |
| 28 | if (val > stats->max) |
| 29 | stats->max = val; |
| 30 | |
| 31 | if (val < stats->min) |
| 32 | stats->min = val; |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 33 | } |
| 34 | |
| 35 | double avg_stats(struct stats *stats) |
| 36 | { |
| 37 | return stats->mean; |
| 38 | } |
| 39 | |
| 40 | /* |
| 41 | * http://en.wikipedia.org/wiki/Algorithms_for_calculating_variance |
| 42 | * |
| 43 | * (\Sum n_i^2) - ((\Sum n_i)^2)/n |
| 44 | * s^2 = ------------------------------- |
| 45 | * n - 1 |
| 46 | * |
| 47 | * http://en.wikipedia.org/wiki/Stddev |
| 48 | * |
| 49 | * The std dev of the mean is related to the std dev by: |
| 50 | * |
| 51 | * s |
| 52 | * s_mean = ------- |
| 53 | * sqrt(n) |
| 54 | * |
| 55 | */ |
| 56 | double stddev_stats(struct stats *stats) |
| 57 | { |
| 58 | double variance, variance_mean; |
| 59 | |
David Ahern | 45528f7 | 2013-05-25 18:24:48 -0600 | [diff] [blame] | 60 | if (stats->n < 2) |
Xiao Guangrong | 0007ece | 2012-09-17 16:31:14 +0800 | [diff] [blame] | 61 | return 0.0; |
| 62 | |
| 63 | variance = stats->M2 / (stats->n - 1); |
| 64 | variance_mean = variance / stats->n; |
| 65 | |
| 66 | return sqrt(variance_mean); |
| 67 | } |
| 68 | |
/*
 * Express @stddev as a percentage of @avg.
 *
 * Returns 0.0 when @avg is zero, so the division is never performed
 * with a zero divisor.
 */
double rel_stddev_stats(double stddev, double avg)
{
	if (!avg)
		return 0.0;

	return 100.0 * stddev / avg;
}
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 78 | |
Arnaldo Carvalho de Melo | 9052034 | 2021-03-09 09:03:40 -0300 | [diff] [blame] | 79 | bool __perf_stat_evsel__is(struct evsel *evsel, enum perf_stat_evsel_id id) |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 80 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 81 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 82 | |
| 83 | return ps->id == id; |
| 84 | } |
| 85 | |
| 86 | #define ID(id, name) [PERF_STAT_EVSEL_ID__##id] = #name |
| 87 | static const char *id_str[PERF_STAT_EVSEL_ID__MAX] = { |
Jiri Olsa | 4c358d5 | 2015-06-03 16:25:52 +0200 | [diff] [blame] | 88 | ID(NONE, x), |
| 89 | ID(CYCLES_IN_TX, cpu/cycles-t/), |
| 90 | ID(TRANSACTION_START, cpu/tx-start/), |
| 91 | ID(ELISION_START, cpu/el-start/), |
| 92 | ID(CYCLES_IN_TX_CP, cpu/cycles-ct/), |
Andi Kleen | 239bd47 | 2016-05-24 12:52:37 -0700 | [diff] [blame] | 93 | ID(TOPDOWN_TOTAL_SLOTS, topdown-total-slots), |
| 94 | ID(TOPDOWN_SLOTS_ISSUED, topdown-slots-issued), |
| 95 | ID(TOPDOWN_SLOTS_RETIRED, topdown-slots-retired), |
| 96 | ID(TOPDOWN_FETCH_BUBBLES, topdown-fetch-bubbles), |
| 97 | ID(TOPDOWN_RECOVERY_BUBBLES, topdown-recovery-bubbles), |
Andi Kleen | 55c36a9 | 2020-09-11 07:48:07 -0700 | [diff] [blame] | 98 | ID(TOPDOWN_RETIRING, topdown-retiring), |
| 99 | ID(TOPDOWN_BAD_SPEC, topdown-bad-spec), |
| 100 | ID(TOPDOWN_FE_BOUND, topdown-fe-bound), |
| 101 | ID(TOPDOWN_BE_BOUND, topdown-be-bound), |
Kan Liang | 63e39aa | 2021-02-02 12:09:12 -0800 | [diff] [blame] | 102 | ID(TOPDOWN_HEAVY_OPS, topdown-heavy-ops), |
| 103 | ID(TOPDOWN_BR_MISPREDICT, topdown-br-mispredict), |
| 104 | ID(TOPDOWN_FETCH_LAT, topdown-fetch-lat), |
| 105 | ID(TOPDOWN_MEM_BOUND, topdown-mem-bound), |
Kan Liang | daefd0b | 2017-05-26 12:05:38 -0700 | [diff] [blame] | 106 | ID(SMI_NUM, msr/smi/), |
| 107 | ID(APERF, msr/aperf/), |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 108 | }; |
| 109 | #undef ID |
| 110 | |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 111 | static void perf_stat_evsel_id_init(struct evsel *evsel) |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 112 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 113 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 114 | int i; |
| 115 | |
| 116 | /* ps->id is 0 hence PERF_STAT_EVSEL_ID__NONE by default */ |
| 117 | |
| 118 | for (i = 0; i < PERF_STAT_EVSEL_ID__MAX; i++) { |
Arnaldo Carvalho de Melo | 8ab2e96 | 2020-04-29 16:07:09 -0300 | [diff] [blame] | 119 | if (!strcmp(evsel__name(evsel), id_str[i])) { |
Jiri Olsa | e2f56da | 2015-06-04 15:50:55 +0200 | [diff] [blame] | 120 | ps->id = i; |
| 121 | break; |
| 122 | } |
| 123 | } |
| 124 | } |
Jiri Olsa | a9a3a4d | 2015-06-14 10:19:26 +0200 | [diff] [blame] | 125 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 126 | static void evsel__reset_stat_priv(struct evsel *evsel) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 127 | { |
| 128 | int i; |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 129 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 130 | |
| 131 | for (i = 0; i < 3; i++) |
| 132 | init_stats(&ps->res_stats[i]); |
| 133 | |
| 134 | perf_stat_evsel_id_init(evsel); |
| 135 | } |
| 136 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 137 | static int evsel__alloc_stat_priv(struct evsel *evsel) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 138 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 139 | evsel->stats = zalloc(sizeof(struct perf_stat_evsel)); |
| 140 | if (evsel->stats == NULL) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 141 | return -ENOMEM; |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 142 | evsel__reset_stat_priv(evsel); |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 143 | return 0; |
| 144 | } |
| 145 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 146 | static void evsel__free_stat_priv(struct evsel *evsel) |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 147 | { |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 148 | struct perf_stat_evsel *ps = evsel->stats; |
Jiri Olsa | f7794d5 | 2017-07-26 14:02:05 +0200 | [diff] [blame] | 149 | |
| 150 | if (ps) |
Arnaldo Carvalho de Melo | d8f9da2 | 2019-07-04 12:06:20 -0300 | [diff] [blame] | 151 | zfree(&ps->group_data); |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 152 | zfree(&evsel->stats); |
Jiri Olsa | 9689edf | 2015-06-26 11:29:14 +0200 | [diff] [blame] | 153 | } |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 154 | |
Ian Rogers | 2ca0a37 | 2022-01-04 22:13:29 -0800 | [diff] [blame] | 155 | static int evsel__alloc_prev_raw_counts(struct evsel *evsel) |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 156 | { |
Ian Rogers | 2ca0a37 | 2022-01-04 22:13:29 -0800 | [diff] [blame] | 157 | int cpu_map_nr = evsel__nr_cpus(evsel); |
| 158 | int nthreads = perf_thread_map__nr(evsel->core.threads); |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 159 | struct perf_counts *counts; |
| 160 | |
Ian Rogers | 2ca0a37 | 2022-01-04 22:13:29 -0800 | [diff] [blame] | 161 | counts = perf_counts__new(cpu_map_nr, nthreads); |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 162 | if (counts) |
| 163 | evsel->prev_raw_counts = counts; |
| 164 | |
| 165 | return counts ? 0 : -ENOMEM; |
| 166 | } |
| 167 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 168 | static void evsel__free_prev_raw_counts(struct evsel *evsel) |
Jiri Olsa | a939512 | 2015-06-26 11:29:15 +0200 | [diff] [blame] | 169 | { |
| 170 | perf_counts__delete(evsel->prev_raw_counts); |
| 171 | evsel->prev_raw_counts = NULL; |
| 172 | } |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 173 | |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 174 | static void evsel__reset_prev_raw_counts(struct evsel *evsel) |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 175 | { |
Jin Yao | cf4d9bd | 2020-05-20 12:27:34 +0800 | [diff] [blame] | 176 | if (evsel->prev_raw_counts) |
| 177 | perf_counts__reset(evsel->prev_raw_counts); |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 178 | } |
| 179 | |
/*
 * Allocate everything stat processing needs for one evsel: the private
 * data, the counts and, when @alloc_raw is set, the prev_raw_counts.
 *
 * Returns 0 on success and -ENOMEM as soon as one step fails. Earlier
 * allocations are not undone here.
 */
static int evsel__alloc_stats(struct evsel *evsel, bool alloc_raw)
{
	if (evsel__alloc_stat_priv(evsel) < 0)
		return -ENOMEM;

	if (evsel__alloc_counts(evsel) < 0)
		return -ENOMEM;

	if (alloc_raw && evsel__alloc_prev_raw_counts(evsel) < 0)
		return -ENOMEM;

	return 0;
}
| 189 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 190 | int evlist__alloc_stats(struct evlist *evlist, bool alloc_raw) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 191 | { |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 192 | struct evsel *evsel; |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 193 | |
Arnaldo Carvalho de Melo | e5cadb9 | 2016-06-23 11:26:15 -0300 | [diff] [blame] | 194 | evlist__for_each_entry(evlist, evsel) { |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 195 | if (evsel__alloc_stats(evsel, alloc_raw)) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 196 | goto out_free; |
| 197 | } |
| 198 | |
| 199 | return 0; |
| 200 | |
| 201 | out_free: |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 202 | evlist__free_stats(evlist); |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 203 | return -1; |
| 204 | } |
| 205 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 206 | void evlist__free_stats(struct evlist *evlist) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 207 | { |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 208 | struct evsel *evsel; |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 209 | |
Arnaldo Carvalho de Melo | e5cadb9 | 2016-06-23 11:26:15 -0300 | [diff] [blame] | 210 | evlist__for_each_entry(evlist, evsel) { |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 211 | evsel__free_stat_priv(evsel); |
| 212 | evsel__free_counts(evsel); |
| 213 | evsel__free_prev_raw_counts(evsel); |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 214 | } |
| 215 | } |
| 216 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 217 | void evlist__reset_stats(struct evlist *evlist) |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 218 | { |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 219 | struct evsel *evsel; |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 220 | |
Arnaldo Carvalho de Melo | e5cadb9 | 2016-06-23 11:26:15 -0300 | [diff] [blame] | 221 | evlist__for_each_entry(evlist, evsel) { |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 222 | evsel__reset_stat_priv(evsel); |
| 223 | evsel__reset_counts(evsel); |
Jiri Olsa | 24e34f6 | 2015-06-26 11:29:16 +0200 | [diff] [blame] | 224 | } |
| 225 | } |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 226 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 227 | void evlist__reset_prev_raw_counts(struct evlist *evlist) |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 228 | { |
| 229 | struct evsel *evsel; |
| 230 | |
| 231 | evlist__for_each_entry(evlist, evsel) |
Arnaldo Carvalho de Melo | 7d1e239 | 2020-05-06 13:38:26 -0300 | [diff] [blame] | 232 | evsel__reset_prev_raw_counts(evsel); |
Srikar Dronamraju | b63fd11 | 2019-09-04 15:17:37 +0530 | [diff] [blame] | 233 | } |
| 234 | |
Arnaldo Carvalho de Melo | 5693302 | 2020-11-30 09:08:24 -0300 | [diff] [blame] | 235 | static void evsel__copy_prev_raw_counts(struct evsel *evsel) |
Jin Yao | 297767a | 2020-05-20 12:27:35 +0800 | [diff] [blame] | 236 | { |
| 237 | int ncpus = evsel__nr_cpus(evsel); |
| 238 | int nthreads = perf_thread_map__nr(evsel->core.threads); |
| 239 | |
| 240 | for (int thread = 0; thread < nthreads; thread++) { |
| 241 | for (int cpu = 0; cpu < ncpus; cpu++) { |
| 242 | *perf_counts(evsel->counts, cpu, thread) = |
| 243 | *perf_counts(evsel->prev_raw_counts, cpu, |
| 244 | thread); |
| 245 | } |
| 246 | } |
| 247 | |
| 248 | evsel->counts->aggr = evsel->prev_raw_counts->aggr; |
| 249 | } |
| 250 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 251 | void evlist__copy_prev_raw_counts(struct evlist *evlist) |
Jin Yao | 297767a | 2020-05-20 12:27:35 +0800 | [diff] [blame] | 252 | { |
| 253 | struct evsel *evsel; |
| 254 | |
| 255 | evlist__for_each_entry(evlist, evsel) |
Arnaldo Carvalho de Melo | 5693302 | 2020-11-30 09:08:24 -0300 | [diff] [blame] | 256 | evsel__copy_prev_raw_counts(evsel); |
Jin Yao | 297767a | 2020-05-20 12:27:35 +0800 | [diff] [blame] | 257 | } |
| 258 | |
Arnaldo Carvalho de Melo | 53f5e90 | 2020-11-30 09:31:04 -0300 | [diff] [blame] | 259 | void evlist__save_aggr_prev_raw_counts(struct evlist *evlist) |
Jin Yao | 905365f | 2020-05-20 12:27:36 +0800 | [diff] [blame] | 260 | { |
| 261 | struct evsel *evsel; |
| 262 | |
| 263 | /* |
| 264 | * To collect the overall statistics for interval mode, |
| 265 | * we copy the counts from evsel->prev_raw_counts to |
| 266 | * evsel->counts. The perf_stat_process_counter creates |
| 267 | * aggr values from per cpu values, but the per cpu values |
| 268 | * are 0 for AGGR_GLOBAL. So we use a trick that saves the |
| 269 | * previous aggr value to the first member of perf_counts, |
| 270 | * then aggr calculation in process_counter_values can work |
| 271 | * correctly. |
| 272 | */ |
| 273 | evlist__for_each_entry(evlist, evsel) { |
| 274 | *perf_counts(evsel->prev_raw_counts, 0, 0) = |
| 275 | evsel->prev_raw_counts->aggr; |
| 276 | } |
| 277 | } |
| 278 | |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 279 | static size_t pkg_id_hash(const void *__key, void *ctx __maybe_unused) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 280 | { |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 281 | uint64_t *key = (uint64_t *) __key; |
| 282 | |
| 283 | return *key & 0xffffffff; |
| 284 | } |
| 285 | |
| 286 | static bool pkg_id_equal(const void *__key1, const void *__key2, |
| 287 | void *ctx __maybe_unused) |
| 288 | { |
| 289 | uint64_t *key1 = (uint64_t *) __key1; |
| 290 | uint64_t *key2 = (uint64_t *) __key2; |
| 291 | |
| 292 | return *key1 == *key2; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 293 | } |
| 294 | |
Ian Rogers | 379c224 | 2022-01-04 22:13:44 -0800 | [diff] [blame] | 295 | static int check_per_pkg(struct evsel *counter, struct perf_counts_values *vals, |
| 296 | int cpu_map_idx, bool *skip) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 297 | { |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 298 | struct hashmap *mask = counter->per_pkg_mask; |
Jiri Olsa | b49aca3 | 2019-07-21 13:24:05 +0200 | [diff] [blame] | 299 | struct perf_cpu_map *cpus = evsel__cpus(counter); |
Ian Rogers | 6d18804 | 2022-01-04 22:13:51 -0800 | [diff] [blame^] | 300 | struct perf_cpu cpu = perf_cpu_map__cpu(cpus, cpu_map_idx); |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 301 | int s, d, ret = 0; |
| 302 | uint64_t *key; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 303 | |
| 304 | *skip = false; |
| 305 | |
| 306 | if (!counter->per_pkg) |
| 307 | return 0; |
| 308 | |
Jiri Olsa | 315c0a1 | 2019-08-22 13:11:39 +0200 | [diff] [blame] | 309 | if (perf_cpu_map__empty(cpus)) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 310 | return 0; |
| 311 | |
| 312 | if (!mask) { |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 313 | mask = hashmap__new(pkg_id_hash, pkg_id_equal, NULL); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 314 | if (!mask) |
| 315 | return -ENOMEM; |
| 316 | |
| 317 | counter->per_pkg_mask = mask; |
| 318 | } |
| 319 | |
Stephane Eranian | 02d8dab | 2015-09-03 15:23:40 +0200 | [diff] [blame] | 320 | /* |
| 321 | * we do not consider an event that has not run as a good |
| 322 | * instance to mark a package as used (skip=1). Otherwise |
| 323 | * we may run into a situation where the first CPU in a package |
| 324 | * is not running anything, yet the second is, and this function |
| 325 | * would mark the package as used after the first CPU and would |
| 326 | * not read the values from the second CPU. |
| 327 | */ |
| 328 | if (!(vals->run && vals->ena)) |
| 329 | return 0; |
| 330 | |
Ian Rogers | 4e90e5c | 2022-01-04 22:13:19 -0800 | [diff] [blame] | 331 | s = cpu__get_socket_id(cpu); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 332 | if (s < 0) |
| 333 | return -1; |
| 334 | |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 335 | /* |
| 336 | * On multi-die system, die_id > 0. On no-die system, die_id = 0. |
| 337 | * We use hashmap(socket, die) to check the used socket+die pair. |
| 338 | */ |
Ian Rogers | 4e90e5c | 2022-01-04 22:13:19 -0800 | [diff] [blame] | 339 | d = cpu__get_die_id(cpu); |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 340 | if (d < 0) |
| 341 | return -1; |
| 342 | |
| 343 | key = malloc(sizeof(*key)); |
| 344 | if (!key) |
| 345 | return -ENOMEM; |
| 346 | |
| 347 | *key = (uint64_t)d << 32 | s; |
Ian Rogers | f9e891e | 2022-01-04 22:13:26 -0800 | [diff] [blame] | 348 | if (hashmap__find(mask, (void *)key, NULL)) { |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 349 | *skip = true; |
Ian Rogers | f9e891e | 2022-01-04 22:13:26 -0800 | [diff] [blame] | 350 | free(key); |
| 351 | } else |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 352 | ret = hashmap__add(mask, (void *)key, (void *)1); |
| 353 | |
| 354 | return ret; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 355 | } |
| 356 | |
| 357 | static int |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 358 | process_counter_values(struct perf_stat_config *config, struct evsel *evsel, |
Ian Rogers | 5b1af93 | 2022-01-04 22:13:45 -0800 | [diff] [blame] | 359 | int cpu_map_idx, int thread, |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 360 | struct perf_counts_values *count) |
| 361 | { |
| 362 | struct perf_counts_values *aggr = &evsel->counts->aggr; |
| 363 | static struct perf_counts_values zero; |
| 364 | bool skip = false; |
| 365 | |
Ian Rogers | 5b1af93 | 2022-01-04 22:13:45 -0800 | [diff] [blame] | 366 | if (check_per_pkg(evsel, count, cpu_map_idx, &skip)) { |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 367 | pr_err("failed to read per-pkg counter\n"); |
| 368 | return -1; |
| 369 | } |
| 370 | |
| 371 | if (skip) |
| 372 | count = &zero; |
| 373 | |
| 374 | switch (config->aggr_mode) { |
| 375 | case AGGR_THREAD: |
| 376 | case AGGR_CORE: |
Kan Liang | db5742b | 2019-06-04 15:50:42 -0700 | [diff] [blame] | 377 | case AGGR_DIE: |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 378 | case AGGR_SOCKET: |
Jiri Olsa | 86895b4 | 2019-08-28 10:17:43 +0200 | [diff] [blame] | 379 | case AGGR_NODE: |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 380 | case AGGR_NONE: |
| 381 | if (!evsel->snapshot) |
Ian Rogers | 5b1af93 | 2022-01-04 22:13:45 -0800 | [diff] [blame] | 382 | evsel__compute_deltas(evsel, cpu_map_idx, thread, count); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 383 | perf_counts_values__scale(count, config->scale, NULL); |
Jin Yao | 4fc4d8d | 2019-04-12 21:59:49 +0800 | [diff] [blame] | 384 | if ((config->aggr_mode == AGGR_NONE) && (!evsel->percore)) { |
| 385 | perf_stat__update_shadow_stats(evsel, count->val, |
Ian Rogers | 5b1af93 | 2022-01-04 22:13:45 -0800 | [diff] [blame] | 386 | cpu_map_idx, &rt_stat); |
Jin Yao | 4fc4d8d | 2019-04-12 21:59:49 +0800 | [diff] [blame] | 387 | } |
| 388 | |
Jin Yao | 14e72a2 | 2017-12-05 22:03:08 +0800 | [diff] [blame] | 389 | if (config->aggr_mode == AGGR_THREAD) { |
| 390 | if (config->stats) |
| 391 | perf_stat__update_shadow_stats(evsel, |
| 392 | count->val, 0, &config->stats[thread]); |
| 393 | else |
| 394 | perf_stat__update_shadow_stats(evsel, |
| 395 | count->val, 0, &rt_stat); |
| 396 | } |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 397 | break; |
| 398 | case AGGR_GLOBAL: |
| 399 | aggr->val += count->val; |
Andi Kleen | 75998bb | 2019-03-14 15:50:01 -0700 | [diff] [blame] | 400 | aggr->ena += count->ena; |
| 401 | aggr->run += count->run; |
Jiri Olsa | 208df99 | 2015-10-16 12:41:04 +0200 | [diff] [blame] | 402 | case AGGR_UNSET: |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 403 | default: |
| 404 | break; |
| 405 | } |
| 406 | |
| 407 | return 0; |
| 408 | } |
| 409 | |
| 410 | static int process_counter_maps(struct perf_stat_config *config, |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 411 | struct evsel *counter) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 412 | { |
Jiri Olsa | a2f354e | 2019-08-22 13:11:41 +0200 | [diff] [blame] | 413 | int nthreads = perf_thread_map__nr(counter->core.threads); |
Arnaldo Carvalho de Melo | 5eb88f0 | 2020-04-29 15:45:09 -0300 | [diff] [blame] | 414 | int ncpus = evsel__nr_cpus(counter); |
Ian Rogers | 5b1af93 | 2022-01-04 22:13:45 -0800 | [diff] [blame] | 415 | int idx, thread; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 416 | |
Jiri Olsa | 648b5af | 2019-08-06 11:35:19 +0200 | [diff] [blame] | 417 | if (counter->core.system_wide) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 418 | nthreads = 1; |
| 419 | |
| 420 | for (thread = 0; thread < nthreads; thread++) { |
Ian Rogers | 5b1af93 | 2022-01-04 22:13:45 -0800 | [diff] [blame] | 421 | for (idx = 0; idx < ncpus; idx++) { |
| 422 | if (process_counter_values(config, counter, idx, thread, |
| 423 | perf_counts(counter->counts, idx, thread))) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 424 | return -1; |
| 425 | } |
| 426 | } |
| 427 | |
| 428 | return 0; |
| 429 | } |
| 430 | |
| 431 | int perf_stat_process_counter(struct perf_stat_config *config, |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 432 | struct evsel *counter) |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 433 | { |
| 434 | struct perf_counts_values *aggr = &counter->counts->aggr; |
Arnaldo Carvalho de Melo | e669e83 | 2017-10-26 14:22:34 -0300 | [diff] [blame] | 435 | struct perf_stat_evsel *ps = counter->stats; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 436 | u64 *count = counter->counts->aggr.values; |
| 437 | int i, ret; |
| 438 | |
| 439 | aggr->val = aggr->ena = aggr->run = 0; |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 440 | |
| 441 | if (counter->per_pkg) |
Jin Yao | 034f7ee | 2021-01-28 09:34:17 +0800 | [diff] [blame] | 442 | evsel__zero_per_pkg(counter); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 443 | |
| 444 | ret = process_counter_maps(config, counter); |
| 445 | if (ret) |
| 446 | return ret; |
| 447 | |
| 448 | if (config->aggr_mode != AGGR_GLOBAL) |
| 449 | return 0; |
| 450 | |
| 451 | if (!counter->snapshot) |
Arnaldo Carvalho de Melo | 12f5261 | 2020-04-29 15:47:38 -0300 | [diff] [blame] | 452 | evsel__compute_deltas(counter, -1, -1, aggr); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 453 | perf_counts_values__scale(aggr, config->scale, &counter->counts->scaled); |
| 454 | |
| 455 | for (i = 0; i < 3; i++) |
| 456 | update_stats(&ps->res_stats[i], count[i]); |
| 457 | |
Namhyung Kim | bb963e1 | 2017-02-17 17:17:38 +0900 | [diff] [blame] | 458 | if (verbose > 0) { |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 459 | fprintf(config->output, "%s: %" PRIu64 " %" PRIu64 " %" PRIu64 "\n", |
Arnaldo Carvalho de Melo | 8ab2e96 | 2020-04-29 16:07:09 -0300 | [diff] [blame] | 460 | evsel__name(counter), count[0], count[1], count[2]); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 461 | } |
| 462 | |
| 463 | /* |
| 464 | * Save the full runtime - to allow normalization during printout: |
| 465 | */ |
Jin Yao | 1fcd039 | 2017-12-05 22:03:04 +0800 | [diff] [blame] | 466 | perf_stat__update_shadow_stats(counter, *count, 0, &rt_stat); |
Jiri Olsa | f80010e | 2015-07-21 14:31:27 +0200 | [diff] [blame] | 467 | |
| 468 | return 0; |
| 469 | } |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 470 | |
Jiri Olsa | 89f1688 | 2018-09-13 14:54:03 +0200 | [diff] [blame] | 471 | int perf_event__process_stat_event(struct perf_session *session, |
| 472 | union perf_event *event) |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 473 | { |
| 474 | struct perf_counts_values count; |
Jiri Olsa | 7293237 | 2019-08-28 15:57:16 +0200 | [diff] [blame] | 475 | struct perf_record_stat *st = &event->stat; |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 476 | struct evsel *counter; |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 477 | |
| 478 | count.val = st->val; |
| 479 | count.ena = st->ena; |
| 480 | count.run = st->run; |
| 481 | |
Arnaldo Carvalho de Melo | 3ccf8a7 | 2020-11-30 14:17:57 -0300 | [diff] [blame] | 482 | counter = evlist__id2evsel(session->evlist, st->id); |
Jiri Olsa | 0ea0e35 | 2015-10-25 15:51:32 +0100 | [diff] [blame] | 483 | if (!counter) { |
| 484 | pr_err("Failed to resolve counter for stat event.\n"); |
| 485 | return -EINVAL; |
| 486 | } |
| 487 | |
| 488 | *perf_counts(counter->counts, st->cpu, st->thread) = count; |
| 489 | counter->supported = true; |
| 490 | return 0; |
| 491 | } |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 492 | |
| 493 | size_t perf_event__fprintf_stat(union perf_event *event, FILE *fp) |
| 494 | { |
Jiri Olsa | 7293237 | 2019-08-28 15:57:16 +0200 | [diff] [blame] | 495 | struct perf_record_stat *st = (struct perf_record_stat *)event; |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 496 | size_t ret; |
| 497 | |
Jiri Olsa | 18a13a6 | 2019-08-28 15:57:10 +0200 | [diff] [blame] | 498 | ret = fprintf(fp, "\n... id %" PRI_lu64 ", cpu %d, thread %d\n", |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 499 | st->id, st->cpu, st->thread); |
Jiri Olsa | 18a13a6 | 2019-08-28 15:57:10 +0200 | [diff] [blame] | 500 | ret += fprintf(fp, "... value %" PRI_lu64 ", enabled %" PRI_lu64 ", running %" PRI_lu64 "\n", |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 501 | st->val, st->ena, st->run); |
| 502 | |
| 503 | return ret; |
| 504 | } |
| 505 | |
| 506 | size_t perf_event__fprintf_stat_round(union perf_event *event, FILE *fp) |
| 507 | { |
Jiri Olsa | 7293237 | 2019-08-28 15:57:16 +0200 | [diff] [blame] | 508 | struct perf_record_stat_round *rd = (struct perf_record_stat_round *)event; |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 509 | size_t ret; |
| 510 | |
Jiri Olsa | 782adbe | 2019-08-28 15:57:11 +0200 | [diff] [blame] | 511 | ret = fprintf(fp, "\n... time %" PRI_lu64 ", type %s\n", rd->time, |
Jiri Olsa | e08a456 | 2015-10-25 15:51:35 +0100 | [diff] [blame] | 512 | rd->type == PERF_STAT_ROUND_TYPE__FINAL ? "FINAL" : "INTERVAL"); |
| 513 | |
| 514 | return ret; |
| 515 | } |
| 516 | |
| 517 | size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp) |
| 518 | { |
| 519 | struct perf_stat_config sc; |
| 520 | size_t ret; |
| 521 | |
| 522 | perf_event__read_stat_config(&sc, &event->stat_config); |
| 523 | |
| 524 | ret = fprintf(fp, "\n"); |
| 525 | ret += fprintf(fp, "... aggr_mode %d\n", sc.aggr_mode); |
| 526 | ret += fprintf(fp, "... scale %d\n", sc.scale); |
| 527 | ret += fprintf(fp, "... interval %u\n", sc.interval); |
| 528 | |
| 529 | return ret; |
| 530 | } |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 531 | |
Jiri Olsa | 32dcd02 | 2019-07-21 13:23:51 +0200 | [diff] [blame] | 532 | int create_perf_stat_counter(struct evsel *evsel, |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 533 | struct perf_stat_config *config, |
Andi Kleen | 4804e01 | 2019-11-20 16:15:19 -0800 | [diff] [blame] | 534 | struct target *target, |
Ian Rogers | 6f844b1 | 2022-01-04 22:13:42 -0800 | [diff] [blame] | 535 | int cpu_map_idx) |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 536 | { |
Jiri Olsa | 1fc632c | 2019-07-21 13:24:29 +0200 | [diff] [blame] | 537 | struct perf_event_attr *attr = &evsel->core.attr; |
Jiri Olsa | fba7c86 | 2021-07-06 17:17:00 +0200 | [diff] [blame] | 538 | struct evsel *leader = evsel__leader(evsel); |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 539 | |
Andi Kleen | 75998bb | 2019-03-14 15:50:01 -0700 | [diff] [blame] | 540 | attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | |
| 541 | PERF_FORMAT_TOTAL_TIME_RUNNING; |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 542 | |
| 543 | /* |
| 544 | * The event is part of non trivial group, let's enable |
| 545 | * the group read (for leader) and ID retrieval for all |
| 546 | * members. |
| 547 | */ |
Jiri Olsa | 5643b1a | 2019-07-21 13:24:46 +0200 | [diff] [blame] | 548 | if (leader->core.nr_members > 1) |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 549 | attr->read_format |= PERF_FORMAT_ID|PERF_FORMAT_GROUP; |
| 550 | |
Song Liu | fa853c4 | 2020-12-29 13:42:14 -0800 | [diff] [blame] | 551 | attr->inherit = !config->no_inherit && list_empty(&evsel->bpf_counter_list); |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 552 | |
| 553 | /* |
| 554 | * Some events get initialized with sample_(period/type) set, |
| 555 | * like tracepoints. Clear it up for counting. |
| 556 | */ |
| 557 | attr->sample_period = 0; |
| 558 | |
| 559 | if (config->identifier) |
| 560 | attr->sample_type = PERF_SAMPLE_IDENTIFIER; |
| 561 | |
Jin Yao | dd07102 | 2019-10-11 13:05:45 +0800 | [diff] [blame] | 562 | if (config->all_user) { |
| 563 | attr->exclude_kernel = 1; |
| 564 | attr->exclude_user = 0; |
| 565 | } |
| 566 | |
| 567 | if (config->all_kernel) { |
| 568 | attr->exclude_kernel = 0; |
| 569 | attr->exclude_user = 1; |
| 570 | } |
| 571 | |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 572 | /* |
| 573 | * Disabling all counters initially, they will be enabled |
| 574 | * either manually by us or by kernel via enable_on_exec |
| 575 | * set later. |
| 576 | */ |
Arnaldo Carvalho de Melo | c754c38 | 2020-04-30 10:51:16 -0300 | [diff] [blame] | 577 | if (evsel__is_group_leader(evsel)) { |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 578 | attr->disabled = 1; |
| 579 | |
| 580 | /* |
| 581 | * In case of initial_delay we enable tracee |
| 582 | * events manually. |
| 583 | */ |
| 584 | if (target__none(target) && !config->initial_delay) |
| 585 | attr->enable_on_exec = 1; |
| 586 | } |
| 587 | |
| 588 | if (target__has_cpu(target) && !target__has_per_thread(target)) |
Ian Rogers | 6f844b1 | 2022-01-04 22:13:42 -0800 | [diff] [blame] | 589 | return evsel__open_per_cpu(evsel, evsel__cpus(evsel), cpu_map_idx); |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 590 | |
Arnaldo Carvalho de Melo | aa8c406 | 2020-04-29 16:21:03 -0300 | [diff] [blame] | 591 | return evsel__open_per_thread(evsel, evsel->core.threads); |
Jiri Olsa | d09cefd | 2018-08-30 08:32:17 +0200 | [diff] [blame] | 592 | } |