1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0 2a43783aeSArnaldo Carvalho de Melo #include <errno.h> 3d73f5d14SLv Ruyi #include <linux/err.h> 4fd20e811SArnaldo Carvalho de Melo #include <inttypes.h> 50007eceaSXiao Guangrong #include <math.h> 6f2a39fe8SArnaldo Carvalho de Melo #include <string.h> 7bfc49182SArnaldo Carvalho de Melo #include "counts.h" 887ffb6c6SArnaldo Carvalho de Melo #include "cpumap.h" 9b4209025SArnaldo Carvalho de Melo #include "debug.h" 10f2a39fe8SArnaldo Carvalho de Melo #include "header.h" 110007eceaSXiao Guangrong #include "stat.h" 12f2a39fe8SArnaldo Carvalho de Melo #include "session.h" 13aeb00b1aSArnaldo Carvalho de Melo #include "target.h" 1424e34f68SJiri Olsa #include "evlist.h" 15e2f56da1SJiri Olsa #include "evsel.h" 1624e34f68SJiri Olsa #include "thread_map.h" 17bdf45725SIan Rogers #ifdef HAVE_LIBBPF_SUPPORT 18bdf45725SIan Rogers #include <bpf/hashmap.h> 19bdf45725SIan Rogers #else 20bdf45725SIan Rogers #include "util/hashmap.h" 21bdf45725SIan Rogers #endif 227f7c536fSArnaldo Carvalho de Melo #include <linux/zalloc.h> 230007eceaSXiao Guangrong 240007eceaSXiao Guangrong void update_stats(struct stats *stats, u64 val) 250007eceaSXiao Guangrong { 260007eceaSXiao Guangrong double delta; 270007eceaSXiao Guangrong 280007eceaSXiao Guangrong stats->n++; 290007eceaSXiao Guangrong delta = val - stats->mean; 300007eceaSXiao Guangrong stats->mean += delta / stats->n; 310007eceaSXiao Guangrong stats->M2 += delta*(val - stats->mean); 32ffe4f3c0SDavid Ahern 33ffe4f3c0SDavid Ahern if (val > stats->max) 34ffe4f3c0SDavid Ahern stats->max = val; 35ffe4f3c0SDavid Ahern 36ffe4f3c0SDavid Ahern if (val < stats->min) 37ffe4f3c0SDavid Ahern stats->min = val; 380007eceaSXiao Guangrong } 390007eceaSXiao Guangrong 400007eceaSXiao Guangrong double avg_stats(struct stats *stats) 410007eceaSXiao Guangrong { 420007eceaSXiao Guangrong return stats->mean; 430007eceaSXiao Guangrong } 440007eceaSXiao Guangrong 450007eceaSXiao Guangrong /* 460007eceaSXiao Guangrong * http://en.wikipedia.org/wiki/Algorithms_for_calculating_variance 470007eceaSXiao Guangrong * 480007eceaSXiao Guangrong * (\Sum n_i^2) - ((\Sum n_i)^2)/n 490007eceaSXiao Guangrong * s^2 = ------------------------------- 500007eceaSXiao Guangrong * n - 1 510007eceaSXiao Guangrong * 520007eceaSXiao Guangrong * http://en.wikipedia.org/wiki/Stddev 530007eceaSXiao Guangrong * 540007eceaSXiao Guangrong * The std dev of the mean is related to the std dev by: 550007eceaSXiao Guangrong * 560007eceaSXiao Guangrong * s 570007eceaSXiao Guangrong * s_mean = ------- 580007eceaSXiao Guangrong * sqrt(n) 590007eceaSXiao Guangrong * 600007eceaSXiao Guangrong */ 610007eceaSXiao Guangrong double stddev_stats(struct stats *stats) 620007eceaSXiao Guangrong { 630007eceaSXiao Guangrong double variance, variance_mean; 640007eceaSXiao Guangrong 6545528f7cSDavid Ahern if (stats->n < 2) 660007eceaSXiao Guangrong return 0.0; 670007eceaSXiao Guangrong 680007eceaSXiao Guangrong variance = stats->M2 / (stats->n - 1); 690007eceaSXiao Guangrong variance_mean = variance / stats->n; 700007eceaSXiao Guangrong 710007eceaSXiao Guangrong return sqrt(variance_mean); 720007eceaSXiao Guangrong } 730007eceaSXiao Guangrong 740007eceaSXiao Guangrong double rel_stddev_stats(double stddev, double avg) 750007eceaSXiao Guangrong { 760007eceaSXiao Guangrong double pct = 0.0; 770007eceaSXiao Guangrong 780007eceaSXiao Guangrong if (avg) 790007eceaSXiao Guangrong pct = 100.0 * stddev/avg; 800007eceaSXiao Guangrong 810007eceaSXiao Guangrong return pct; 820007eceaSXiao Guangrong } 83e2f56da1SJiri Olsa 8490520341SArnaldo Carvalho de Melo bool __perf_stat_evsel__is(struct evsel *evsel, enum perf_stat_evsel_id id) 85e2f56da1SJiri Olsa { 86e669e833SArnaldo Carvalho de Melo struct perf_stat_evsel *ps = evsel->stats; 87e2f56da1SJiri Olsa 88e2f56da1SJiri Olsa return ps->id == id; 89e2f56da1SJiri Olsa } 90e2f56da1SJiri Olsa 91e2f56da1SJiri Olsa #define ID(id, name) [PERF_STAT_EVSEL_ID__##id] = #name 92e2f56da1SJiri Olsa static const char *id_str[PERF_STAT_EVSEL_ID__MAX] = { 93e2f56da1SJiri Olsa ID(NONE, x), 944c358d5cSJiri Olsa ID(CYCLES_IN_TX, cpu/cycles-t/), 954c358d5cSJiri Olsa ID(TRANSACTION_START, cpu/tx-start/), 964c358d5cSJiri Olsa ID(ELISION_START, cpu/el-start/), 974c358d5cSJiri Olsa ID(CYCLES_IN_TX_CP, cpu/cycles-ct/), 98239bd47fSAndi Kleen ID(TOPDOWN_TOTAL_SLOTS, topdown-total-slots), 99239bd47fSAndi Kleen ID(TOPDOWN_SLOTS_ISSUED, topdown-slots-issued), 100239bd47fSAndi Kleen ID(TOPDOWN_SLOTS_RETIRED, topdown-slots-retired), 101239bd47fSAndi Kleen ID(TOPDOWN_FETCH_BUBBLES, topdown-fetch-bubbles), 102239bd47fSAndi Kleen ID(TOPDOWN_RECOVERY_BUBBLES, topdown-recovery-bubbles), 10355c36a9fSAndi Kleen ID(TOPDOWN_RETIRING, topdown-retiring), 10455c36a9fSAndi Kleen ID(TOPDOWN_BAD_SPEC, topdown-bad-spec), 10555c36a9fSAndi Kleen ID(TOPDOWN_FE_BOUND, topdown-fe-bound), 10655c36a9fSAndi Kleen ID(TOPDOWN_BE_BOUND, topdown-be-bound), 10763e39aa6SKan Liang ID(TOPDOWN_HEAVY_OPS, topdown-heavy-ops), 10863e39aa6SKan Liang ID(TOPDOWN_BR_MISPREDICT, topdown-br-mispredict), 10963e39aa6SKan Liang ID(TOPDOWN_FETCH_LAT, topdown-fetch-lat), 11063e39aa6SKan Liang ID(TOPDOWN_MEM_BOUND, topdown-mem-bound), 111daefd0bcSKan Liang ID(SMI_NUM, msr/smi/), 112daefd0bcSKan Liang ID(APERF, msr/aperf/), 113e2f56da1SJiri Olsa }; 114e2f56da1SJiri Olsa #undef ID 115e2f56da1SJiri Olsa 11632dcd021SJiri Olsa static void perf_stat_evsel_id_init(struct evsel *evsel) 117e2f56da1SJiri Olsa { 118e669e833SArnaldo Carvalho de Melo struct perf_stat_evsel *ps = evsel->stats; 119e2f56da1SJiri Olsa int i; 120e2f56da1SJiri Olsa 121e2f56da1SJiri Olsa /* ps->id is 0 hence PERF_STAT_EVSEL_ID__NONE by default */ 122e2f56da1SJiri Olsa 123e2f56da1SJiri Olsa for (i = 0; i < PERF_STAT_EVSEL_ID__MAX; i++) { 124d7e3c397SZhengjun Xing if (!strcmp(evsel__name(evsel), id_str[i]) || 125d7e3c397SZhengjun Xing (strstr(evsel__name(evsel), id_str[i]) && evsel->pmu_name 126d7e3c397SZhengjun Xing && strstr(evsel__name(evsel), evsel->pmu_name))) { 127e2f56da1SJiri Olsa ps->id = i; 128e2f56da1SJiri Olsa break; 129e2f56da1SJiri Olsa } 130e2f56da1SJiri Olsa } 131e2f56da1SJiri Olsa } 132a9a3a4d9SJiri Olsa 133*8f97963eSNamhyung Kim static void evsel__reset_aggr_stats(struct evsel *evsel) 1349689edfaSJiri Olsa { 135e669e833SArnaldo Carvalho de Melo struct perf_stat_evsel *ps = evsel->stats; 136ca68b374SNamhyung Kim struct perf_stat_aggr *aggr = ps->aggr; 1379689edfaSJiri Olsa 138ca68b374SNamhyung Kim if (aggr) 139ca68b374SNamhyung Kim memset(aggr, 0, sizeof(*aggr) * ps->nr_aggr); 1409689edfaSJiri Olsa } 1419689edfaSJiri Olsa 142*8f97963eSNamhyung Kim static void evsel__reset_stat_priv(struct evsel *evsel) 143*8f97963eSNamhyung Kim { 144*8f97963eSNamhyung Kim struct perf_stat_evsel *ps = evsel->stats; 145*8f97963eSNamhyung Kim 146*8f97963eSNamhyung Kim init_stats(&ps->res_stats); 147*8f97963eSNamhyung Kim evsel__reset_aggr_stats(evsel); 148*8f97963eSNamhyung Kim } 149*8f97963eSNamhyung Kim 150ae7e6492SNamhyung Kim static int evsel__alloc_aggr_stats(struct evsel *evsel, int nr_aggr) 151ae7e6492SNamhyung Kim { 152ae7e6492SNamhyung Kim struct perf_stat_evsel *ps = evsel->stats; 153ae7e6492SNamhyung Kim 154ae7e6492SNamhyung Kim if (ps == NULL) 155ae7e6492SNamhyung Kim return 0; 156ae7e6492SNamhyung Kim 157ae7e6492SNamhyung Kim ps->nr_aggr = nr_aggr; 158ae7e6492SNamhyung Kim ps->aggr = calloc(nr_aggr, sizeof(*ps->aggr)); 159ae7e6492SNamhyung Kim if (ps->aggr == NULL) 160ae7e6492SNamhyung Kim return -ENOMEM; 161ae7e6492SNamhyung Kim 162ae7e6492SNamhyung Kim return 0; 163ae7e6492SNamhyung Kim } 164ae7e6492SNamhyung Kim 165ae7e6492SNamhyung Kim int evlist__alloc_aggr_stats(struct evlist *evlist, int nr_aggr) 166ae7e6492SNamhyung Kim { 167ae7e6492SNamhyung Kim struct evsel *evsel; 168ae7e6492SNamhyung Kim 169ae7e6492SNamhyung Kim evlist__for_each_entry(evlist, evsel) { 170ae7e6492SNamhyung Kim if (evsel__alloc_aggr_stats(evsel, nr_aggr) < 0) 171ae7e6492SNamhyung Kim return -1; 172ae7e6492SNamhyung Kim } 173ae7e6492SNamhyung Kim return 0; 174ae7e6492SNamhyung Kim } 175ca68b374SNamhyung Kim 176ca68b374SNamhyung Kim static int evsel__alloc_stat_priv(struct evsel *evsel, int nr_aggr) 1779689edfaSJiri Olsa { 178ca68b374SNamhyung Kim struct perf_stat_evsel *ps; 179ca68b374SNamhyung Kim 180ca68b374SNamhyung Kim ps = zalloc(sizeof(*ps)); 181ca68b374SNamhyung Kim if (ps == NULL) 1829689edfaSJiri Olsa return -ENOMEM; 183ca68b374SNamhyung Kim 184ae7e6492SNamhyung Kim evsel->stats = ps; 185ae7e6492SNamhyung Kim 186ae7e6492SNamhyung Kim if (nr_aggr && evsel__alloc_aggr_stats(evsel, nr_aggr) < 0) { 187ae7e6492SNamhyung Kim evsel->stats = NULL; 188ca68b374SNamhyung Kim free(ps); 189ca68b374SNamhyung Kim return -ENOMEM; 190ca68b374SNamhyung Kim } 191ca68b374SNamhyung Kim 192429b8e84SNamhyung Kim perf_stat_evsel_id_init(evsel); 1937d1e239eSArnaldo Carvalho de Melo evsel__reset_stat_priv(evsel); 1949689edfaSJiri Olsa return 0; 1959689edfaSJiri Olsa } 1969689edfaSJiri Olsa 1977d1e239eSArnaldo Carvalho de Melo static void evsel__free_stat_priv(struct evsel *evsel) 1989689edfaSJiri Olsa { 199e669e833SArnaldo Carvalho de Melo struct perf_stat_evsel *ps = evsel->stats; 200f7794d52SJiri Olsa 201ca68b374SNamhyung Kim if (ps) { 202ca68b374SNamhyung Kim zfree(&ps->aggr); 203d8f9da24SArnaldo Carvalho de Melo zfree(&ps->group_data); 204ca68b374SNamhyung Kim } 205e669e833SArnaldo Carvalho de Melo zfree(&evsel->stats); 2069689edfaSJiri Olsa } 207a939512dSJiri Olsa 2082ca0a371SIan Rogers static int evsel__alloc_prev_raw_counts(struct evsel *evsel) 209a939512dSJiri Olsa { 2102ca0a371SIan Rogers int cpu_map_nr = evsel__nr_cpus(evsel); 2112ca0a371SIan Rogers int nthreads = perf_thread_map__nr(evsel->core.threads); 212a939512dSJiri Olsa struct perf_counts *counts; 213a939512dSJiri Olsa 2142ca0a371SIan Rogers counts = perf_counts__new(cpu_map_nr, nthreads); 215a939512dSJiri Olsa if (counts) 216a939512dSJiri Olsa evsel->prev_raw_counts = counts; 217a939512dSJiri Olsa 218a939512dSJiri Olsa return counts ? 0 : -ENOMEM; 219a939512dSJiri Olsa } 220a939512dSJiri Olsa 2217d1e239eSArnaldo Carvalho de Melo static void evsel__free_prev_raw_counts(struct evsel *evsel) 222a939512dSJiri Olsa { 223a939512dSJiri Olsa perf_counts__delete(evsel->prev_raw_counts); 224a939512dSJiri Olsa evsel->prev_raw_counts = NULL; 225a939512dSJiri Olsa } 22624e34f68SJiri Olsa 2277d1e239eSArnaldo Carvalho de Melo static void evsel__reset_prev_raw_counts(struct evsel *evsel) 228b63fd11cSSrikar Dronamraju { 229cf4d9bd6SJin Yao if (evsel->prev_raw_counts) 230cf4d9bd6SJin Yao perf_counts__reset(evsel->prev_raw_counts); 231b63fd11cSSrikar Dronamraju } 232b63fd11cSSrikar Dronamraju 233ca68b374SNamhyung Kim static int evsel__alloc_stats(struct evsel *evsel, int nr_aggr, bool alloc_raw) 23424e34f68SJiri Olsa { 235ca68b374SNamhyung Kim if (evsel__alloc_stat_priv(evsel, nr_aggr) < 0 || 2362ca0a371SIan Rogers evsel__alloc_counts(evsel) < 0 || 2372ca0a371SIan Rogers (alloc_raw && evsel__alloc_prev_raw_counts(evsel) < 0)) 238a7d0a102SJiri Olsa return -ENOMEM; 239a7d0a102SJiri Olsa 240a7d0a102SJiri Olsa return 0; 241a7d0a102SJiri Olsa } 242a7d0a102SJiri Olsa 2431f297a6eSNamhyung Kim int evlist__alloc_stats(struct perf_stat_config *config, 2441f297a6eSNamhyung Kim struct evlist *evlist, bool alloc_raw) 245a7d0a102SJiri Olsa { 24632dcd021SJiri Olsa struct evsel *evsel; 2471f297a6eSNamhyung Kim int nr_aggr = 0; 2481f297a6eSNamhyung Kim 2491f297a6eSNamhyung Kim if (config && config->aggr_map) 2501f297a6eSNamhyung Kim nr_aggr = config->aggr_map->nr; 251a7d0a102SJiri Olsa 252e5cadb93SArnaldo Carvalho de Melo evlist__for_each_entry(evlist, evsel) { 2531f297a6eSNamhyung Kim if (evsel__alloc_stats(evsel, nr_aggr, alloc_raw)) 25424e34f68SJiri Olsa goto out_free; 25524e34f68SJiri Olsa } 25624e34f68SJiri Olsa 25724e34f68SJiri Olsa return 0; 25824e34f68SJiri Olsa 25924e34f68SJiri Olsa out_free: 26053f5e908SArnaldo Carvalho de Melo evlist__free_stats(evlist); 26124e34f68SJiri Olsa return -1; 26224e34f68SJiri Olsa } 26324e34f68SJiri Olsa 26453f5e908SArnaldo Carvalho de Melo void evlist__free_stats(struct evlist *evlist) 26524e34f68SJiri Olsa { 26632dcd021SJiri Olsa struct evsel *evsel; 26724e34f68SJiri Olsa 268e5cadb93SArnaldo Carvalho de Melo evlist__for_each_entry(evlist, evsel) { 2697d1e239eSArnaldo Carvalho de Melo evsel__free_stat_priv(evsel); 2707d1e239eSArnaldo Carvalho de Melo evsel__free_counts(evsel); 2717d1e239eSArnaldo Carvalho de Melo evsel__free_prev_raw_counts(evsel); 27224e34f68SJiri Olsa } 27324e34f68SJiri Olsa } 27424e34f68SJiri Olsa 27553f5e908SArnaldo Carvalho de Melo void evlist__reset_stats(struct evlist *evlist) 27624e34f68SJiri Olsa { 27732dcd021SJiri Olsa struct evsel *evsel; 27824e34f68SJiri Olsa 279e5cadb93SArnaldo Carvalho de Melo evlist__for_each_entry(evlist, evsel) { 2807d1e239eSArnaldo Carvalho de Melo evsel__reset_stat_priv(evsel); 2817d1e239eSArnaldo Carvalho de Melo evsel__reset_counts(evsel); 28224e34f68SJiri Olsa } 28324e34f68SJiri Olsa } 284f80010ebSJiri Olsa 285*8f97963eSNamhyung Kim void evlist__reset_aggr_stats(struct evlist *evlist) 286*8f97963eSNamhyung Kim { 287*8f97963eSNamhyung Kim struct evsel *evsel; 288*8f97963eSNamhyung Kim 289*8f97963eSNamhyung Kim evlist__for_each_entry(evlist, evsel) 290*8f97963eSNamhyung Kim evsel__reset_aggr_stats(evsel); 291*8f97963eSNamhyung Kim } 292*8f97963eSNamhyung Kim 29353f5e908SArnaldo Carvalho de Melo void evlist__reset_prev_raw_counts(struct evlist *evlist) 294b63fd11cSSrikar Dronamraju { 295b63fd11cSSrikar Dronamraju struct evsel *evsel; 296b63fd11cSSrikar Dronamraju 297b63fd11cSSrikar Dronamraju evlist__for_each_entry(evlist, evsel) 2987d1e239eSArnaldo Carvalho de Melo evsel__reset_prev_raw_counts(evsel); 299b63fd11cSSrikar Dronamraju } 300b63fd11cSSrikar Dronamraju 30156933029SArnaldo Carvalho de Melo static void evsel__copy_prev_raw_counts(struct evsel *evsel) 302297767acSJin Yao { 3030b9462d0SIan Rogers int idx, nthreads = perf_thread_map__nr(evsel->core.threads); 304297767acSJin Yao 305297767acSJin Yao for (int thread = 0; thread < nthreads; thread++) { 3060b9462d0SIan Rogers perf_cpu_map__for_each_idx(idx, evsel__cpus(evsel)) { 3070b9462d0SIan Rogers *perf_counts(evsel->counts, idx, thread) = 3080b9462d0SIan Rogers *perf_counts(evsel->prev_raw_counts, idx, thread); 309297767acSJin Yao } 310297767acSJin Yao } 311297767acSJin Yao 312297767acSJin Yao evsel->counts->aggr = evsel->prev_raw_counts->aggr; 313297767acSJin Yao } 314297767acSJin Yao 31553f5e908SArnaldo Carvalho de Melo void evlist__copy_prev_raw_counts(struct evlist *evlist) 316297767acSJin Yao { 317297767acSJin Yao struct evsel *evsel; 318297767acSJin Yao 319297767acSJin Yao evlist__for_each_entry(evlist, evsel) 32056933029SArnaldo Carvalho de Melo evsel__copy_prev_raw_counts(evsel); 321297767acSJin Yao } 322297767acSJin Yao 32353f5e908SArnaldo Carvalho de Melo void evlist__save_aggr_prev_raw_counts(struct evlist *evlist) 324905365f4SJin Yao { 325905365f4SJin Yao struct evsel *evsel; 326905365f4SJin Yao 327905365f4SJin Yao /* 328905365f4SJin Yao * To collect the overall statistics for interval mode, 329905365f4SJin Yao * we copy the counts from evsel->prev_raw_counts to 330905365f4SJin Yao * evsel->counts. The perf_stat_process_counter creates 331905365f4SJin Yao * aggr values from per cpu values, but the per cpu values 332905365f4SJin Yao * are 0 for AGGR_GLOBAL. So we use a trick that saves the 333905365f4SJin Yao * previous aggr value to the first member of perf_counts, 334905365f4SJin Yao * then aggr calculation in process_counter_values can work 335905365f4SJin Yao * correctly. 336905365f4SJin Yao */ 337905365f4SJin Yao evlist__for_each_entry(evlist, evsel) { 338905365f4SJin Yao *perf_counts(evsel->prev_raw_counts, 0, 0) = 339905365f4SJin Yao evsel->prev_raw_counts->aggr; 340905365f4SJin Yao } 341905365f4SJin Yao } 342905365f4SJin Yao 343034f7ee1SJin Yao static size_t pkg_id_hash(const void *__key, void *ctx __maybe_unused) 344f80010ebSJiri Olsa { 345034f7ee1SJin Yao uint64_t *key = (uint64_t *) __key; 346034f7ee1SJin Yao 347034f7ee1SJin Yao return *key & 0xffffffff; 348034f7ee1SJin Yao } 349034f7ee1SJin Yao 350034f7ee1SJin Yao static bool pkg_id_equal(const void *__key1, const void *__key2, 351034f7ee1SJin Yao void *ctx __maybe_unused) 352034f7ee1SJin Yao { 353034f7ee1SJin Yao uint64_t *key1 = (uint64_t *) __key1; 354034f7ee1SJin Yao uint64_t *key2 = (uint64_t *) __key2; 355034f7ee1SJin Yao 356034f7ee1SJin Yao return *key1 == *key2; 357f80010ebSJiri Olsa } 358f80010ebSJiri Olsa 359379c224bSIan Rogers static int check_per_pkg(struct evsel *counter, struct perf_counts_values *vals, 360379c224bSIan Rogers int cpu_map_idx, bool *skip) 361f80010ebSJiri Olsa { 362034f7ee1SJin Yao struct hashmap *mask = counter->per_pkg_mask; 363b49aca3eSJiri Olsa struct perf_cpu_map *cpus = evsel__cpus(counter); 3646d18804bSIan Rogers struct perf_cpu cpu = perf_cpu_map__cpu(cpus, cpu_map_idx); 365034f7ee1SJin Yao int s, d, ret = 0; 366034f7ee1SJin Yao uint64_t *key; 367f80010ebSJiri Olsa 368f80010ebSJiri Olsa *skip = false; 369f80010ebSJiri Olsa 370f80010ebSJiri Olsa if (!counter->per_pkg) 371f80010ebSJiri Olsa return 0; 372f80010ebSJiri Olsa 373315c0a1fSJiri Olsa if (perf_cpu_map__empty(cpus)) 374f80010ebSJiri Olsa return 0; 375f80010ebSJiri Olsa 376f80010ebSJiri Olsa if (!mask) { 377034f7ee1SJin Yao mask = hashmap__new(pkg_id_hash, pkg_id_equal, NULL); 378d73f5d14SLv Ruyi if (IS_ERR(mask)) 379f80010ebSJiri Olsa return -ENOMEM; 380f80010ebSJiri Olsa 381f80010ebSJiri Olsa counter->per_pkg_mask = mask; 382f80010ebSJiri Olsa } 383f80010ebSJiri Olsa 38402d8dabcSStephane Eranian /* 38502d8dabcSStephane Eranian * we do not consider an event that has not run as a good 38602d8dabcSStephane Eranian * instance to mark a package as used (skip=1). Otherwise 38702d8dabcSStephane Eranian * we may run into a situation where the first CPU in a package 38802d8dabcSStephane Eranian * is not running anything, yet the second is, and this function 38902d8dabcSStephane Eranian * would mark the package as used after the first CPU and would 39002d8dabcSStephane Eranian * not read the values from the second CPU. 39102d8dabcSStephane Eranian */ 39202d8dabcSStephane Eranian if (!(vals->run && vals->ena)) 39302d8dabcSStephane Eranian return 0; 39402d8dabcSStephane Eranian 3954e90e5ccSIan Rogers s = cpu__get_socket_id(cpu); 396f80010ebSJiri Olsa if (s < 0) 397f80010ebSJiri Olsa return -1; 398f80010ebSJiri Olsa 399034f7ee1SJin Yao /* 400034f7ee1SJin Yao * On multi-die system, die_id > 0. On no-die system, die_id = 0. 401034f7ee1SJin Yao * We use hashmap(socket, die) to check the used socket+die pair. 402034f7ee1SJin Yao */ 4034e90e5ccSIan Rogers d = cpu__get_die_id(cpu); 404034f7ee1SJin Yao if (d < 0) 405034f7ee1SJin Yao return -1; 406034f7ee1SJin Yao 407034f7ee1SJin Yao key = malloc(sizeof(*key)); 408034f7ee1SJin Yao if (!key) 409034f7ee1SJin Yao return -ENOMEM; 410034f7ee1SJin Yao 411034f7ee1SJin Yao *key = (uint64_t)d << 32 | s; 412f9e891eaSIan Rogers if (hashmap__find(mask, (void *)key, NULL)) { 413034f7ee1SJin Yao *skip = true; 414f9e891eaSIan Rogers free(key); 415f9e891eaSIan Rogers } else 416034f7ee1SJin Yao ret = hashmap__add(mask, (void *)key, (void *)1); 417034f7ee1SJin Yao 418034f7ee1SJin Yao return ret; 419f80010ebSJiri Olsa } 420f80010ebSJiri Olsa 421049aba09SNamhyung Kim static bool evsel__count_has_error(struct evsel *evsel, 422049aba09SNamhyung Kim struct perf_counts_values *count, 423049aba09SNamhyung Kim struct perf_stat_config *config) 424049aba09SNamhyung Kim { 425049aba09SNamhyung Kim /* the evsel was failed already */ 426049aba09SNamhyung Kim if (evsel->err || evsel->counts->scaled == -1) 427049aba09SNamhyung Kim return true; 428049aba09SNamhyung Kim 429049aba09SNamhyung Kim /* this is meaningful for CPU aggregation modes only */ 430049aba09SNamhyung Kim if (config->aggr_mode == AGGR_GLOBAL) 431049aba09SNamhyung Kim return false; 432049aba09SNamhyung Kim 433049aba09SNamhyung Kim /* it's considered ok when it actually ran */ 434049aba09SNamhyung Kim if (count->ena != 0 && count->run != 0) 435049aba09SNamhyung Kim return false; 436049aba09SNamhyung Kim 437049aba09SNamhyung Kim return true; 438049aba09SNamhyung Kim } 439049aba09SNamhyung Kim 440f80010ebSJiri Olsa static int 44132dcd021SJiri Olsa process_counter_values(struct perf_stat_config *config, struct evsel *evsel, 4425b1af93dSIan Rogers int cpu_map_idx, int thread, 443f80010ebSJiri Olsa struct perf_counts_values *count) 444f80010ebSJiri Olsa { 445f80010ebSJiri Olsa struct perf_counts_values *aggr = &evsel->counts->aggr; 446f976bc6bSNamhyung Kim struct perf_stat_evsel *ps = evsel->stats; 447f80010ebSJiri Olsa static struct perf_counts_values zero; 448f80010ebSJiri Olsa bool skip = false; 449f80010ebSJiri Olsa 4505b1af93dSIan Rogers if (check_per_pkg(evsel, count, cpu_map_idx, &skip)) { 451f80010ebSJiri Olsa pr_err("failed to read per-pkg counter\n"); 452f80010ebSJiri Olsa return -1; 453f80010ebSJiri Olsa } 454f80010ebSJiri Olsa 455f80010ebSJiri Olsa if (skip) 456f80010ebSJiri Olsa count = &zero; 457f80010ebSJiri Olsa 458f976bc6bSNamhyung Kim if (!evsel->snapshot) 459f976bc6bSNamhyung Kim evsel__compute_deltas(evsel, cpu_map_idx, thread, count); 460f976bc6bSNamhyung Kim perf_counts_values__scale(count, config->scale, NULL); 461f976bc6bSNamhyung Kim 462050059e1SNamhyung Kim if (config->aggr_mode == AGGR_THREAD) { 463050059e1SNamhyung Kim struct perf_counts_values *aggr_counts = &ps->aggr[thread].counts; 464050059e1SNamhyung Kim 465050059e1SNamhyung Kim /* 466050059e1SNamhyung Kim * Skip value 0 when enabling --per-thread globally, 467050059e1SNamhyung Kim * otherwise too many 0 output. 468050059e1SNamhyung Kim */ 469050059e1SNamhyung Kim if (count->val == 0 && config->system_wide) 470050059e1SNamhyung Kim return 0; 471050059e1SNamhyung Kim 472050059e1SNamhyung Kim ps->aggr[thread].nr++; 473050059e1SNamhyung Kim 474050059e1SNamhyung Kim aggr_counts->val += count->val; 475050059e1SNamhyung Kim aggr_counts->ena += count->ena; 476050059e1SNamhyung Kim aggr_counts->run += count->run; 477050059e1SNamhyung Kim goto update; 478050059e1SNamhyung Kim } 479050059e1SNamhyung Kim 480f976bc6bSNamhyung Kim if (ps->aggr) { 481f976bc6bSNamhyung Kim struct perf_cpu cpu = perf_cpu_map__cpu(evsel->core.cpus, cpu_map_idx); 482f976bc6bSNamhyung Kim struct aggr_cpu_id aggr_id = config->aggr_get_id(config, cpu); 483f976bc6bSNamhyung Kim struct perf_stat_aggr *ps_aggr; 484f976bc6bSNamhyung Kim int i; 485f976bc6bSNamhyung Kim 486f976bc6bSNamhyung Kim for (i = 0; i < ps->nr_aggr; i++) { 487f976bc6bSNamhyung Kim if (!aggr_cpu_id__equal(&aggr_id, &config->aggr_map->map[i])) 488f976bc6bSNamhyung Kim continue; 489f976bc6bSNamhyung Kim 490f976bc6bSNamhyung Kim ps_aggr = &ps->aggr[i]; 491f976bc6bSNamhyung Kim ps_aggr->nr++; 492f976bc6bSNamhyung Kim 493f976bc6bSNamhyung Kim /* 494050059e1SNamhyung Kim * When any result is bad, make them all to give consistent output 495050059e1SNamhyung Kim * in interval mode. But per-task counters can have 0 enabled time 496050059e1SNamhyung Kim * when some tasks are idle. 497f976bc6bSNamhyung Kim */ 498049aba09SNamhyung Kim if (evsel__count_has_error(evsel, count, config) && !ps_aggr->failed) { 499f976bc6bSNamhyung Kim ps_aggr->counts.val = 0; 500f976bc6bSNamhyung Kim ps_aggr->counts.ena = 0; 501f976bc6bSNamhyung Kim ps_aggr->counts.run = 0; 502f976bc6bSNamhyung Kim ps_aggr->failed = true; 503f976bc6bSNamhyung Kim } 504f976bc6bSNamhyung Kim 505f976bc6bSNamhyung Kim if (!ps_aggr->failed) { 506f976bc6bSNamhyung Kim ps_aggr->counts.val += count->val; 507f976bc6bSNamhyung Kim ps_aggr->counts.ena += count->ena; 508f976bc6bSNamhyung Kim ps_aggr->counts.run += count->run; 509f976bc6bSNamhyung Kim } 510f976bc6bSNamhyung Kim break; 511f976bc6bSNamhyung Kim } 512f976bc6bSNamhyung Kim } 513f976bc6bSNamhyung Kim 514050059e1SNamhyung Kim update: 515f80010ebSJiri Olsa switch (config->aggr_mode) { 516f80010ebSJiri Olsa case AGGR_THREAD: 517f80010ebSJiri Olsa case AGGR_CORE: 518db5742b6SKan Liang case AGGR_DIE: 519f80010ebSJiri Olsa case AGGR_SOCKET: 52086895b48SJiri Olsa case AGGR_NODE: 521f80010ebSJiri Olsa case AGGR_NONE: 5224fc4d8dfSJin Yao if ((config->aggr_mode == AGGR_NONE) && (!evsel->percore)) { 5234fc4d8dfSJin Yao perf_stat__update_shadow_stats(evsel, count->val, 5245b1af93dSIan Rogers cpu_map_idx, &rt_stat); 5254fc4d8dfSJin Yao } 5264fc4d8dfSJin Yao 52714e72a21SJin Yao if (config->aggr_mode == AGGR_THREAD) { 52887ae87fdSNamhyung Kim perf_stat__update_shadow_stats(evsel, count->val, 52987ae87fdSNamhyung Kim thread, &rt_stat); 53014e72a21SJin Yao } 531f80010ebSJiri Olsa break; 532f80010ebSJiri Olsa case AGGR_GLOBAL: 533f80010ebSJiri Olsa aggr->val += count->val; 534f80010ebSJiri Olsa aggr->ena += count->ena; 535f80010ebSJiri Olsa aggr->run += count->run; 536208df99eSJiri Olsa case AGGR_UNSET: 537df936cadSClaire Jensen case AGGR_MAX: 538f80010ebSJiri Olsa default: 539f80010ebSJiri Olsa break; 540f80010ebSJiri Olsa } 541f80010ebSJiri Olsa 542f80010ebSJiri Olsa return 0; 543f80010ebSJiri Olsa } 544f80010ebSJiri Olsa 545f80010ebSJiri Olsa static int process_counter_maps(struct perf_stat_config *config, 54632dcd021SJiri Olsa struct evsel *counter) 547f80010ebSJiri Olsa { 548a2f354e3SJiri Olsa int nthreads = perf_thread_map__nr(counter->core.threads); 5495eb88f04SArnaldo Carvalho de Melo int ncpus = evsel__nr_cpus(counter); 5505b1af93dSIan Rogers int idx, thread; 551f80010ebSJiri Olsa 552f80010ebSJiri Olsa for (thread = 0; thread < nthreads; thread++) { 5535b1af93dSIan Rogers for (idx = 0; idx < ncpus; idx++) { 5545b1af93dSIan Rogers if (process_counter_values(config, counter, idx, thread, 5555b1af93dSIan Rogers perf_counts(counter->counts, idx, thread))) 556f80010ebSJiri Olsa return -1; 557f80010ebSJiri Olsa } 558f80010ebSJiri Olsa } 559f80010ebSJiri Olsa 560f80010ebSJiri Olsa return 0; 561f80010ebSJiri Olsa } 562f80010ebSJiri Olsa 563f80010ebSJiri Olsa int perf_stat_process_counter(struct perf_stat_config *config, 56432dcd021SJiri Olsa struct evsel *counter) 565f80010ebSJiri Olsa { 566f80010ebSJiri Olsa struct perf_counts_values *aggr = &counter->counts->aggr; 567e669e833SArnaldo Carvalho de Melo struct perf_stat_evsel *ps = counter->stats; 568f80010ebSJiri Olsa u64 *count = counter->counts->aggr.values; 56966b76e30SNamhyung Kim int ret; 570f80010ebSJiri Olsa 571f80010ebSJiri Olsa aggr->val = aggr->ena = aggr->run = 0; 572f80010ebSJiri Olsa 573f80010ebSJiri Olsa if (counter->per_pkg) 574034f7ee1SJin Yao evsel__zero_per_pkg(counter); 575f80010ebSJiri Olsa 576f80010ebSJiri Olsa ret = process_counter_maps(config, counter); 577f80010ebSJiri Olsa if (ret) 578f80010ebSJiri Olsa return ret; 579f80010ebSJiri Olsa 580f80010ebSJiri Olsa if (config->aggr_mode != AGGR_GLOBAL) 581f80010ebSJiri Olsa return 0; 582f80010ebSJiri Olsa 58366b76e30SNamhyung Kim update_stats(&ps->res_stats, *count); 584f80010ebSJiri Olsa 585bb963e16SNamhyung Kim if (verbose > 0) { 586f80010ebSJiri Olsa fprintf(config->output, "%s: %" PRIu64 " %" PRIu64 " %" PRIu64 "\n", 5878ab2e96dSArnaldo Carvalho de Melo evsel__name(counter), count[0], count[1], count[2]); 588f80010ebSJiri Olsa } 589f80010ebSJiri Olsa 590f80010ebSJiri Olsa /* 591f80010ebSJiri Olsa * Save the full runtime - to allow normalization during printout: 592f80010ebSJiri Olsa */ 5931fcd0394SJin Yao perf_stat__update_shadow_stats(counter, *count, 0, &rt_stat); 594f80010ebSJiri Olsa 595f80010ebSJiri Olsa return 0; 596f80010ebSJiri Olsa } 5970ea0e355SJiri Olsa 59889f1688aSJiri Olsa int perf_event__process_stat_event(struct perf_session *session, 59989f1688aSJiri Olsa union perf_event *event) 6000ea0e355SJiri Olsa { 60192d579eaSIan Rogers struct perf_counts_values count, *ptr; 60272932371SJiri Olsa struct perf_record_stat *st = &event->stat; 60332dcd021SJiri Olsa struct evsel *counter; 60492d579eaSIan Rogers int cpu_map_idx; 6050ea0e355SJiri Olsa 6060ea0e355SJiri Olsa count.val = st->val; 6070ea0e355SJiri Olsa count.ena = st->ena; 6080ea0e355SJiri Olsa count.run = st->run; 6090ea0e355SJiri Olsa 6103ccf8a7bSArnaldo Carvalho de Melo counter = evlist__id2evsel(session->evlist, st->id); 6110ea0e355SJiri Olsa if (!counter) { 6120ea0e355SJiri Olsa pr_err("Failed to resolve counter for stat event.\n"); 6130ea0e355SJiri Olsa return -EINVAL; 6140ea0e355SJiri Olsa } 61592d579eaSIan Rogers cpu_map_idx = perf_cpu_map__idx(evsel__cpus(counter), (struct perf_cpu){.cpu = st->cpu}); 61692d579eaSIan Rogers if (cpu_map_idx == -1) { 61792d579eaSIan Rogers pr_err("Invalid CPU %d for event %s.\n", st->cpu, evsel__name(counter)); 61892d579eaSIan Rogers return -EINVAL; 61992d579eaSIan Rogers } 62092d579eaSIan Rogers ptr = perf_counts(counter->counts, cpu_map_idx, st->thread); 62192d579eaSIan Rogers if (ptr == NULL) { 62292d579eaSIan Rogers pr_err("Failed to find perf count for CPU %d thread %d on event %s.\n", 62392d579eaSIan Rogers st->cpu, st->thread, evsel__name(counter)); 62492d579eaSIan Rogers return -EINVAL; 62592d579eaSIan Rogers } 62692d579eaSIan Rogers *ptr = count; 6270ea0e355SJiri Olsa counter->supported = true; 6280ea0e355SJiri Olsa return 0; 6290ea0e355SJiri Olsa } 630e08a4564SJiri Olsa 631e08a4564SJiri Olsa size_t perf_event__fprintf_stat(union perf_event *event, FILE *fp) 632e08a4564SJiri Olsa { 63372932371SJiri Olsa struct perf_record_stat *st = (struct perf_record_stat *)event; 634e08a4564SJiri Olsa size_t ret; 635e08a4564SJiri Olsa 63618a13a60SJiri Olsa ret = fprintf(fp, "\n... id %" PRI_lu64 ", cpu %d, thread %d\n", 637e08a4564SJiri Olsa st->id, st->cpu, st->thread); 63818a13a60SJiri Olsa ret += fprintf(fp, "... value %" PRI_lu64 ", enabled %" PRI_lu64 ", running %" PRI_lu64 "\n", 639e08a4564SJiri Olsa st->val, st->ena, st->run); 640e08a4564SJiri Olsa 641e08a4564SJiri Olsa return ret; 642e08a4564SJiri Olsa } 643e08a4564SJiri Olsa 644e08a4564SJiri Olsa size_t perf_event__fprintf_stat_round(union perf_event *event, FILE *fp) 645e08a4564SJiri Olsa { 64672932371SJiri Olsa struct perf_record_stat_round *rd = (struct perf_record_stat_round *)event; 647e08a4564SJiri Olsa size_t ret; 648e08a4564SJiri Olsa 649782adbe2SJiri Olsa ret = fprintf(fp, "\n... time %" PRI_lu64 ", type %s\n", rd->time, 650e08a4564SJiri Olsa rd->type == PERF_STAT_ROUND_TYPE__FINAL ? "FINAL" : "INTERVAL"); 651e08a4564SJiri Olsa 652e08a4564SJiri Olsa return ret; 653e08a4564SJiri Olsa } 654e08a4564SJiri Olsa 655e08a4564SJiri Olsa size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp) 656e08a4564SJiri Olsa { 657e08a4564SJiri Olsa struct perf_stat_config sc; 658e08a4564SJiri Olsa size_t ret; 659e08a4564SJiri Olsa 660e08a4564SJiri Olsa perf_event__read_stat_config(&sc, &event->stat_config); 661e08a4564SJiri Olsa 662e08a4564SJiri Olsa ret = fprintf(fp, "\n"); 663e08a4564SJiri Olsa ret += fprintf(fp, "... aggr_mode %d\n", sc.aggr_mode); 664e08a4564SJiri Olsa ret += fprintf(fp, "... scale %d\n", sc.scale); 665e08a4564SJiri Olsa ret += fprintf(fp, "... interval %u\n", sc.interval); 666e08a4564SJiri Olsa 667e08a4564SJiri Olsa return ret; 668e08a4564SJiri Olsa } 669d09cefd2SJiri Olsa 67032dcd021SJiri Olsa int create_perf_stat_counter(struct evsel *evsel, 671d09cefd2SJiri Olsa struct perf_stat_config *config, 6724804e011SAndi Kleen struct target *target, 6736f844b1fSIan Rogers int cpu_map_idx) 674d09cefd2SJiri Olsa { 6751fc632ceSJiri Olsa struct perf_event_attr *attr = &evsel->core.attr; 676fba7c866SJiri Olsa struct evsel *leader = evsel__leader(evsel); 677d09cefd2SJiri Olsa 678d09cefd2SJiri Olsa attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | 679d09cefd2SJiri Olsa PERF_FORMAT_TOTAL_TIME_RUNNING; 680d09cefd2SJiri Olsa 681d09cefd2SJiri Olsa /* 682d09cefd2SJiri Olsa * The event is part of non trivial group, let's enable 683d09cefd2SJiri Olsa * the group read (for leader) and ID retrieval for all 684d09cefd2SJiri Olsa * members. 685d09cefd2SJiri Olsa */ 6865643b1a5SJiri Olsa if (leader->core.nr_members > 1) 687d09cefd2SJiri Olsa attr->read_format |= PERF_FORMAT_ID|PERF_FORMAT_GROUP; 688d09cefd2SJiri Olsa 689fa853c4bSSong Liu attr->inherit = !config->no_inherit && list_empty(&evsel->bpf_counter_list); 690d09cefd2SJiri Olsa 691d09cefd2SJiri Olsa /* 692d09cefd2SJiri Olsa * Some events get initialized with sample_(period/type) set, 693d09cefd2SJiri Olsa * like tracepoints. Clear it up for counting. 694d09cefd2SJiri Olsa */ 695d09cefd2SJiri Olsa attr->sample_period = 0; 696d09cefd2SJiri Olsa 697d09cefd2SJiri Olsa if (config->identifier) 698d09cefd2SJiri Olsa attr->sample_type = PERF_SAMPLE_IDENTIFIER; 699d09cefd2SJiri Olsa 700dd071024SJin Yao if (config->all_user) { 701dd071024SJin Yao attr->exclude_kernel = 1; 702dd071024SJin Yao attr->exclude_user = 0; 703dd071024SJin Yao } 704dd071024SJin Yao 705dd071024SJin Yao if (config->all_kernel) { 706dd071024SJin Yao attr->exclude_kernel = 0; 707dd071024SJin Yao attr->exclude_user = 1; 708dd071024SJin Yao } 709dd071024SJin Yao 710d09cefd2SJiri Olsa /* 711d09cefd2SJiri Olsa * Disabling all counters initially, they will be enabled 712d09cefd2SJiri Olsa * either manually by us or by kernel via enable_on_exec 713d09cefd2SJiri Olsa * set later. 714d09cefd2SJiri Olsa */ 715c754c382SArnaldo Carvalho de Melo if (evsel__is_group_leader(evsel)) { 716d09cefd2SJiri Olsa attr->disabled = 1; 717d09cefd2SJiri Olsa 718d09cefd2SJiri Olsa /* 719d09cefd2SJiri Olsa * In case of initial_delay we enable tracee 720d09cefd2SJiri Olsa * events manually. 721d09cefd2SJiri Olsa */ 722d09cefd2SJiri Olsa if (target__none(target) && !config->initial_delay) 723d09cefd2SJiri Olsa attr->enable_on_exec = 1; 724d09cefd2SJiri Olsa } 725d09cefd2SJiri Olsa 726d09cefd2SJiri Olsa if (target__has_cpu(target) && !target__has_per_thread(target)) 7276f844b1fSIan Rogers return evsel__open_per_cpu(evsel, evsel__cpus(evsel), cpu_map_idx); 728d09cefd2SJiri Olsa 729aa8c406bSArnaldo Carvalho de Melo return evsel__open_per_thread(evsel, evsel->core.threads); 730d09cefd2SJiri Olsa } 731