1103a8feaSLen Brown /* 2103a8feaSLen Brown * turbostat -- show CPU frequency and C-state residency 3103a8feaSLen Brown * on modern Intel turbo-capable processors. 4103a8feaSLen Brown * 5144b44b1SLen Brown * Copyright (c) 2013 Intel Corporation. 6103a8feaSLen Brown * Len Brown <len.brown@intel.com> 7103a8feaSLen Brown * 8103a8feaSLen Brown * This program is free software; you can redistribute it and/or modify it 9103a8feaSLen Brown * under the terms and conditions of the GNU General Public License, 10103a8feaSLen Brown * version 2, as published by the Free Software Foundation. 11103a8feaSLen Brown * 12103a8feaSLen Brown * This program is distributed in the hope it will be useful, but WITHOUT 13103a8feaSLen Brown * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 14103a8feaSLen Brown * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 15103a8feaSLen Brown * more details. 16103a8feaSLen Brown * 17103a8feaSLen Brown * You should have received a copy of the GNU General Public License along with 18103a8feaSLen Brown * this program; if not, write to the Free Software Foundation, Inc., 19103a8feaSLen Brown * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA. 20103a8feaSLen Brown */ 21103a8feaSLen Brown 2288c3281fSLen Brown #define _GNU_SOURCE 23b731f311SJosh Triplett #include MSRHEADER 2495aebc44SJosh Triplett #include <stdarg.h> 25103a8feaSLen Brown #include <stdio.h> 26b2c95d90SJosh Triplett #include <err.h> 27103a8feaSLen Brown #include <unistd.h> 28103a8feaSLen Brown #include <sys/types.h> 29103a8feaSLen Brown #include <sys/wait.h> 30103a8feaSLen Brown #include <sys/stat.h> 31103a8feaSLen Brown #include <sys/resource.h> 32103a8feaSLen Brown #include <fcntl.h> 33103a8feaSLen Brown #include <signal.h> 34103a8feaSLen Brown #include <sys/time.h> 35103a8feaSLen Brown #include <stdlib.h> 36d8af6f5fSLen Brown #include <getopt.h> 37103a8feaSLen Brown #include <dirent.h> 38103a8feaSLen Brown #include <string.h> 39103a8feaSLen Brown #include <ctype.h> 4088c3281fSLen Brown #include <sched.h> 412b92865eSJosh Triplett #include <cpuid.h> 4298481e79SLen Brown #include <linux/capability.h> 4398481e79SLen Brown #include <errno.h> 44103a8feaSLen Brown 45103a8feaSLen Brown char *proc_stat = "/proc/stat"; 46d8af6f5fSLen Brown unsigned int interval_sec = 5; 47d8af6f5fSLen Brown unsigned int debug; 48d8af6f5fSLen Brown unsigned int rapl_joules; 49d8af6f5fSLen Brown unsigned int summary_only; 50d8af6f5fSLen Brown unsigned int dump_only; 51103a8feaSLen Brown unsigned int skip_c0; 52103a8feaSLen Brown unsigned int skip_c1; 53103a8feaSLen Brown unsigned int do_nhm_cstates; 54103a8feaSLen Brown unsigned int do_snb_cstates; 55ee7e38e3SLen Brown unsigned int do_pc2; 56ee7e38e3SLen Brown unsigned int do_pc3; 57ee7e38e3SLen Brown unsigned int do_pc6; 58ee7e38e3SLen Brown unsigned int do_pc7; 59ca58710fSKristen Carlson Accardi unsigned int do_c8_c9_c10; 60*0b2bb692SLen Brown unsigned int do_skl_residency; 61144b44b1SLen Brown unsigned int do_slm_cstates; 62144b44b1SLen Brown unsigned int use_c1_residency_msr; 63103a8feaSLen Brown unsigned int has_aperf; 64889facbeSLen Brown unsigned int has_epb; 65fc04cc67SLen Brown unsigned int units = 1000000; /* MHz etc */ 66103a8feaSLen Brown unsigned int genuine_intel; 67103a8feaSLen Brown unsigned int has_invariant_tsc; 68d7899447SLen Brown unsigned int do_nhm_platform_info; 692f32edf1SLen Brown unsigned int extra_msr_offset32; 702f32edf1SLen Brown unsigned int extra_msr_offset64; 718e180f3cSLen Brown unsigned int extra_delta_offset32; 728e180f3cSLen Brown unsigned int extra_delta_offset64; 731ed51011SLen Brown int do_smi; 74103a8feaSLen Brown double bclk; 75103a8feaSLen Brown unsigned int show_pkg; 76103a8feaSLen Brown unsigned int show_core; 77103a8feaSLen Brown unsigned int show_cpu; 78c98d5d94SLen Brown unsigned int show_pkg_only; 79c98d5d94SLen Brown unsigned int show_core_only; 80c98d5d94SLen Brown char *output_buffer, *outp; 81889facbeSLen Brown unsigned int do_rapl; 82889facbeSLen Brown unsigned int do_dts; 83889facbeSLen Brown unsigned int do_ptm; 84889facbeSLen Brown unsigned int tcc_activation_temp; 85889facbeSLen Brown unsigned int tcc_activation_temp_override; 86889facbeSLen Brown double rapl_power_units, rapl_energy_units, rapl_time_units; 87889facbeSLen Brown double rapl_joule_counter_range; 883a9a941dSLen Brown unsigned int do_core_perf_limit_reasons; 893a9a941dSLen Brown unsigned int do_gfx_perf_limit_reasons; 903a9a941dSLen Brown unsigned int do_ring_perf_limit_reasons; 91889facbeSLen Brown 92889facbeSLen Brown #define RAPL_PKG (1 << 0) 93e6f9bb3cSLen Brown /* 0x610 MSR_PKG_POWER_LIMIT */ 94e6f9bb3cSLen Brown /* 0x611 MSR_PKG_ENERGY_STATUS */ 95e6f9bb3cSLen Brown #define RAPL_PKG_PERF_STATUS (1 << 1) 96e6f9bb3cSLen Brown /* 0x613 MSR_PKG_PERF_STATUS */ 97e6f9bb3cSLen Brown #define RAPL_PKG_POWER_INFO (1 << 2) 98e6f9bb3cSLen Brown /* 0x614 MSR_PKG_POWER_INFO */ 99e6f9bb3cSLen Brown 100889facbeSLen Brown #define RAPL_DRAM (1 << 3) 101e6f9bb3cSLen Brown /* 0x618 MSR_DRAM_POWER_LIMIT */ 102e6f9bb3cSLen Brown /* 0x619 MSR_DRAM_ENERGY_STATUS */ 103e6f9bb3cSLen Brown #define RAPL_DRAM_PERF_STATUS (1 << 4) 104e6f9bb3cSLen Brown /* 0x61b MSR_DRAM_PERF_STATUS */ 105*0b2bb692SLen Brown #define RAPL_DRAM_POWER_INFO (1 << 5) 106*0b2bb692SLen Brown /* 0x61c MSR_DRAM_POWER_INFO */ 107e6f9bb3cSLen Brown 108*0b2bb692SLen Brown #define RAPL_CORES (1 << 6) 109e6f9bb3cSLen Brown /* 0x638 MSR_PP0_POWER_LIMIT */ 110e6f9bb3cSLen Brown /* 0x639 MSR_PP0_ENERGY_STATUS */ 111*0b2bb692SLen Brown #define RAPL_CORE_POLICY (1 << 7) 112e6f9bb3cSLen Brown /* 0x63a MSR_PP0_POLICY */ 113e6f9bb3cSLen Brown 114*0b2bb692SLen Brown #define RAPL_GFX (1 << 8) 115e6f9bb3cSLen Brown /* 0x640 MSR_PP1_POWER_LIMIT */ 116e6f9bb3cSLen Brown /* 0x641 MSR_PP1_ENERGY_STATUS */ 117e6f9bb3cSLen Brown /* 0x642 MSR_PP1_POLICY */ 118889facbeSLen Brown #define TJMAX_DEFAULT 100 119889facbeSLen Brown 120889facbeSLen Brown #define MAX(a, b) ((a) > (b) ? (a) : (b)) 121103a8feaSLen Brown 122103a8feaSLen Brown int aperf_mperf_unstable; 123103a8feaSLen Brown int backwards_count; 124103a8feaSLen Brown char *progname; 125103a8feaSLen Brown 126c98d5d94SLen Brown cpu_set_t *cpu_present_set, *cpu_affinity_set; 127c98d5d94SLen Brown size_t cpu_present_setsize, cpu_affinity_setsize; 128c98d5d94SLen Brown 129c98d5d94SLen Brown struct thread_data { 130c98d5d94SLen Brown unsigned long long tsc; 131c98d5d94SLen Brown unsigned long long aperf; 132c98d5d94SLen Brown unsigned long long mperf; 133144b44b1SLen Brown unsigned long long c1; 1342f32edf1SLen Brown unsigned long long extra_msr64; 1358e180f3cSLen Brown unsigned long long extra_delta64; 1368e180f3cSLen Brown unsigned long long extra_msr32; 1378e180f3cSLen Brown unsigned long long extra_delta32; 1381ed51011SLen Brown unsigned int smi_count; 139c98d5d94SLen Brown unsigned int cpu_id; 140c98d5d94SLen Brown unsigned int flags; 141c98d5d94SLen Brown #define CPU_IS_FIRST_THREAD_IN_CORE 0x2 142c98d5d94SLen Brown #define CPU_IS_FIRST_CORE_IN_PACKAGE 0x4 143c98d5d94SLen Brown } *thread_even, *thread_odd; 144c98d5d94SLen Brown 145c98d5d94SLen Brown struct core_data { 146c98d5d94SLen Brown unsigned long long c3; 147c98d5d94SLen Brown unsigned long long c6; 148c98d5d94SLen Brown unsigned long long c7; 149889facbeSLen Brown unsigned int core_temp_c; 150c98d5d94SLen Brown unsigned int core_id; 151c98d5d94SLen Brown } *core_even, *core_odd; 152c98d5d94SLen Brown 153c98d5d94SLen Brown struct pkg_data { 154c98d5d94SLen Brown unsigned long long pc2; 155c98d5d94SLen Brown unsigned long long pc3; 156c98d5d94SLen Brown unsigned long long pc6; 157c98d5d94SLen Brown unsigned long long pc7; 158ca58710fSKristen Carlson Accardi unsigned long long pc8; 159ca58710fSKristen Carlson Accardi unsigned long long pc9; 160ca58710fSKristen Carlson Accardi unsigned long long pc10; 161*0b2bb692SLen Brown unsigned long long pkg_wtd_core_c0; 162*0b2bb692SLen Brown unsigned long long pkg_any_core_c0; 163*0b2bb692SLen Brown unsigned long long pkg_any_gfxe_c0; 164*0b2bb692SLen Brown unsigned long long pkg_both_core_gfxe_c0; 165c98d5d94SLen Brown unsigned int package_id; 166889facbeSLen Brown unsigned int energy_pkg; /* MSR_PKG_ENERGY_STATUS */ 167889facbeSLen Brown unsigned int energy_dram; /* MSR_DRAM_ENERGY_STATUS */ 168889facbeSLen Brown unsigned int energy_cores; /* MSR_PP0_ENERGY_STATUS */ 169889facbeSLen Brown unsigned int energy_gfx; /* MSR_PP1_ENERGY_STATUS */ 170889facbeSLen Brown unsigned int rapl_pkg_perf_status; /* MSR_PKG_PERF_STATUS */ 171889facbeSLen Brown unsigned int rapl_dram_perf_status; /* MSR_DRAM_PERF_STATUS */ 172889facbeSLen Brown unsigned int pkg_temp_c; 173889facbeSLen Brown 174c98d5d94SLen Brown } *package_even, *package_odd; 175c98d5d94SLen Brown 176c98d5d94SLen Brown #define ODD_COUNTERS thread_odd, core_odd, package_odd 177c98d5d94SLen Brown #define EVEN_COUNTERS thread_even, core_even, package_even 178c98d5d94SLen Brown 179c98d5d94SLen Brown #define GET_THREAD(thread_base, thread_no, core_no, pkg_no) \ 180c98d5d94SLen Brown (thread_base + (pkg_no) * topo.num_cores_per_pkg * \ 181c98d5d94SLen Brown topo.num_threads_per_core + \ 182c98d5d94SLen Brown (core_no) * topo.num_threads_per_core + (thread_no)) 183c98d5d94SLen Brown #define GET_CORE(core_base, core_no, pkg_no) \ 184c98d5d94SLen Brown (core_base + (pkg_no) * topo.num_cores_per_pkg + (core_no)) 185c98d5d94SLen Brown #define GET_PKG(pkg_base, pkg_no) (pkg_base + pkg_no) 186c98d5d94SLen Brown 187c98d5d94SLen Brown struct system_summary { 188c98d5d94SLen Brown struct thread_data threads; 189c98d5d94SLen Brown struct core_data cores; 190c98d5d94SLen Brown struct pkg_data packages; 191c98d5d94SLen Brown } sum, average; 192c98d5d94SLen Brown 193c98d5d94SLen Brown 194c98d5d94SLen Brown struct topo_params { 195c98d5d94SLen Brown int num_packages; 196103a8feaSLen Brown int num_cpus; 197c98d5d94SLen Brown int num_cores; 198c98d5d94SLen Brown int max_cpu_num; 199c98d5d94SLen Brown int num_cores_per_pkg; 200c98d5d94SLen Brown int num_threads_per_core; 201c98d5d94SLen Brown } topo; 202103a8feaSLen Brown 203c98d5d94SLen Brown struct timeval tv_even, tv_odd, tv_delta; 204103a8feaSLen Brown 205c98d5d94SLen Brown void setup_all_buffers(void); 206103a8feaSLen Brown 207c98d5d94SLen Brown int cpu_is_not_present(int cpu) 208d15cf7c1SLen Brown { 209c98d5d94SLen Brown return !CPU_ISSET_S(cpu, cpu_present_setsize, cpu_present_set); 210c98d5d94SLen Brown } 211c98d5d94SLen Brown /* 212c98d5d94SLen Brown * run func(thread, core, package) in topology order 213c98d5d94SLen Brown * skip non-present cpus 214c98d5d94SLen Brown */ 215c98d5d94SLen Brown 216c98d5d94SLen Brown int for_all_cpus(int (func)(struct thread_data *, struct core_data *, struct pkg_data *), 217c98d5d94SLen Brown struct thread_data *thread_base, struct core_data *core_base, struct pkg_data *pkg_base) 218c98d5d94SLen Brown { 219c98d5d94SLen Brown int retval, pkg_no, core_no, thread_no; 220c98d5d94SLen Brown 221c98d5d94SLen Brown for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) { 222c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 223c98d5d94SLen Brown for (thread_no = 0; thread_no < 224c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 225c98d5d94SLen Brown struct thread_data *t; 226c98d5d94SLen Brown struct core_data *c; 227c98d5d94SLen Brown struct pkg_data *p; 228c98d5d94SLen Brown 229c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 230c98d5d94SLen Brown 231c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 232c98d5d94SLen Brown continue; 233c98d5d94SLen Brown 234c98d5d94SLen Brown c = GET_CORE(core_base, core_no, pkg_no); 235c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 236c98d5d94SLen Brown 237c98d5d94SLen Brown retval = func(t, c, p); 238c98d5d94SLen Brown if (retval) 239c98d5d94SLen Brown return retval; 240c98d5d94SLen Brown } 241c98d5d94SLen Brown } 242c98d5d94SLen Brown } 243d15cf7c1SLen Brown return 0; 244d15cf7c1SLen Brown } 245d15cf7c1SLen Brown 24688c3281fSLen Brown int cpu_migrate(int cpu) 24788c3281fSLen Brown { 248c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 249c98d5d94SLen Brown CPU_SET_S(cpu, cpu_affinity_setsize, cpu_affinity_set); 250c98d5d94SLen Brown if (sched_setaffinity(0, cpu_affinity_setsize, cpu_affinity_set) == -1) 25188c3281fSLen Brown return -1; 25288c3281fSLen Brown else 25388c3281fSLen Brown return 0; 25488c3281fSLen Brown } 25588c3281fSLen Brown 25615aaa346SLen Brown int get_msr(int cpu, off_t offset, unsigned long long *msr) 257103a8feaSLen Brown { 258103a8feaSLen Brown ssize_t retval; 259103a8feaSLen Brown char pathname[32]; 260103a8feaSLen Brown int fd; 261103a8feaSLen Brown 262103a8feaSLen Brown sprintf(pathname, "/dev/cpu/%d/msr", cpu); 263103a8feaSLen Brown fd = open(pathname, O_RDONLY); 26415aaa346SLen Brown if (fd < 0) 26598481e79SLen Brown err(-1, "%s open failed, try chown or chmod +r /dev/cpu/*/msr, or run as root", pathname); 266103a8feaSLen Brown 26715aaa346SLen Brown retval = pread(fd, msr, sizeof *msr, offset); 268103a8feaSLen Brown close(fd); 26915aaa346SLen Brown 27098481e79SLen Brown if (retval != sizeof *msr) 27198481e79SLen Brown err(-1, "%s offset 0x%llx read failed", pathname, (unsigned long long)offset); 27215aaa346SLen Brown 27315aaa346SLen Brown return 0; 274103a8feaSLen Brown } 275103a8feaSLen Brown 276fc04cc67SLen Brown /* 277fc04cc67SLen Brown * Example Format w/ field column widths: 278fc04cc67SLen Brown * 279fc04cc67SLen Brown * Package Core CPU Avg_MHz Bzy_MHz TSC_MHz SMI %Busy CPU_%c1 CPU_%c3 CPU_%c6 CPU_%c7 CoreTmp PkgTmp Pkg%pc2 Pkg%pc3 Pkg%pc6 Pkg%pc7 PkgWatt CorWatt GFXWatt 280e7c95ff3SLen Brown * 123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678 281fc04cc67SLen Brown */ 282fc04cc67SLen Brown 283a829eb4dSLen Brown void print_header(void) 284103a8feaSLen Brown { 285103a8feaSLen Brown if (show_pkg) 286fc04cc67SLen Brown outp += sprintf(outp, " Package"); 287103a8feaSLen Brown if (show_core) 288fc04cc67SLen Brown outp += sprintf(outp, " Core"); 289103a8feaSLen Brown if (show_cpu) 290c98d5d94SLen Brown outp += sprintf(outp, " CPU"); 291103a8feaSLen Brown if (has_aperf) 292fc04cc67SLen Brown outp += sprintf(outp, " Avg_MHz"); 293d7899447SLen Brown if (has_aperf) 294fc04cc67SLen Brown outp += sprintf(outp, " %%Busy"); 295fc04cc67SLen Brown if (has_aperf) 296fc04cc67SLen Brown outp += sprintf(outp, " Bzy_MHz"); 297fc04cc67SLen Brown outp += sprintf(outp, " TSC_MHz"); 2981cc21f7bSLen Brown 2998e180f3cSLen Brown if (extra_delta_offset32) 300f9240813SLen Brown outp += sprintf(outp, " count 0x%03X", extra_delta_offset32); 3018e180f3cSLen Brown if (extra_delta_offset64) 302f9240813SLen Brown outp += sprintf(outp, " COUNT 0x%03X", extra_delta_offset64); 3032f32edf1SLen Brown if (extra_msr_offset32) 3048e180f3cSLen Brown outp += sprintf(outp, " MSR 0x%03X", extra_msr_offset32); 3052f32edf1SLen Brown if (extra_msr_offset64) 3068e180f3cSLen Brown outp += sprintf(outp, " MSR 0x%03X", extra_msr_offset64); 3071cc21f7bSLen Brown 3081cc21f7bSLen Brown if (!debug) 3091cc21f7bSLen Brown goto done; 3101cc21f7bSLen Brown 3111cc21f7bSLen Brown if (do_smi) 3121cc21f7bSLen Brown outp += sprintf(outp, " SMI"); 3131cc21f7bSLen Brown 314103a8feaSLen Brown if (do_nhm_cstates) 315fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c1"); 316144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 317fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c3"); 318103a8feaSLen Brown if (do_nhm_cstates) 319fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c6"); 320103a8feaSLen Brown if (do_snb_cstates) 321fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c7"); 322889facbeSLen Brown 323889facbeSLen Brown if (do_dts) 324fc04cc67SLen Brown outp += sprintf(outp, " CoreTmp"); 325889facbeSLen Brown if (do_ptm) 326fc04cc67SLen Brown outp += sprintf(outp, " PkgTmp"); 327889facbeSLen Brown 328*0b2bb692SLen Brown if (do_skl_residency) { 329*0b2bb692SLen Brown outp += sprintf(outp, " Totl%%C0"); 330*0b2bb692SLen Brown outp += sprintf(outp, " Any%%C0"); 331*0b2bb692SLen Brown outp += sprintf(outp, " GFX%%C0"); 332*0b2bb692SLen Brown outp += sprintf(outp, " CPUGFX%%"); 333*0b2bb692SLen Brown } 334*0b2bb692SLen Brown 335ee7e38e3SLen Brown if (do_pc2) 336fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc2"); 337ee7e38e3SLen Brown if (do_pc3) 338fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc3"); 339ee7e38e3SLen Brown if (do_pc6) 340fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc6"); 341ee7e38e3SLen Brown if (do_pc7) 342fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc7"); 343ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 344fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc8"); 345fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc9"); 346fc04cc67SLen Brown outp += sprintf(outp, " Pk%%pc10"); 347ca58710fSKristen Carlson Accardi } 348103a8feaSLen Brown 3495c56be9aSDirk Brandewie if (do_rapl && !rapl_joules) { 350889facbeSLen Brown if (do_rapl & RAPL_PKG) 351fc04cc67SLen Brown outp += sprintf(outp, " PkgWatt"); 352889facbeSLen Brown if (do_rapl & RAPL_CORES) 353fc04cc67SLen Brown outp += sprintf(outp, " CorWatt"); 354889facbeSLen Brown if (do_rapl & RAPL_GFX) 355fc04cc67SLen Brown outp += sprintf(outp, " GFXWatt"); 356889facbeSLen Brown if (do_rapl & RAPL_DRAM) 357fc04cc67SLen Brown outp += sprintf(outp, " RAMWatt"); 358889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) 359889facbeSLen Brown outp += sprintf(outp, " PKG_%%"); 360889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) 361889facbeSLen Brown outp += sprintf(outp, " RAM_%%"); 362d7899447SLen Brown } else if (do_rapl && rapl_joules) { 3635c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG) 3645c56be9aSDirk Brandewie outp += sprintf(outp, " Pkg_J"); 3655c56be9aSDirk Brandewie if (do_rapl & RAPL_CORES) 3665c56be9aSDirk Brandewie outp += sprintf(outp, " Cor_J"); 3675c56be9aSDirk Brandewie if (do_rapl & RAPL_GFX) 3685c56be9aSDirk Brandewie outp += sprintf(outp, " GFX_J"); 3695c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM) 3705c56be9aSDirk Brandewie outp += sprintf(outp, " RAM_W"); 3715c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG_PERF_STATUS) 3725c56be9aSDirk Brandewie outp += sprintf(outp, " PKG_%%"); 3735c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM_PERF_STATUS) 3745c56be9aSDirk Brandewie outp += sprintf(outp, " RAM_%%"); 3755c56be9aSDirk Brandewie outp += sprintf(outp, " time"); 376889facbeSLen Brown 3775c56be9aSDirk Brandewie } 3781cc21f7bSLen Brown done: 379c98d5d94SLen Brown outp += sprintf(outp, "\n"); 380103a8feaSLen Brown } 381103a8feaSLen Brown 382c98d5d94SLen Brown int dump_counters(struct thread_data *t, struct core_data *c, 383c98d5d94SLen Brown struct pkg_data *p) 384103a8feaSLen Brown { 3853b4d5c7fSAndy Shevchenko outp += sprintf(outp, "t %p, c %p, p %p\n", t, c, p); 386c98d5d94SLen Brown 387c98d5d94SLen Brown if (t) { 3883b4d5c7fSAndy Shevchenko outp += sprintf(outp, "CPU: %d flags 0x%x\n", 3893b4d5c7fSAndy Shevchenko t->cpu_id, t->flags); 3903b4d5c7fSAndy Shevchenko outp += sprintf(outp, "TSC: %016llX\n", t->tsc); 3913b4d5c7fSAndy Shevchenko outp += sprintf(outp, "aperf: %016llX\n", t->aperf); 3923b4d5c7fSAndy Shevchenko outp += sprintf(outp, "mperf: %016llX\n", t->mperf); 3933b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c1: %016llX\n", t->c1); 3943b4d5c7fSAndy Shevchenko outp += sprintf(outp, "msr0x%x: %08llX\n", 3958e180f3cSLen Brown extra_delta_offset32, t->extra_delta32); 3963b4d5c7fSAndy Shevchenko outp += sprintf(outp, "msr0x%x: %016llX\n", 3978e180f3cSLen Brown extra_delta_offset64, t->extra_delta64); 3983b4d5c7fSAndy Shevchenko outp += sprintf(outp, "msr0x%x: %08llX\n", 3992f32edf1SLen Brown extra_msr_offset32, t->extra_msr32); 4003b4d5c7fSAndy Shevchenko outp += sprintf(outp, "msr0x%x: %016llX\n", 4012f32edf1SLen Brown extra_msr_offset64, t->extra_msr64); 4021ed51011SLen Brown if (do_smi) 4033b4d5c7fSAndy Shevchenko outp += sprintf(outp, "SMI: %08X\n", t->smi_count); 404103a8feaSLen Brown } 405103a8feaSLen Brown 406c98d5d94SLen Brown if (c) { 4073b4d5c7fSAndy Shevchenko outp += sprintf(outp, "core: %d\n", c->core_id); 4083b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c3: %016llX\n", c->c3); 4093b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c6: %016llX\n", c->c6); 4103b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c7: %016llX\n", c->c7); 4113b4d5c7fSAndy Shevchenko outp += sprintf(outp, "DTS: %dC\n", c->core_temp_c); 412c98d5d94SLen Brown } 413103a8feaSLen Brown 414c98d5d94SLen Brown if (p) { 4153b4d5c7fSAndy Shevchenko outp += sprintf(outp, "package: %d\n", p->package_id); 416*0b2bb692SLen Brown 417*0b2bb692SLen Brown outp += sprintf(outp, "Weighted cores: %016llX\n", p->pkg_wtd_core_c0); 418*0b2bb692SLen Brown outp += sprintf(outp, "Any cores: %016llX\n", p->pkg_any_core_c0); 419*0b2bb692SLen Brown outp += sprintf(outp, "Any GFX: %016llX\n", p->pkg_any_gfxe_c0); 420*0b2bb692SLen Brown outp += sprintf(outp, "CPU + GFX: %016llX\n", p->pkg_both_core_gfxe_c0); 421*0b2bb692SLen Brown 4223b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc2: %016llX\n", p->pc2); 423ee7e38e3SLen Brown if (do_pc3) 4243b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc3: %016llX\n", p->pc3); 425ee7e38e3SLen Brown if (do_pc6) 4263b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc6: %016llX\n", p->pc6); 427ee7e38e3SLen Brown if (do_pc7) 4283b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc7: %016llX\n", p->pc7); 4293b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc8: %016llX\n", p->pc8); 4303b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc9: %016llX\n", p->pc9); 4313b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc10: %016llX\n", p->pc10); 4323b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules PKG: %0X\n", p->energy_pkg); 4333b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules COR: %0X\n", p->energy_cores); 4343b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules GFX: %0X\n", p->energy_gfx); 4353b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules RAM: %0X\n", p->energy_dram); 4363b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Throttle PKG: %0X\n", 4373b4d5c7fSAndy Shevchenko p->rapl_pkg_perf_status); 4383b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Throttle RAM: %0X\n", 4393b4d5c7fSAndy Shevchenko p->rapl_dram_perf_status); 4403b4d5c7fSAndy Shevchenko outp += sprintf(outp, "PTM: %dC\n", p->pkg_temp_c); 441c98d5d94SLen Brown } 4423b4d5c7fSAndy Shevchenko 4433b4d5c7fSAndy Shevchenko outp += sprintf(outp, "\n"); 4443b4d5c7fSAndy Shevchenko 445c98d5d94SLen Brown return 0; 446103a8feaSLen Brown } 447103a8feaSLen Brown 448e23da037SLen Brown /* 449e23da037SLen Brown * column formatting convention & formats 450e23da037SLen Brown */ 451c98d5d94SLen Brown int format_counters(struct thread_data *t, struct core_data *c, 452c98d5d94SLen Brown struct pkg_data *p) 453103a8feaSLen Brown { 454103a8feaSLen Brown double interval_float; 455fc04cc67SLen Brown char *fmt8; 456103a8feaSLen Brown 457c98d5d94SLen Brown /* if showing only 1st thread in core and this isn't one, bail out */ 458c98d5d94SLen Brown if (show_core_only && !(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 459c98d5d94SLen Brown return 0; 460c98d5d94SLen Brown 461c98d5d94SLen Brown /* if showing only 1st thread in pkg and this isn't one, bail out */ 462c98d5d94SLen Brown if (show_pkg_only && !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 463c98d5d94SLen Brown return 0; 464c98d5d94SLen Brown 465103a8feaSLen Brown interval_float = tv_delta.tv_sec + tv_delta.tv_usec/1000000.0; 466103a8feaSLen Brown 467c98d5d94SLen Brown /* topo columns, print blanks on 1st (average) line */ 468c98d5d94SLen Brown if (t == &average.threads) { 469103a8feaSLen Brown if (show_pkg) 470fc04cc67SLen Brown outp += sprintf(outp, " -"); 471103a8feaSLen Brown if (show_core) 472fc04cc67SLen Brown outp += sprintf(outp, " -"); 473103a8feaSLen Brown if (show_cpu) 474fc04cc67SLen Brown outp += sprintf(outp, " -"); 475103a8feaSLen Brown } else { 476c98d5d94SLen Brown if (show_pkg) { 477c98d5d94SLen Brown if (p) 478fc04cc67SLen Brown outp += sprintf(outp, "%8d", p->package_id); 479c98d5d94SLen Brown else 480fc04cc67SLen Brown outp += sprintf(outp, " -"); 481c98d5d94SLen Brown } 482c98d5d94SLen Brown if (show_core) { 483c98d5d94SLen Brown if (c) 484fc04cc67SLen Brown outp += sprintf(outp, "%8d", c->core_id); 485c98d5d94SLen Brown else 486fc04cc67SLen Brown outp += sprintf(outp, " -"); 487c98d5d94SLen Brown } 488103a8feaSLen Brown if (show_cpu) 489fc04cc67SLen Brown outp += sprintf(outp, "%8d", t->cpu_id); 490103a8feaSLen Brown } 491fc04cc67SLen Brown 492d7899447SLen Brown /* Avg_MHz */ 493fc04cc67SLen Brown if (has_aperf) 494fc04cc67SLen Brown outp += sprintf(outp, "%8.0f", 495fc04cc67SLen Brown 1.0 / units * t->aperf / interval_float); 496fc04cc67SLen Brown 497d7899447SLen Brown /* %Busy */ 498d7899447SLen Brown if (has_aperf) { 499103a8feaSLen Brown if (!skip_c0) 500fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * t->mperf/t->tsc); 501103a8feaSLen Brown else 502fc04cc67SLen Brown outp += sprintf(outp, "********"); 503103a8feaSLen Brown } 504103a8feaSLen Brown 505d7899447SLen Brown /* Bzy_MHz */ 506fc04cc67SLen Brown if (has_aperf) 507fc04cc67SLen Brown outp += sprintf(outp, "%8.0f", 508fc04cc67SLen Brown 1.0 * t->tsc / units * t->aperf / t->mperf / interval_float); 509103a8feaSLen Brown 510d7899447SLen Brown /* TSC_MHz */ 511fc04cc67SLen Brown outp += sprintf(outp, "%8.0f", 1.0 * t->tsc/units/interval_float); 512103a8feaSLen Brown 5138e180f3cSLen Brown /* delta */ 5148e180f3cSLen Brown if (extra_delta_offset32) 5158e180f3cSLen Brown outp += sprintf(outp, " %11llu", t->extra_delta32); 5168e180f3cSLen Brown 5178e180f3cSLen Brown /* DELTA */ 5188e180f3cSLen Brown if (extra_delta_offset64) 5198e180f3cSLen Brown outp += sprintf(outp, " %11llu", t->extra_delta64); 5202f32edf1SLen Brown /* msr */ 5212f32edf1SLen Brown if (extra_msr_offset32) 5228e180f3cSLen Brown outp += sprintf(outp, " 0x%08llx", t->extra_msr32); 5232f32edf1SLen Brown 524130ff304SLen Brown /* MSR */ 5252f32edf1SLen Brown if (extra_msr_offset64) 5262f32edf1SLen Brown outp += sprintf(outp, " 0x%016llx", t->extra_msr64); 527130ff304SLen Brown 5281cc21f7bSLen Brown if (!debug) 5291cc21f7bSLen Brown goto done; 5301cc21f7bSLen Brown 5311cc21f7bSLen Brown /* SMI */ 5321cc21f7bSLen Brown if (do_smi) 5331cc21f7bSLen Brown outp += sprintf(outp, "%8d", t->smi_count); 5341cc21f7bSLen Brown 535103a8feaSLen Brown if (do_nhm_cstates) { 536103a8feaSLen Brown if (!skip_c1) 537fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * t->c1/t->tsc); 538103a8feaSLen Brown else 539fc04cc67SLen Brown outp += sprintf(outp, "********"); 540103a8feaSLen Brown } 541c98d5d94SLen Brown 542c98d5d94SLen Brown /* print per-core data only for 1st thread in core */ 543c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 544c98d5d94SLen Brown goto done; 545c98d5d94SLen Brown 546144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 547fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * c->c3/t->tsc); 548103a8feaSLen Brown if (do_nhm_cstates) 549fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * c->c6/t->tsc); 550103a8feaSLen Brown if (do_snb_cstates) 551fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * c->c7/t->tsc); 552c98d5d94SLen Brown 553889facbeSLen Brown if (do_dts) 554fc04cc67SLen Brown outp += sprintf(outp, "%8d", c->core_temp_c); 555889facbeSLen Brown 556c98d5d94SLen Brown /* print per-package data only for 1st core in package */ 557c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 558c98d5d94SLen Brown goto done; 559c98d5d94SLen Brown 560*0b2bb692SLen Brown /* PkgTmp */ 561889facbeSLen Brown if (do_ptm) 562fc04cc67SLen Brown outp += sprintf(outp, "%8d", p->pkg_temp_c); 563889facbeSLen Brown 564*0b2bb692SLen Brown /* Totl%C0, Any%C0 GFX%C0 CPUGFX% */ 565*0b2bb692SLen Brown if (do_skl_residency) { 566*0b2bb692SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pkg_wtd_core_c0/t->tsc); 567*0b2bb692SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pkg_any_core_c0/t->tsc); 568*0b2bb692SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pkg_any_gfxe_c0/t->tsc); 569*0b2bb692SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pkg_both_core_gfxe_c0/t->tsc); 570*0b2bb692SLen Brown } 571*0b2bb692SLen Brown 572ee7e38e3SLen Brown if (do_pc2) 573fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc2/t->tsc); 574ee7e38e3SLen Brown if (do_pc3) 575fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc3/t->tsc); 576ee7e38e3SLen Brown if (do_pc6) 577fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc6/t->tsc); 578ee7e38e3SLen Brown if (do_pc7) 579fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc7/t->tsc); 580ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 581fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc8/t->tsc); 582fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc9/t->tsc); 583fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc10/t->tsc); 584ca58710fSKristen Carlson Accardi } 585889facbeSLen Brown 586889facbeSLen Brown /* 587889facbeSLen Brown * If measurement interval exceeds minimum RAPL Joule Counter range, 588889facbeSLen Brown * indicate that results are suspect by printing "**" in fraction place. 589889facbeSLen Brown */ 590fc04cc67SLen Brown if (interval_float < rapl_joule_counter_range) 591fc04cc67SLen Brown fmt8 = "%8.2f"; 592fc04cc67SLen Brown else 593fc04cc67SLen Brown fmt8 = " %6.0f**"; 594889facbeSLen Brown 5955c56be9aSDirk Brandewie if (do_rapl && !rapl_joules) { 596889facbeSLen Brown if (do_rapl & RAPL_PKG) 597fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_pkg * rapl_energy_units / interval_float); 598889facbeSLen Brown if (do_rapl & RAPL_CORES) 599fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_cores * rapl_energy_units / interval_float); 600889facbeSLen Brown if (do_rapl & RAPL_GFX) 601fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_gfx * rapl_energy_units / interval_float); 602889facbeSLen Brown if (do_rapl & RAPL_DRAM) 603fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_dram * rapl_energy_units / interval_float); 604889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) 605fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_pkg_perf_status * rapl_time_units / interval_float); 606889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) 607fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_dram_perf_status * rapl_time_units / interval_float); 608d7899447SLen Brown } else if (do_rapl && rapl_joules) { 6095c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG) 610fc04cc67SLen Brown outp += sprintf(outp, fmt8, 6115c56be9aSDirk Brandewie p->energy_pkg * rapl_energy_units); 6125c56be9aSDirk Brandewie if (do_rapl & RAPL_CORES) 613fc04cc67SLen Brown outp += sprintf(outp, fmt8, 6145c56be9aSDirk Brandewie p->energy_cores * rapl_energy_units); 6155c56be9aSDirk Brandewie if (do_rapl & RAPL_GFX) 616fc04cc67SLen Brown outp += sprintf(outp, fmt8, 6175c56be9aSDirk Brandewie p->energy_gfx * rapl_energy_units); 6185c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM) 619fc04cc67SLen Brown outp += sprintf(outp, fmt8, 6205c56be9aSDirk Brandewie p->energy_dram * rapl_energy_units); 6215c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG_PERF_STATUS) 622fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_pkg_perf_status * rapl_time_units / interval_float); 6235c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM_PERF_STATUS) 624fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_dram_perf_status * rapl_time_units / interval_float); 625889facbeSLen Brown 626d7899447SLen Brown outp += sprintf(outp, fmt8, interval_float); 6275c56be9aSDirk Brandewie } 628c98d5d94SLen Brown done: 629c98d5d94SLen Brown outp += sprintf(outp, "\n"); 630c98d5d94SLen Brown 631c98d5d94SLen Brown return 0; 632103a8feaSLen Brown } 633103a8feaSLen Brown 634c98d5d94SLen Brown void flush_stdout() 635103a8feaSLen Brown { 636c98d5d94SLen Brown fputs(output_buffer, stdout); 637ddac0d68SLen Brown fflush(stdout); 638c98d5d94SLen Brown outp = output_buffer; 639c98d5d94SLen Brown } 640c98d5d94SLen Brown void flush_stderr() 641c98d5d94SLen Brown { 642c98d5d94SLen Brown fputs(output_buffer, stderr); 643c98d5d94SLen Brown outp = output_buffer; 644c98d5d94SLen Brown } 645c98d5d94SLen Brown void format_all_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 646c98d5d94SLen Brown { 647e23da037SLen Brown static int printed; 648103a8feaSLen Brown 649e23da037SLen Brown if (!printed || !summary_only) 650103a8feaSLen Brown print_header(); 651103a8feaSLen Brown 652c98d5d94SLen Brown if (topo.num_cpus > 1) 653c98d5d94SLen Brown format_counters(&average.threads, &average.cores, 654c98d5d94SLen Brown &average.packages); 655103a8feaSLen Brown 656e23da037SLen Brown printed = 1; 657e23da037SLen Brown 658e23da037SLen Brown if (summary_only) 659e23da037SLen Brown return; 660e23da037SLen Brown 661c98d5d94SLen Brown for_all_cpus(format_counters, t, c, p); 662103a8feaSLen Brown } 663103a8feaSLen Brown 664889facbeSLen Brown #define DELTA_WRAP32(new, old) \ 665889facbeSLen Brown if (new > old) { \ 666889facbeSLen Brown old = new - old; \ 667889facbeSLen Brown } else { \ 668889facbeSLen Brown old = 0x100000000 + new - old; \ 669889facbeSLen Brown } 670889facbeSLen Brown 671c98d5d94SLen Brown void 672c98d5d94SLen Brown delta_package(struct pkg_data *new, struct pkg_data *old) 673103a8feaSLen Brown { 674*0b2bb692SLen Brown 675*0b2bb692SLen Brown if (do_skl_residency) { 676*0b2bb692SLen Brown old->pkg_wtd_core_c0 = new->pkg_wtd_core_c0 - old->pkg_wtd_core_c0; 677*0b2bb692SLen Brown old->pkg_any_core_c0 = new->pkg_any_core_c0 - old->pkg_any_core_c0; 678*0b2bb692SLen Brown old->pkg_any_gfxe_c0 = new->pkg_any_gfxe_c0 - old->pkg_any_gfxe_c0; 679*0b2bb692SLen Brown old->pkg_both_core_gfxe_c0 = new->pkg_both_core_gfxe_c0 - old->pkg_both_core_gfxe_c0; 680*0b2bb692SLen Brown } 681c98d5d94SLen Brown old->pc2 = new->pc2 - old->pc2; 682ee7e38e3SLen Brown if (do_pc3) 683c98d5d94SLen Brown old->pc3 = new->pc3 - old->pc3; 684ee7e38e3SLen Brown if (do_pc6) 685c98d5d94SLen Brown old->pc6 = new->pc6 - old->pc6; 686ee7e38e3SLen Brown if (do_pc7) 687c98d5d94SLen Brown old->pc7 = new->pc7 - old->pc7; 688ca58710fSKristen Carlson Accardi old->pc8 = new->pc8 - old->pc8; 689ca58710fSKristen Carlson Accardi old->pc9 = new->pc9 - old->pc9; 690ca58710fSKristen Carlson Accardi old->pc10 = new->pc10 - old->pc10; 691889facbeSLen Brown old->pkg_temp_c = new->pkg_temp_c; 692889facbeSLen Brown 693889facbeSLen Brown DELTA_WRAP32(new->energy_pkg, old->energy_pkg); 694889facbeSLen Brown DELTA_WRAP32(new->energy_cores, old->energy_cores); 695889facbeSLen Brown DELTA_WRAP32(new->energy_gfx, old->energy_gfx); 696889facbeSLen Brown DELTA_WRAP32(new->energy_dram, old->energy_dram); 697889facbeSLen Brown DELTA_WRAP32(new->rapl_pkg_perf_status, old->rapl_pkg_perf_status); 698889facbeSLen Brown DELTA_WRAP32(new->rapl_dram_perf_status, old->rapl_dram_perf_status); 699103a8feaSLen Brown } 700103a8feaSLen Brown 701c98d5d94SLen Brown void 702c98d5d94SLen Brown delta_core(struct core_data *new, struct core_data *old) 703c98d5d94SLen Brown { 704c98d5d94SLen Brown old->c3 = new->c3 - old->c3; 705c98d5d94SLen Brown old->c6 = new->c6 - old->c6; 706c98d5d94SLen Brown old->c7 = new->c7 - old->c7; 707889facbeSLen Brown old->core_temp_c = new->core_temp_c; 708103a8feaSLen Brown } 709c98d5d94SLen Brown 710c3ae331dSLen Brown /* 711c3ae331dSLen Brown * old = new - old 712c3ae331dSLen Brown */ 713c98d5d94SLen Brown void 714c98d5d94SLen Brown delta_thread(struct thread_data *new, struct thread_data *old, 715c98d5d94SLen Brown struct core_data *core_delta) 716c98d5d94SLen Brown { 717c98d5d94SLen Brown old->tsc = new->tsc - old->tsc; 718c98d5d94SLen Brown 719103a8feaSLen Brown /* check for TSC < 1 Mcycles over interval */ 720b2c95d90SJosh Triplett if (old->tsc < (1000 * 1000)) 721b2c95d90SJosh Triplett errx(-3, "Insanely slow TSC rate, TSC stops in idle?\n" 722b2c95d90SJosh Triplett "You can disable all c-states by booting with \"idle=poll\"\n" 723b2c95d90SJosh Triplett "or just the deep ones with \"processor.max_cstate=1\""); 724103a8feaSLen Brown 725c98d5d94SLen Brown old->c1 = new->c1 - old->c1; 726c98d5d94SLen Brown 727a729617cSLen Brown if (has_aperf) { 728c98d5d94SLen Brown if ((new->aperf > old->aperf) && (new->mperf > old->mperf)) { 729c98d5d94SLen Brown old->aperf = new->aperf - old->aperf; 730c98d5d94SLen Brown old->mperf = new->mperf - old->mperf; 731c98d5d94SLen Brown } else { 732c98d5d94SLen Brown 733103a8feaSLen Brown if (!aperf_mperf_unstable) { 734103a8feaSLen Brown fprintf(stderr, "%s: APERF or MPERF went backwards *\n", progname); 735103a8feaSLen Brown fprintf(stderr, "* Frequency results do not cover entire interval *\n"); 736103a8feaSLen Brown fprintf(stderr, "* fix this by running Linux-2.6.30 or later *\n"); 737103a8feaSLen Brown 738103a8feaSLen Brown aperf_mperf_unstable = 1; 739103a8feaSLen Brown } 740103a8feaSLen Brown /* 741103a8feaSLen Brown * mperf delta is likely a huge "positive" number 742103a8feaSLen Brown * can not use it for calculating c0 time 743103a8feaSLen Brown */ 744103a8feaSLen Brown skip_c0 = 1; 745103a8feaSLen Brown skip_c1 = 1; 746103a8feaSLen Brown } 747a729617cSLen Brown } 748103a8feaSLen Brown 749c98d5d94SLen Brown 750144b44b1SLen Brown if (use_c1_residency_msr) { 751144b44b1SLen Brown /* 752144b44b1SLen Brown * Some models have a dedicated C1 residency MSR, 753144b44b1SLen Brown * which should be more accurate than the derivation below. 754144b44b1SLen Brown */ 755144b44b1SLen Brown } else { 756103a8feaSLen Brown /* 757c3ae331dSLen Brown * As counter collection is not atomic, 758c3ae331dSLen Brown * it is possible for mperf's non-halted cycles + idle states 759103a8feaSLen Brown * to exceed TSC's all cycles: show c1 = 0% in that case. 760103a8feaSLen Brown */ 761c3ae331dSLen Brown if ((old->mperf + core_delta->c3 + core_delta->c6 + core_delta->c7) > old->tsc) 762c98d5d94SLen Brown old->c1 = 0; 763c98d5d94SLen Brown else { 764c98d5d94SLen Brown /* normal case, derive c1 */ 765c98d5d94SLen Brown old->c1 = old->tsc - old->mperf - core_delta->c3 766c98d5d94SLen Brown - core_delta->c6 - core_delta->c7; 767c98d5d94SLen Brown } 768144b44b1SLen Brown } 769c3ae331dSLen Brown 770c98d5d94SLen Brown if (old->mperf == 0) { 771d8af6f5fSLen Brown if (debug > 1) fprintf(stderr, "cpu%d MPERF 0!\n", old->cpu_id); 772c98d5d94SLen Brown old->mperf = 1; /* divide by 0 protection */ 773c98d5d94SLen Brown } 774103a8feaSLen Brown 7758e180f3cSLen Brown old->extra_delta32 = new->extra_delta32 - old->extra_delta32; 7768e180f3cSLen Brown old->extra_delta32 &= 0xFFFFFFFF; 7778e180f3cSLen Brown 7788e180f3cSLen Brown old->extra_delta64 = new->extra_delta64 - old->extra_delta64; 7798e180f3cSLen Brown 780103a8feaSLen Brown /* 7818e180f3cSLen Brown * Extra MSR is just a snapshot, simply copy latest w/o subtracting 782103a8feaSLen Brown */ 7832f32edf1SLen Brown old->extra_msr32 = new->extra_msr32; 7842f32edf1SLen Brown old->extra_msr64 = new->extra_msr64; 7851ed51011SLen Brown 7861ed51011SLen Brown if (do_smi) 7871ed51011SLen Brown old->smi_count = new->smi_count - old->smi_count; 788103a8feaSLen Brown } 789c98d5d94SLen Brown 790c98d5d94SLen Brown int delta_cpu(struct thread_data *t, struct core_data *c, 791c98d5d94SLen Brown struct pkg_data *p, struct thread_data *t2, 792c98d5d94SLen Brown struct core_data *c2, struct pkg_data *p2) 793c98d5d94SLen Brown { 794c98d5d94SLen Brown /* calculate core delta only for 1st thread in core */ 795c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_THREAD_IN_CORE) 796c98d5d94SLen Brown delta_core(c, c2); 797c98d5d94SLen Brown 798c98d5d94SLen Brown /* always calculate thread delta */ 799c98d5d94SLen Brown delta_thread(t, t2, c2); /* c2 is core delta */ 800c98d5d94SLen Brown 801c98d5d94SLen Brown /* calculate package delta only for 1st core in package */ 802c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE) 803c98d5d94SLen Brown delta_package(p, p2); 804c98d5d94SLen Brown 805103a8feaSLen Brown return 0; 806103a8feaSLen Brown } 807103a8feaSLen Brown 808c98d5d94SLen Brown void clear_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 809103a8feaSLen Brown { 810c98d5d94SLen Brown t->tsc = 0; 811c98d5d94SLen Brown t->aperf = 0; 812c98d5d94SLen Brown t->mperf = 0; 813c98d5d94SLen Brown t->c1 = 0; 814103a8feaSLen Brown 8151ed51011SLen Brown t->smi_count = 0; 8168e180f3cSLen Brown t->extra_delta32 = 0; 8178e180f3cSLen Brown t->extra_delta64 = 0; 8188e180f3cSLen Brown 819c98d5d94SLen Brown /* tells format_counters to dump all fields from this set */ 820c98d5d94SLen Brown t->flags = CPU_IS_FIRST_THREAD_IN_CORE | CPU_IS_FIRST_CORE_IN_PACKAGE; 821c98d5d94SLen Brown 822c98d5d94SLen Brown c->c3 = 0; 823c98d5d94SLen Brown c->c6 = 0; 824c98d5d94SLen Brown c->c7 = 0; 825889facbeSLen Brown c->core_temp_c = 0; 826c98d5d94SLen Brown 827*0b2bb692SLen Brown p->pkg_wtd_core_c0 = 0; 828*0b2bb692SLen Brown p->pkg_any_core_c0 = 0; 829*0b2bb692SLen Brown p->pkg_any_gfxe_c0 = 0; 830*0b2bb692SLen Brown p->pkg_both_core_gfxe_c0 = 0; 831*0b2bb692SLen Brown 832c98d5d94SLen Brown p->pc2 = 0; 833ee7e38e3SLen Brown if (do_pc3) 834c98d5d94SLen Brown p->pc3 = 0; 835ee7e38e3SLen Brown if (do_pc6) 836c98d5d94SLen Brown p->pc6 = 0; 837ee7e38e3SLen Brown if (do_pc7) 838c98d5d94SLen Brown p->pc7 = 0; 839ca58710fSKristen Carlson Accardi p->pc8 = 0; 840ca58710fSKristen Carlson Accardi p->pc9 = 0; 841ca58710fSKristen Carlson Accardi p->pc10 = 0; 842889facbeSLen Brown 843889facbeSLen Brown p->energy_pkg = 0; 844889facbeSLen Brown p->energy_dram = 0; 845889facbeSLen Brown p->energy_cores = 0; 846889facbeSLen Brown p->energy_gfx = 0; 847889facbeSLen Brown p->rapl_pkg_perf_status = 0; 848889facbeSLen Brown p->rapl_dram_perf_status = 0; 849889facbeSLen Brown p->pkg_temp_c = 0; 850103a8feaSLen Brown } 851c98d5d94SLen Brown int sum_counters(struct thread_data *t, struct core_data *c, 852c98d5d94SLen Brown struct pkg_data *p) 853103a8feaSLen Brown { 854c98d5d94SLen Brown average.threads.tsc += t->tsc; 855c98d5d94SLen Brown average.threads.aperf += t->aperf; 856c98d5d94SLen Brown average.threads.mperf += t->mperf; 857c98d5d94SLen Brown average.threads.c1 += t->c1; 85815aaa346SLen Brown 8598e180f3cSLen Brown average.threads.extra_delta32 += t->extra_delta32; 8608e180f3cSLen Brown average.threads.extra_delta64 += t->extra_delta64; 8618e180f3cSLen Brown 862c98d5d94SLen Brown /* sum per-core values only for 1st thread in core */ 863c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 864c98d5d94SLen Brown return 0; 865c98d5d94SLen Brown 866c98d5d94SLen Brown average.cores.c3 += c->c3; 867c98d5d94SLen Brown average.cores.c6 += c->c6; 868c98d5d94SLen Brown average.cores.c7 += c->c7; 869c98d5d94SLen Brown 870889facbeSLen Brown average.cores.core_temp_c = MAX(average.cores.core_temp_c, c->core_temp_c); 871889facbeSLen Brown 872c98d5d94SLen Brown /* sum per-pkg values only for 1st core in pkg */ 873c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 874c98d5d94SLen Brown return 0; 875c98d5d94SLen Brown 876*0b2bb692SLen Brown if (do_skl_residency) { 877*0b2bb692SLen Brown average.packages.pkg_wtd_core_c0 += p->pkg_wtd_core_c0; 878*0b2bb692SLen Brown average.packages.pkg_any_core_c0 += p->pkg_any_core_c0; 879*0b2bb692SLen Brown average.packages.pkg_any_gfxe_c0 += p->pkg_any_gfxe_c0; 880*0b2bb692SLen Brown average.packages.pkg_both_core_gfxe_c0 += p->pkg_both_core_gfxe_c0; 881*0b2bb692SLen Brown } 882*0b2bb692SLen Brown 883c98d5d94SLen Brown average.packages.pc2 += p->pc2; 884ee7e38e3SLen Brown if (do_pc3) 885c98d5d94SLen Brown average.packages.pc3 += p->pc3; 886ee7e38e3SLen Brown if (do_pc6) 887c98d5d94SLen Brown average.packages.pc6 += p->pc6; 888ee7e38e3SLen Brown if (do_pc7) 889c98d5d94SLen Brown average.packages.pc7 += p->pc7; 890ca58710fSKristen Carlson Accardi average.packages.pc8 += p->pc8; 891ca58710fSKristen Carlson Accardi average.packages.pc9 += p->pc9; 892ca58710fSKristen Carlson Accardi average.packages.pc10 += p->pc10; 893c98d5d94SLen Brown 894889facbeSLen Brown average.packages.energy_pkg += p->energy_pkg; 895889facbeSLen Brown average.packages.energy_dram += p->energy_dram; 896889facbeSLen Brown average.packages.energy_cores += p->energy_cores; 897889facbeSLen Brown average.packages.energy_gfx += p->energy_gfx; 898889facbeSLen Brown 899889facbeSLen Brown average.packages.pkg_temp_c = MAX(average.packages.pkg_temp_c, p->pkg_temp_c); 900889facbeSLen Brown 901889facbeSLen Brown average.packages.rapl_pkg_perf_status += p->rapl_pkg_perf_status; 902889facbeSLen Brown average.packages.rapl_dram_perf_status += p->rapl_dram_perf_status; 903c98d5d94SLen Brown return 0; 904c98d5d94SLen Brown } 905c98d5d94SLen Brown /* 906c98d5d94SLen Brown * sum the counters for all cpus in the system 907c98d5d94SLen Brown * compute the weighted average 908c98d5d94SLen Brown */ 909c98d5d94SLen Brown void compute_average(struct thread_data *t, struct core_data *c, 910c98d5d94SLen Brown struct pkg_data *p) 911c98d5d94SLen Brown { 912c98d5d94SLen Brown clear_counters(&average.threads, &average.cores, &average.packages); 913c98d5d94SLen Brown 914c98d5d94SLen Brown for_all_cpus(sum_counters, t, c, p); 915c98d5d94SLen Brown 916c98d5d94SLen Brown average.threads.tsc /= topo.num_cpus; 917c98d5d94SLen Brown average.threads.aperf /= topo.num_cpus; 918c98d5d94SLen Brown average.threads.mperf /= topo.num_cpus; 919c98d5d94SLen Brown average.threads.c1 /= topo.num_cpus; 920c98d5d94SLen Brown 9218e180f3cSLen Brown average.threads.extra_delta32 /= topo.num_cpus; 9228e180f3cSLen Brown average.threads.extra_delta32 &= 0xFFFFFFFF; 9238e180f3cSLen Brown 9248e180f3cSLen Brown average.threads.extra_delta64 /= topo.num_cpus; 9258e180f3cSLen Brown 926c98d5d94SLen Brown average.cores.c3 /= topo.num_cores; 927c98d5d94SLen Brown average.cores.c6 /= topo.num_cores; 928c98d5d94SLen Brown average.cores.c7 /= topo.num_cores; 929c98d5d94SLen Brown 930*0b2bb692SLen Brown if (do_skl_residency) { 931*0b2bb692SLen Brown average.packages.pkg_wtd_core_c0 /= topo.num_packages; 932*0b2bb692SLen Brown average.packages.pkg_any_core_c0 /= topo.num_packages; 933*0b2bb692SLen Brown average.packages.pkg_any_gfxe_c0 /= topo.num_packages; 934*0b2bb692SLen Brown average.packages.pkg_both_core_gfxe_c0 /= topo.num_packages; 935*0b2bb692SLen Brown } 936*0b2bb692SLen Brown 937c98d5d94SLen Brown average.packages.pc2 /= topo.num_packages; 938ee7e38e3SLen Brown if (do_pc3) 939c98d5d94SLen Brown average.packages.pc3 /= topo.num_packages; 940ee7e38e3SLen Brown if (do_pc6) 941c98d5d94SLen Brown average.packages.pc6 /= topo.num_packages; 942ee7e38e3SLen Brown if (do_pc7) 943c98d5d94SLen Brown average.packages.pc7 /= topo.num_packages; 944ca58710fSKristen Carlson Accardi 945ca58710fSKristen Carlson Accardi average.packages.pc8 /= topo.num_packages; 946ca58710fSKristen Carlson Accardi average.packages.pc9 /= topo.num_packages; 947ca58710fSKristen Carlson Accardi average.packages.pc10 /= topo.num_packages; 948c98d5d94SLen Brown } 949c98d5d94SLen Brown 950c98d5d94SLen Brown static unsigned long long rdtsc(void) 951c98d5d94SLen Brown { 952c98d5d94SLen Brown unsigned int low, high; 953c98d5d94SLen Brown 954c98d5d94SLen Brown asm volatile("rdtsc" : "=a" (low), "=d" (high)); 955c98d5d94SLen Brown 956c98d5d94SLen Brown return low | ((unsigned long long)high) << 32; 957c98d5d94SLen Brown } 958c98d5d94SLen Brown 959c98d5d94SLen Brown 960c98d5d94SLen Brown /* 961c98d5d94SLen Brown * get_counters(...) 962c98d5d94SLen Brown * migrate to cpu 963c98d5d94SLen Brown * acquire and record local counters for that cpu 964c98d5d94SLen Brown */ 965c98d5d94SLen Brown int get_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 966c98d5d94SLen Brown { 967c98d5d94SLen Brown int cpu = t->cpu_id; 968889facbeSLen Brown unsigned long long msr; 969c98d5d94SLen Brown 970e52966c0SLen Brown if (cpu_migrate(cpu)) { 971e52966c0SLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 97215aaa346SLen Brown return -1; 973e52966c0SLen Brown } 97415aaa346SLen Brown 975c98d5d94SLen Brown t->tsc = rdtsc(); /* we are running on local CPU of interest */ 97615aaa346SLen Brown 97715aaa346SLen Brown if (has_aperf) { 9789c63a650SLen Brown if (get_msr(cpu, MSR_IA32_APERF, &t->aperf)) 979c98d5d94SLen Brown return -3; 9809c63a650SLen Brown if (get_msr(cpu, MSR_IA32_MPERF, &t->mperf)) 981c98d5d94SLen Brown return -4; 98288c3281fSLen Brown } 98388c3281fSLen Brown 9841ed51011SLen Brown if (do_smi) { 9851ed51011SLen Brown if (get_msr(cpu, MSR_SMI_COUNT, &msr)) 9861ed51011SLen Brown return -5; 9871ed51011SLen Brown t->smi_count = msr & 0xFFFFFFFF; 9881ed51011SLen Brown } 9898e180f3cSLen Brown if (extra_delta_offset32) { 990889facbeSLen Brown if (get_msr(cpu, extra_delta_offset32, &msr)) 9912f32edf1SLen Brown return -5; 992889facbeSLen Brown t->extra_delta32 = msr & 0xFFFFFFFF; 9938e180f3cSLen Brown } 9948e180f3cSLen Brown 9958e180f3cSLen Brown if (extra_delta_offset64) 9968e180f3cSLen Brown if (get_msr(cpu, extra_delta_offset64, &t->extra_delta64)) 9978e180f3cSLen Brown return -5; 9988e180f3cSLen Brown 9998e180f3cSLen Brown if (extra_msr_offset32) { 1000889facbeSLen Brown if (get_msr(cpu, extra_msr_offset32, &msr)) 10018e180f3cSLen Brown return -5; 1002889facbeSLen Brown t->extra_msr32 = msr & 0xFFFFFFFF; 10038e180f3cSLen Brown } 10042f32edf1SLen Brown 10052f32edf1SLen Brown if (extra_msr_offset64) 10062f32edf1SLen Brown if (get_msr(cpu, extra_msr_offset64, &t->extra_msr64)) 1007c98d5d94SLen Brown return -5; 1008c98d5d94SLen Brown 1009144b44b1SLen Brown if (use_c1_residency_msr) { 1010144b44b1SLen Brown if (get_msr(cpu, MSR_CORE_C1_RES, &t->c1)) 1011144b44b1SLen Brown return -6; 1012144b44b1SLen Brown } 1013144b44b1SLen Brown 1014c98d5d94SLen Brown /* collect core counters only for 1st thread in core */ 1015c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 1016c98d5d94SLen Brown return 0; 1017c98d5d94SLen Brown 1018144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) { 1019c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C3_RESIDENCY, &c->c3)) 1020c98d5d94SLen Brown return -6; 1021144b44b1SLen Brown } 1022144b44b1SLen Brown 1023144b44b1SLen Brown if (do_nhm_cstates) { 1024c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C6_RESIDENCY, &c->c6)) 1025c98d5d94SLen Brown return -7; 1026103a8feaSLen Brown } 102715aaa346SLen Brown 102815aaa346SLen Brown if (do_snb_cstates) 1029c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C7_RESIDENCY, &c->c7)) 1030c98d5d94SLen Brown return -8; 1031c98d5d94SLen Brown 1032889facbeSLen Brown if (do_dts) { 1033889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr)) 1034889facbeSLen Brown return -9; 1035889facbeSLen Brown c->core_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F); 1036889facbeSLen Brown } 1037889facbeSLen Brown 1038889facbeSLen Brown 1039c98d5d94SLen Brown /* collect package counters only for 1st core in package */ 1040c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1041c98d5d94SLen Brown return 0; 104215aaa346SLen Brown 1043*0b2bb692SLen Brown if (do_skl_residency) { 1044*0b2bb692SLen Brown if (get_msr(cpu, MSR_PKG_WEIGHTED_CORE_C0_RES, &p->pkg_wtd_core_c0)) 1045*0b2bb692SLen Brown return -10; 1046*0b2bb692SLen Brown if (get_msr(cpu, MSR_PKG_ANY_CORE_C0_RES, &p->pkg_any_core_c0)) 1047*0b2bb692SLen Brown return -11; 1048*0b2bb692SLen Brown if (get_msr(cpu, MSR_PKG_ANY_GFXE_C0_RES, &p->pkg_any_gfxe_c0)) 1049*0b2bb692SLen Brown return -12; 1050*0b2bb692SLen Brown if (get_msr(cpu, MSR_PKG_BOTH_CORE_GFXE_C0_RES, &p->pkg_both_core_gfxe_c0)) 1051*0b2bb692SLen Brown return -13; 1052*0b2bb692SLen Brown } 1053ee7e38e3SLen Brown if (do_pc3) 1054c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C3_RESIDENCY, &p->pc3)) 1055c98d5d94SLen Brown return -9; 1056ee7e38e3SLen Brown if (do_pc6) 1057c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C6_RESIDENCY, &p->pc6)) 1058c98d5d94SLen Brown return -10; 1059ee7e38e3SLen Brown if (do_pc2) 1060c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C2_RESIDENCY, &p->pc2)) 1061c98d5d94SLen Brown return -11; 1062ee7e38e3SLen Brown if (do_pc7) 1063c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C7_RESIDENCY, &p->pc7)) 1064c98d5d94SLen Brown return -12; 1065ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 1066ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C8_RESIDENCY, &p->pc8)) 1067ca58710fSKristen Carlson Accardi return -13; 1068ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C9_RESIDENCY, &p->pc9)) 1069ca58710fSKristen Carlson Accardi return -13; 1070ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C10_RESIDENCY, &p->pc10)) 1071ca58710fSKristen Carlson Accardi return -13; 1072ca58710fSKristen Carlson Accardi } 1073889facbeSLen Brown if (do_rapl & RAPL_PKG) { 1074889facbeSLen Brown if (get_msr(cpu, MSR_PKG_ENERGY_STATUS, &msr)) 1075889facbeSLen Brown return -13; 1076889facbeSLen Brown p->energy_pkg = msr & 0xFFFFFFFF; 1077889facbeSLen Brown } 1078889facbeSLen Brown if (do_rapl & RAPL_CORES) { 1079889facbeSLen Brown if (get_msr(cpu, MSR_PP0_ENERGY_STATUS, &msr)) 1080889facbeSLen Brown return -14; 1081889facbeSLen Brown p->energy_cores = msr & 0xFFFFFFFF; 1082889facbeSLen Brown } 1083889facbeSLen Brown if (do_rapl & RAPL_DRAM) { 1084889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_ENERGY_STATUS, &msr)) 1085889facbeSLen Brown return -15; 1086889facbeSLen Brown p->energy_dram = msr & 0xFFFFFFFF; 1087889facbeSLen Brown } 1088889facbeSLen Brown if (do_rapl & RAPL_GFX) { 1089889facbeSLen Brown if (get_msr(cpu, MSR_PP1_ENERGY_STATUS, &msr)) 1090889facbeSLen Brown return -16; 1091889facbeSLen Brown p->energy_gfx = msr & 0xFFFFFFFF; 1092889facbeSLen Brown } 1093889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) { 1094889facbeSLen Brown if (get_msr(cpu, MSR_PKG_PERF_STATUS, &msr)) 1095889facbeSLen Brown return -16; 1096889facbeSLen Brown p->rapl_pkg_perf_status = msr & 0xFFFFFFFF; 1097889facbeSLen Brown } 1098889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) { 1099889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_PERF_STATUS, &msr)) 1100889facbeSLen Brown return -16; 1101889facbeSLen Brown p->rapl_dram_perf_status = msr & 0xFFFFFFFF; 1102889facbeSLen Brown } 1103889facbeSLen Brown if (do_ptm) { 1104889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, &msr)) 1105889facbeSLen Brown return -17; 1106889facbeSLen Brown p->pkg_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F); 1107889facbeSLen Brown } 110815aaa346SLen Brown return 0; 1109103a8feaSLen Brown } 1110103a8feaSLen Brown 1111ee7e38e3SLen Brown /* 1112ee7e38e3SLen Brown * MSR_PKG_CST_CONFIG_CONTROL decoding for pkg_cstate_limit: 1113ee7e38e3SLen Brown * If you change the values, note they are used both in comparisons 1114ee7e38e3SLen Brown * (>= PCL__7) and to index pkg_cstate_limit_strings[]. 1115ee7e38e3SLen Brown */ 1116ee7e38e3SLen Brown 1117ee7e38e3SLen Brown #define PCLUKN 0 /* Unknown */ 1118ee7e38e3SLen Brown #define PCLRSV 1 /* Reserved */ 1119ee7e38e3SLen Brown #define PCL__0 2 /* PC0 */ 1120ee7e38e3SLen Brown #define PCL__1 3 /* PC1 */ 1121ee7e38e3SLen Brown #define PCL__2 4 /* PC2 */ 1122ee7e38e3SLen Brown #define PCL__3 5 /* PC3 */ 1123ee7e38e3SLen Brown #define PCL__4 6 /* PC4 */ 1124ee7e38e3SLen Brown #define PCL__6 7 /* PC6 */ 1125ee7e38e3SLen Brown #define PCL_6N 8 /* PC6 No Retention */ 1126ee7e38e3SLen Brown #define PCL_6R 9 /* PC6 Retention */ 1127ee7e38e3SLen Brown #define PCL__7 10 /* PC7 */ 1128ee7e38e3SLen Brown #define PCL_7S 11 /* PC7 Shrink */ 1129*0b2bb692SLen Brown #define PCL__8 12 /* PC8 */ 1130*0b2bb692SLen Brown #define PCL__9 13 /* PC9 */ 1131*0b2bb692SLen Brown #define PCLUNL 14 /* Unlimited */ 1132ee7e38e3SLen Brown 1133ee7e38e3SLen Brown int pkg_cstate_limit = PCLUKN; 1134ee7e38e3SLen Brown char *pkg_cstate_limit_strings[] = { "reserved", "unknown", "pc0", "pc1", "pc2", 1135*0b2bb692SLen Brown "pc3", "pc4", "pc6", "pc6n", "pc6r", "pc7", "pc7s", "pc8", "pc9", "unlimited"}; 1136ee7e38e3SLen Brown 1137ee7e38e3SLen Brown int nhm_pkg_cstate_limits[8] = {PCL__0, PCL__1, PCL__3, PCL__6, PCL__7, PCLRSV, PCLRSV, PCLUNL}; 1138ee7e38e3SLen Brown int snb_pkg_cstate_limits[8] = {PCL__0, PCL__2, PCL_6N, PCL_6R, PCL__7, PCL_7S, PCLRSV, PCLUNL}; 1139ee7e38e3SLen Brown int hsw_pkg_cstate_limits[8] = {PCL__0, PCL__2, PCL__3, PCL__6, PCL__7, PCL_7S, PCLRSV, PCLUNL}; 1140*0b2bb692SLen Brown int skl_pkg_cstate_limits[8] = {PCL__0, PCL__2, PCL__3, PCL__6, PCL__7, PCL_7S, PCL__8, PCL__9}; 1141ee7e38e3SLen Brown int slv_pkg_cstate_limits[8] = {PCL__0, PCL__1, PCLRSV, PCLRSV, PCL__4, PCLRSV, PCL__6, PCL__7}; 1142ee7e38e3SLen Brown int amt_pkg_cstate_limits[8] = {PCL__0, PCL__1, PCL__2, PCLRSV, PCLRSV, PCLRSV, PCL__6, PCL__7}; 1143ee7e38e3SLen Brown int phi_pkg_cstate_limits[8] = {PCL__0, PCL__2, PCL_6N, PCL_6R, PCLRSV, PCLRSV, PCLRSV, PCLUNL}; 1144ee7e38e3SLen Brown 1145fcd17211SLen Brown static void 1146fcd17211SLen Brown dump_nhm_platform_info(void) 1147103a8feaSLen Brown { 1148103a8feaSLen Brown unsigned long long msr; 1149103a8feaSLen Brown unsigned int ratio; 1150103a8feaSLen Brown 11519c63a650SLen Brown get_msr(0, MSR_NHM_PLATFORM_INFO, &msr); 1152103a8feaSLen Brown 1153889facbeSLen Brown fprintf(stderr, "cpu0: MSR_NHM_PLATFORM_INFO: 0x%08llx\n", msr); 11546574a5d5SLen Brown 1155103a8feaSLen Brown ratio = (msr >> 40) & 0xFF; 11568f61f359SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max efficiency frequency\n", 1157103a8feaSLen Brown ratio, bclk, ratio * bclk); 1158103a8feaSLen Brown 1159103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 11608f61f359SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz base frequency\n", 1161103a8feaSLen Brown ratio, bclk, ratio * bclk); 1162103a8feaSLen Brown 116367920418SLen Brown get_msr(0, MSR_IA32_POWER_CTL, &msr); 1164144b44b1SLen Brown fprintf(stderr, "cpu0: MSR_IA32_POWER_CTL: 0x%08llx (C1E auto-promotion: %sabled)\n", 116567920418SLen Brown msr, msr & 0x2 ? "EN" : "DIS"); 116667920418SLen Brown 1167fcd17211SLen Brown return; 1168fcd17211SLen Brown } 1169fcd17211SLen Brown 1170fcd17211SLen Brown static void 1171fcd17211SLen Brown dump_hsw_turbo_ratio_limits(void) 1172fcd17211SLen Brown { 1173fcd17211SLen Brown unsigned long long msr; 1174fcd17211SLen Brown unsigned int ratio; 1175fcd17211SLen Brown 1176fcd17211SLen Brown get_msr(0, MSR_TURBO_RATIO_LIMIT2, &msr); 1177fcd17211SLen Brown 1178fcd17211SLen Brown fprintf(stderr, "cpu0: MSR_TURBO_RATIO_LIMIT2: 0x%08llx\n", msr); 1179fcd17211SLen Brown 1180fcd17211SLen Brown ratio = (msr >> 8) & 0xFF; 1181fcd17211SLen Brown if (ratio) 1182fcd17211SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 18 active cores\n", 1183fcd17211SLen Brown ratio, bclk, ratio * bclk); 1184fcd17211SLen Brown 1185fcd17211SLen Brown ratio = (msr >> 0) & 0xFF; 1186fcd17211SLen Brown if (ratio) 1187fcd17211SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 17 active cores\n", 1188fcd17211SLen Brown ratio, bclk, ratio * bclk); 1189fcd17211SLen Brown return; 1190fcd17211SLen Brown } 1191fcd17211SLen Brown 1192fcd17211SLen Brown static void 1193fcd17211SLen Brown dump_ivt_turbo_ratio_limits(void) 1194fcd17211SLen Brown { 1195fcd17211SLen Brown unsigned long long msr; 1196fcd17211SLen Brown unsigned int ratio; 11976574a5d5SLen Brown 119812bb43c6SLen Brown get_msr(0, MSR_TURBO_RATIO_LIMIT1, &msr); 11996574a5d5SLen Brown 120012bb43c6SLen Brown fprintf(stderr, "cpu0: MSR_TURBO_RATIO_LIMIT1: 0x%08llx\n", msr); 12016574a5d5SLen Brown 12026574a5d5SLen Brown ratio = (msr >> 56) & 0xFF; 12036574a5d5SLen Brown if (ratio) 12046574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 16 active cores\n", 12056574a5d5SLen Brown ratio, bclk, ratio * bclk); 12066574a5d5SLen Brown 12076574a5d5SLen Brown ratio = (msr >> 48) & 0xFF; 12086574a5d5SLen Brown if (ratio) 12096574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 15 active cores\n", 12106574a5d5SLen Brown ratio, bclk, ratio * bclk); 12116574a5d5SLen Brown 12126574a5d5SLen Brown ratio = (msr >> 40) & 0xFF; 12136574a5d5SLen Brown if (ratio) 12146574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 14 active cores\n", 12156574a5d5SLen Brown ratio, bclk, ratio * bclk); 12166574a5d5SLen Brown 12176574a5d5SLen Brown ratio = (msr >> 32) & 0xFF; 12186574a5d5SLen Brown if (ratio) 12196574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 13 active cores\n", 12206574a5d5SLen Brown ratio, bclk, ratio * bclk); 12216574a5d5SLen Brown 12226574a5d5SLen Brown ratio = (msr >> 24) & 0xFF; 12236574a5d5SLen Brown if (ratio) 12246574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 12 active cores\n", 12256574a5d5SLen Brown ratio, bclk, ratio * bclk); 12266574a5d5SLen Brown 12276574a5d5SLen Brown ratio = (msr >> 16) & 0xFF; 12286574a5d5SLen Brown if (ratio) 12296574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 11 active cores\n", 12306574a5d5SLen Brown ratio, bclk, ratio * bclk); 12316574a5d5SLen Brown 12326574a5d5SLen Brown ratio = (msr >> 8) & 0xFF; 12336574a5d5SLen Brown if (ratio) 12346574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 10 active cores\n", 12356574a5d5SLen Brown ratio, bclk, ratio * bclk); 12366574a5d5SLen Brown 12376574a5d5SLen Brown ratio = (msr >> 0) & 0xFF; 12386574a5d5SLen Brown if (ratio) 12396574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 9 active cores\n", 12406574a5d5SLen Brown ratio, bclk, ratio * bclk); 1241103a8feaSLen Brown return; 1242fcd17211SLen Brown } 1243fcd17211SLen Brown 1244fcd17211SLen Brown static void 1245fcd17211SLen Brown dump_nhm_turbo_ratio_limits(void) 1246fcd17211SLen Brown { 1247fcd17211SLen Brown unsigned long long msr; 1248fcd17211SLen Brown unsigned int ratio; 1249103a8feaSLen Brown 125012bb43c6SLen Brown get_msr(0, MSR_TURBO_RATIO_LIMIT, &msr); 1251103a8feaSLen Brown 125212bb43c6SLen Brown fprintf(stderr, "cpu0: MSR_TURBO_RATIO_LIMIT: 0x%08llx\n", msr); 12536574a5d5SLen Brown 12546574a5d5SLen Brown ratio = (msr >> 56) & 0xFF; 12556574a5d5SLen Brown if (ratio) 12566574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 8 active cores\n", 12576574a5d5SLen Brown ratio, bclk, ratio * bclk); 12586574a5d5SLen Brown 12596574a5d5SLen Brown ratio = (msr >> 48) & 0xFF; 12606574a5d5SLen Brown if (ratio) 12616574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 7 active cores\n", 12626574a5d5SLen Brown ratio, bclk, ratio * bclk); 12636574a5d5SLen Brown 12646574a5d5SLen Brown ratio = (msr >> 40) & 0xFF; 12656574a5d5SLen Brown if (ratio) 12666574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 6 active cores\n", 12676574a5d5SLen Brown ratio, bclk, ratio * bclk); 12686574a5d5SLen Brown 12696574a5d5SLen Brown ratio = (msr >> 32) & 0xFF; 12706574a5d5SLen Brown if (ratio) 12716574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 5 active cores\n", 12726574a5d5SLen Brown ratio, bclk, ratio * bclk); 12736574a5d5SLen Brown 1274103a8feaSLen Brown ratio = (msr >> 24) & 0xFF; 1275103a8feaSLen Brown if (ratio) 1276103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 4 active cores\n", 1277103a8feaSLen Brown ratio, bclk, ratio * bclk); 1278103a8feaSLen Brown 1279103a8feaSLen Brown ratio = (msr >> 16) & 0xFF; 1280103a8feaSLen Brown if (ratio) 1281103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 3 active cores\n", 1282103a8feaSLen Brown ratio, bclk, ratio * bclk); 1283103a8feaSLen Brown 1284103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 1285103a8feaSLen Brown if (ratio) 1286103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 2 active cores\n", 1287103a8feaSLen Brown ratio, bclk, ratio * bclk); 1288103a8feaSLen Brown 1289103a8feaSLen Brown ratio = (msr >> 0) & 0xFF; 1290103a8feaSLen Brown if (ratio) 1291103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 1 active cores\n", 1292103a8feaSLen Brown ratio, bclk, ratio * bclk); 1293fcd17211SLen Brown return; 1294fcd17211SLen Brown } 12953a9a941dSLen Brown 1296fcd17211SLen Brown static void 1297fcd17211SLen Brown dump_nhm_cst_cfg(void) 1298fcd17211SLen Brown { 1299fcd17211SLen Brown unsigned long long msr; 1300fcd17211SLen Brown 1301fcd17211SLen Brown get_msr(0, MSR_NHM_SNB_PKG_CST_CFG_CTL, &msr); 1302fcd17211SLen Brown 1303fcd17211SLen Brown #define SNB_C1_AUTO_UNDEMOTE (1UL << 27) 1304fcd17211SLen Brown #define SNB_C3_AUTO_UNDEMOTE (1UL << 28) 1305fcd17211SLen Brown 1306fcd17211SLen Brown fprintf(stderr, "cpu0: MSR_NHM_SNB_PKG_CST_CFG_CTL: 0x%08llx", msr); 1307fcd17211SLen Brown 1308fcd17211SLen Brown fprintf(stderr, " (%s%s%s%s%slocked: pkg-cstate-limit=%d: %s)\n", 1309fcd17211SLen Brown (msr & SNB_C3_AUTO_UNDEMOTE) ? "UNdemote-C3, " : "", 1310fcd17211SLen Brown (msr & SNB_C1_AUTO_UNDEMOTE) ? "UNdemote-C1, " : "", 1311fcd17211SLen Brown (msr & NHM_C3_AUTO_DEMOTE) ? "demote-C3, " : "", 1312fcd17211SLen Brown (msr & NHM_C1_AUTO_DEMOTE) ? "demote-C1, " : "", 1313fcd17211SLen Brown (msr & (1 << 15)) ? "" : "UN", 1314fcd17211SLen Brown (unsigned int)msr & 7, 1315fcd17211SLen Brown pkg_cstate_limit_strings[pkg_cstate_limit]); 1316fcd17211SLen Brown return; 1317103a8feaSLen Brown } 1318103a8feaSLen Brown 1319c98d5d94SLen Brown void free_all_buffers(void) 1320103a8feaSLen Brown { 1321c98d5d94SLen Brown CPU_FREE(cpu_present_set); 1322c98d5d94SLen Brown cpu_present_set = NULL; 1323c98d5d94SLen Brown cpu_present_set = 0; 1324103a8feaSLen Brown 1325c98d5d94SLen Brown CPU_FREE(cpu_affinity_set); 1326c98d5d94SLen Brown cpu_affinity_set = NULL; 1327c98d5d94SLen Brown cpu_affinity_setsize = 0; 1328103a8feaSLen Brown 1329c98d5d94SLen Brown free(thread_even); 1330c98d5d94SLen Brown free(core_even); 1331c98d5d94SLen Brown free(package_even); 1332103a8feaSLen Brown 1333c98d5d94SLen Brown thread_even = NULL; 1334c98d5d94SLen Brown core_even = NULL; 1335c98d5d94SLen Brown package_even = NULL; 1336103a8feaSLen Brown 1337c98d5d94SLen Brown free(thread_odd); 1338c98d5d94SLen Brown free(core_odd); 1339c98d5d94SLen Brown free(package_odd); 1340103a8feaSLen Brown 1341c98d5d94SLen Brown thread_odd = NULL; 1342c98d5d94SLen Brown core_odd = NULL; 1343c98d5d94SLen Brown package_odd = NULL; 1344103a8feaSLen Brown 1345c98d5d94SLen Brown free(output_buffer); 1346c98d5d94SLen Brown output_buffer = NULL; 1347c98d5d94SLen Brown outp = NULL; 1348103a8feaSLen Brown } 1349103a8feaSLen Brown 1350103a8feaSLen Brown /* 135157a42a34SJosh Triplett * Open a file, and exit on failure 135257a42a34SJosh Triplett */ 135357a42a34SJosh Triplett FILE *fopen_or_die(const char *path, const char *mode) 135457a42a34SJosh Triplett { 135557a42a34SJosh Triplett FILE *filep = fopen(path, "r"); 1356b2c95d90SJosh Triplett if (!filep) 1357b2c95d90SJosh Triplett err(1, "%s: open failed", path); 135857a42a34SJosh Triplett return filep; 135957a42a34SJosh Triplett } 136057a42a34SJosh Triplett 136157a42a34SJosh Triplett /* 136295aebc44SJosh Triplett * Parse a file containing a single int. 136395aebc44SJosh Triplett */ 136495aebc44SJosh Triplett int parse_int_file(const char *fmt, ...) 136595aebc44SJosh Triplett { 136695aebc44SJosh Triplett va_list args; 136795aebc44SJosh Triplett char path[PATH_MAX]; 136895aebc44SJosh Triplett FILE *filep; 136995aebc44SJosh Triplett int value; 137095aebc44SJosh Triplett 137195aebc44SJosh Triplett va_start(args, fmt); 137295aebc44SJosh Triplett vsnprintf(path, sizeof(path), fmt, args); 137395aebc44SJosh Triplett va_end(args); 137457a42a34SJosh Triplett filep = fopen_or_die(path, "r"); 1375b2c95d90SJosh Triplett if (fscanf(filep, "%d", &value) != 1) 1376b2c95d90SJosh Triplett err(1, "%s: failed to parse number from file", path); 137795aebc44SJosh Triplett fclose(filep); 137895aebc44SJosh Triplett return value; 137995aebc44SJosh Triplett } 138095aebc44SJosh Triplett 138195aebc44SJosh Triplett /* 1382c98d5d94SLen Brown * cpu_is_first_sibling_in_core(cpu) 1383c98d5d94SLen Brown * return 1 if given CPU is 1st HT sibling in the core 1384103a8feaSLen Brown */ 1385c98d5d94SLen Brown int cpu_is_first_sibling_in_core(int cpu) 1386103a8feaSLen Brown { 138795aebc44SJosh Triplett return cpu == parse_int_file("/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu); 1388c98d5d94SLen Brown } 1389103a8feaSLen Brown 1390c98d5d94SLen Brown /* 1391c98d5d94SLen Brown * cpu_is_first_core_in_package(cpu) 1392c98d5d94SLen Brown * return 1 if given CPU is 1st core in package 1393c98d5d94SLen Brown */ 1394c98d5d94SLen Brown int cpu_is_first_core_in_package(int cpu) 1395c98d5d94SLen Brown { 139695aebc44SJosh Triplett return cpu == parse_int_file("/sys/devices/system/cpu/cpu%d/topology/core_siblings_list", cpu); 1397103a8feaSLen Brown } 1398103a8feaSLen Brown 1399103a8feaSLen Brown int get_physical_package_id(int cpu) 1400103a8feaSLen Brown { 140195aebc44SJosh Triplett return parse_int_file("/sys/devices/system/cpu/cpu%d/topology/physical_package_id", cpu); 1402103a8feaSLen Brown } 1403103a8feaSLen Brown 1404103a8feaSLen Brown int get_core_id(int cpu) 1405103a8feaSLen Brown { 140695aebc44SJosh Triplett return parse_int_file("/sys/devices/system/cpu/cpu%d/topology/core_id", cpu); 1407103a8feaSLen Brown } 1408103a8feaSLen Brown 1409c98d5d94SLen Brown int get_num_ht_siblings(int cpu) 1410c98d5d94SLen Brown { 1411c98d5d94SLen Brown char path[80]; 1412c98d5d94SLen Brown FILE *filep; 1413c98d5d94SLen Brown int sib1, sib2; 1414c98d5d94SLen Brown int matches; 1415c98d5d94SLen Brown char character; 1416c98d5d94SLen Brown 1417c98d5d94SLen Brown sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu); 141857a42a34SJosh Triplett filep = fopen_or_die(path, "r"); 1419103a8feaSLen Brown /* 1420c98d5d94SLen Brown * file format: 1421c98d5d94SLen Brown * if a pair of number with a character between: 2 siblings (eg. 1-2, or 1,4) 1422c98d5d94SLen Brown * otherwinse 1 sibling (self). 1423c98d5d94SLen Brown */ 1424c98d5d94SLen Brown matches = fscanf(filep, "%d%c%d\n", &sib1, &character, &sib2); 1425c98d5d94SLen Brown 1426c98d5d94SLen Brown fclose(filep); 1427c98d5d94SLen Brown 1428c98d5d94SLen Brown if (matches == 3) 1429c98d5d94SLen Brown return 2; 1430c98d5d94SLen Brown else 1431c98d5d94SLen Brown return 1; 1432c98d5d94SLen Brown } 1433c98d5d94SLen Brown 1434c98d5d94SLen Brown /* 1435c98d5d94SLen Brown * run func(thread, core, package) in topology order 1436c98d5d94SLen Brown * skip non-present cpus 1437103a8feaSLen Brown */ 1438103a8feaSLen Brown 1439c98d5d94SLen Brown int for_all_cpus_2(int (func)(struct thread_data *, struct core_data *, 1440c98d5d94SLen Brown struct pkg_data *, struct thread_data *, struct core_data *, 1441c98d5d94SLen Brown struct pkg_data *), struct thread_data *thread_base, 1442c98d5d94SLen Brown struct core_data *core_base, struct pkg_data *pkg_base, 1443c98d5d94SLen Brown struct thread_data *thread_base2, struct core_data *core_base2, 1444c98d5d94SLen Brown struct pkg_data *pkg_base2) 1445c98d5d94SLen Brown { 1446c98d5d94SLen Brown int retval, pkg_no, core_no, thread_no; 1447c98d5d94SLen Brown 1448c98d5d94SLen Brown for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) { 1449c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 1450c98d5d94SLen Brown for (thread_no = 0; thread_no < 1451c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 1452c98d5d94SLen Brown struct thread_data *t, *t2; 1453c98d5d94SLen Brown struct core_data *c, *c2; 1454c98d5d94SLen Brown struct pkg_data *p, *p2; 1455c98d5d94SLen Brown 1456c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 1457c98d5d94SLen Brown 1458c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 1459c98d5d94SLen Brown continue; 1460c98d5d94SLen Brown 1461c98d5d94SLen Brown t2 = GET_THREAD(thread_base2, thread_no, core_no, pkg_no); 1462c98d5d94SLen Brown 1463c98d5d94SLen Brown c = GET_CORE(core_base, core_no, pkg_no); 1464c98d5d94SLen Brown c2 = GET_CORE(core_base2, core_no, pkg_no); 1465c98d5d94SLen Brown 1466c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 1467c98d5d94SLen Brown p2 = GET_PKG(pkg_base2, pkg_no); 1468c98d5d94SLen Brown 1469c98d5d94SLen Brown retval = func(t, c, p, t2, c2, p2); 1470c98d5d94SLen Brown if (retval) 1471c98d5d94SLen Brown return retval; 1472c98d5d94SLen Brown } 1473c98d5d94SLen Brown } 1474c98d5d94SLen Brown } 1475c98d5d94SLen Brown return 0; 1476c98d5d94SLen Brown } 1477c98d5d94SLen Brown 1478c98d5d94SLen Brown /* 1479c98d5d94SLen Brown * run func(cpu) on every cpu in /proc/stat 1480c98d5d94SLen Brown * return max_cpu number 1481c98d5d94SLen Brown */ 1482c98d5d94SLen Brown int for_all_proc_cpus(int (func)(int)) 1483103a8feaSLen Brown { 1484103a8feaSLen Brown FILE *fp; 1485c98d5d94SLen Brown int cpu_num; 1486103a8feaSLen Brown int retval; 1487103a8feaSLen Brown 148857a42a34SJosh Triplett fp = fopen_or_die(proc_stat, "r"); 1489103a8feaSLen Brown 1490103a8feaSLen Brown retval = fscanf(fp, "cpu %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n"); 1491b2c95d90SJosh Triplett if (retval != 0) 1492b2c95d90SJosh Triplett err(1, "%s: failed to parse format", proc_stat); 1493103a8feaSLen Brown 1494c98d5d94SLen Brown while (1) { 1495c98d5d94SLen Brown retval = fscanf(fp, "cpu%u %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n", &cpu_num); 1496103a8feaSLen Brown if (retval != 1) 1497103a8feaSLen Brown break; 1498103a8feaSLen Brown 1499c98d5d94SLen Brown retval = func(cpu_num); 1500c98d5d94SLen Brown if (retval) { 1501c98d5d94SLen Brown fclose(fp); 1502c98d5d94SLen Brown return(retval); 1503c98d5d94SLen Brown } 1504103a8feaSLen Brown } 1505103a8feaSLen Brown fclose(fp); 1506c98d5d94SLen Brown return 0; 1507103a8feaSLen Brown } 1508103a8feaSLen Brown 1509103a8feaSLen Brown void re_initialize(void) 1510103a8feaSLen Brown { 1511c98d5d94SLen Brown free_all_buffers(); 1512c98d5d94SLen Brown setup_all_buffers(); 1513c98d5d94SLen Brown printf("turbostat: re-initialized with num_cpus %d\n", topo.num_cpus); 1514103a8feaSLen Brown } 1515103a8feaSLen Brown 1516c98d5d94SLen Brown 1517103a8feaSLen Brown /* 1518c98d5d94SLen Brown * count_cpus() 1519c98d5d94SLen Brown * remember the last one seen, it will be the max 1520103a8feaSLen Brown */ 1521c98d5d94SLen Brown int count_cpus(int cpu) 1522103a8feaSLen Brown { 1523c98d5d94SLen Brown if (topo.max_cpu_num < cpu) 1524c98d5d94SLen Brown topo.max_cpu_num = cpu; 1525103a8feaSLen Brown 1526c98d5d94SLen Brown topo.num_cpus += 1; 1527c98d5d94SLen Brown return 0; 1528103a8feaSLen Brown } 1529c98d5d94SLen Brown int mark_cpu_present(int cpu) 1530c98d5d94SLen Brown { 1531c98d5d94SLen Brown CPU_SET_S(cpu, cpu_present_setsize, cpu_present_set); 153215aaa346SLen Brown return 0; 1533103a8feaSLen Brown } 1534103a8feaSLen Brown 1535103a8feaSLen Brown void turbostat_loop() 1536103a8feaSLen Brown { 1537c98d5d94SLen Brown int retval; 1538e52966c0SLen Brown int restarted = 0; 1539c98d5d94SLen Brown 1540103a8feaSLen Brown restart: 1541e52966c0SLen Brown restarted++; 1542e52966c0SLen Brown 1543c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 1544d91bb17cSLen Brown if (retval < -1) { 1545d91bb17cSLen Brown exit(retval); 1546d91bb17cSLen Brown } else if (retval == -1) { 1547e52966c0SLen Brown if (restarted > 1) { 1548e52966c0SLen Brown exit(retval); 1549e52966c0SLen Brown } 1550c98d5d94SLen Brown re_initialize(); 1551c98d5d94SLen Brown goto restart; 1552c98d5d94SLen Brown } 1553e52966c0SLen Brown restarted = 0; 1554103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 1555103a8feaSLen Brown 1556103a8feaSLen Brown while (1) { 1557c98d5d94SLen Brown if (for_all_proc_cpus(cpu_is_not_present)) { 1558103a8feaSLen Brown re_initialize(); 1559103a8feaSLen Brown goto restart; 1560103a8feaSLen Brown } 1561103a8feaSLen Brown sleep(interval_sec); 1562c98d5d94SLen Brown retval = for_all_cpus(get_counters, ODD_COUNTERS); 1563d91bb17cSLen Brown if (retval < -1) { 1564d91bb17cSLen Brown exit(retval); 1565d91bb17cSLen Brown } else if (retval == -1) { 156615aaa346SLen Brown re_initialize(); 156715aaa346SLen Brown goto restart; 156815aaa346SLen Brown } 1569103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 1570103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 1571c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 1572c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 1573c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 1574c98d5d94SLen Brown flush_stdout(); 157515aaa346SLen Brown sleep(interval_sec); 1576c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 1577d91bb17cSLen Brown if (retval < -1) { 1578d91bb17cSLen Brown exit(retval); 1579d91bb17cSLen Brown } else if (retval == -1) { 1580103a8feaSLen Brown re_initialize(); 1581103a8feaSLen Brown goto restart; 1582103a8feaSLen Brown } 1583103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 1584103a8feaSLen Brown timersub(&tv_even, &tv_odd, &tv_delta); 1585c98d5d94SLen Brown for_all_cpus_2(delta_cpu, EVEN_COUNTERS, ODD_COUNTERS); 1586c98d5d94SLen Brown compute_average(ODD_COUNTERS); 1587c98d5d94SLen Brown format_all_counters(ODD_COUNTERS); 1588c98d5d94SLen Brown flush_stdout(); 1589103a8feaSLen Brown } 1590103a8feaSLen Brown } 1591103a8feaSLen Brown 1592103a8feaSLen Brown void check_dev_msr() 1593103a8feaSLen Brown { 1594103a8feaSLen Brown struct stat sb; 1595103a8feaSLen Brown 1596b2c95d90SJosh Triplett if (stat("/dev/cpu/0/msr", &sb)) 1597a21d38c8SLen Brown if (system("/sbin/modprobe msr > /dev/null 2>&1")) 1598d7899447SLen Brown err(-5, "no /dev/cpu/0/msr, Try \"# modprobe msr\" "); 1599103a8feaSLen Brown } 1600103a8feaSLen Brown 160198481e79SLen Brown void check_permissions() 1602103a8feaSLen Brown { 160398481e79SLen Brown struct __user_cap_header_struct cap_header_data; 160498481e79SLen Brown cap_user_header_t cap_header = &cap_header_data; 160598481e79SLen Brown struct __user_cap_data_struct cap_data_data; 160698481e79SLen Brown cap_user_data_t cap_data = &cap_data_data; 160798481e79SLen Brown extern int capget(cap_user_header_t hdrp, cap_user_data_t datap); 160898481e79SLen Brown int do_exit = 0; 160998481e79SLen Brown 161098481e79SLen Brown /* check for CAP_SYS_RAWIO */ 161198481e79SLen Brown cap_header->pid = getpid(); 161298481e79SLen Brown cap_header->version = _LINUX_CAPABILITY_VERSION; 161398481e79SLen Brown if (capget(cap_header, cap_data) < 0) 161498481e79SLen Brown err(-6, "capget(2) failed"); 161598481e79SLen Brown 161698481e79SLen Brown if ((cap_data->effective & (1 << CAP_SYS_RAWIO)) == 0) { 161798481e79SLen Brown do_exit++; 161898481e79SLen Brown warnx("capget(CAP_SYS_RAWIO) failed," 161998481e79SLen Brown " try \"# setcap cap_sys_rawio=ep %s\"", progname); 162098481e79SLen Brown } 162198481e79SLen Brown 162298481e79SLen Brown /* test file permissions */ 162398481e79SLen Brown if (euidaccess("/dev/cpu/0/msr", R_OK)) { 162498481e79SLen Brown do_exit++; 162598481e79SLen Brown warn("/dev/cpu/0/msr open failed, try chown or chmod +r /dev/cpu/*/msr"); 162698481e79SLen Brown } 162798481e79SLen Brown 162898481e79SLen Brown /* if all else fails, thell them to be root */ 162998481e79SLen Brown if (do_exit) 1630b2c95d90SJosh Triplett if (getuid() != 0) 1631d7899447SLen Brown warnx("... or simply run as root"); 163298481e79SLen Brown 163398481e79SLen Brown if (do_exit) 163498481e79SLen Brown exit(-6); 1635103a8feaSLen Brown } 1636103a8feaSLen Brown 1637d7899447SLen Brown /* 1638d7899447SLen Brown * NHM adds support for additional MSRs: 1639d7899447SLen Brown * 1640d7899447SLen Brown * MSR_SMI_COUNT 0x00000034 1641d7899447SLen Brown * 1642d7899447SLen Brown * MSR_NHM_PLATFORM_INFO 0x000000ce 1643d7899447SLen Brown * MSR_NHM_SNB_PKG_CST_CFG_CTL 0x000000e2 1644d7899447SLen Brown * 1645d7899447SLen Brown * MSR_PKG_C3_RESIDENCY 0x000003f8 1646d7899447SLen Brown * MSR_PKG_C6_RESIDENCY 0x000003f9 1647d7899447SLen Brown * MSR_CORE_C3_RESIDENCY 0x000003fc 1648d7899447SLen Brown * MSR_CORE_C6_RESIDENCY 0x000003fd 1649d7899447SLen Brown * 1650ee7e38e3SLen Brown * Side effect: 1651ee7e38e3SLen Brown * sets global pkg_cstate_limit to decode MSR_NHM_SNB_PKG_CST_CFG_CTL 1652d7899447SLen Brown */ 1653ee7e38e3SLen Brown int probe_nhm_msrs(unsigned int family, unsigned int model) 1654103a8feaSLen Brown { 1655ee7e38e3SLen Brown unsigned long long msr; 1656ee7e38e3SLen Brown int *pkg_cstate_limits; 1657ee7e38e3SLen Brown 1658103a8feaSLen Brown if (!genuine_intel) 1659103a8feaSLen Brown return 0; 1660103a8feaSLen Brown 1661103a8feaSLen Brown if (family != 6) 1662103a8feaSLen Brown return 0; 1663103a8feaSLen Brown 1664103a8feaSLen Brown switch (model) { 1665103a8feaSLen Brown case 0x1A: /* Core i7, Xeon 5500 series - Bloomfield, Gainstown NHM-EP */ 1666103a8feaSLen Brown case 0x1E: /* Core i7 and i5 Processor - Clarksfield, Lynnfield, Jasper Forest */ 1667103a8feaSLen Brown case 0x1F: /* Core i7 and i5 Processor - Nehalem */ 1668103a8feaSLen Brown case 0x25: /* Westmere Client - Clarkdale, Arrandale */ 1669103a8feaSLen Brown case 0x2C: /* Westmere EP - Gulftown */ 1670ee7e38e3SLen Brown case 0x2E: /* Nehalem-EX Xeon - Beckton */ 1671ee7e38e3SLen Brown case 0x2F: /* Westmere-EX Xeon - Eagleton */ 1672ee7e38e3SLen Brown pkg_cstate_limits = nhm_pkg_cstate_limits; 1673ee7e38e3SLen Brown break; 1674103a8feaSLen Brown case 0x2A: /* SNB */ 1675103a8feaSLen Brown case 0x2D: /* SNB Xeon */ 1676553575f1SLen Brown case 0x3A: /* IVB */ 16771300651bSLen Brown case 0x3E: /* IVB Xeon */ 1678ee7e38e3SLen Brown pkg_cstate_limits = snb_pkg_cstate_limits; 1679ee7e38e3SLen Brown break; 168070b43400SLen Brown case 0x3C: /* HSW */ 1681e6f9bb3cSLen Brown case 0x3F: /* HSX */ 168270b43400SLen Brown case 0x45: /* HSW */ 1683149c2319SLen Brown case 0x46: /* HSW */ 16844e8e863fSLen Brown case 0x3D: /* BDW */ 168548a0631cSLen Brown case 0x47: /* BDW */ 16864e8e863fSLen Brown case 0x4F: /* BDX */ 16874e8e863fSLen Brown case 0x56: /* BDX-DE */ 1688*0b2bb692SLen Brown case 0x4E: /* SKL */ 1689*0b2bb692SLen Brown case 0x5E: /* SKL */ 1690ee7e38e3SLen Brown pkg_cstate_limits = hsw_pkg_cstate_limits; 1691ee7e38e3SLen Brown break; 1692ee7e38e3SLen Brown case 0x37: /* BYT */ 1693ee7e38e3SLen Brown case 0x4D: /* AVN */ 1694ee7e38e3SLen Brown pkg_cstate_limits = slv_pkg_cstate_limits; 1695ee7e38e3SLen Brown break; 1696ee7e38e3SLen Brown case 0x4C: /* AMT */ 1697ee7e38e3SLen Brown pkg_cstate_limits = amt_pkg_cstate_limits; 1698ee7e38e3SLen Brown break; 1699ee7e38e3SLen Brown case 0x57: /* PHI */ 1700ee7e38e3SLen Brown pkg_cstate_limits = phi_pkg_cstate_limits; 1701ee7e38e3SLen Brown break; 1702103a8feaSLen Brown default: 1703103a8feaSLen Brown return 0; 1704103a8feaSLen Brown } 1705ee7e38e3SLen Brown get_msr(0, MSR_NHM_SNB_PKG_CST_CFG_CTL, &msr); 1706ee7e38e3SLen Brown 1707ee7e38e3SLen Brown pkg_cstate_limit = pkg_cstate_limits[msr & 0x7]; 1708ee7e38e3SLen Brown 1709ee7e38e3SLen Brown return 1; 1710103a8feaSLen Brown } 1711d7899447SLen Brown int has_nhm_turbo_ratio_limit(unsigned int family, unsigned int model) 1712d7899447SLen Brown { 1713d7899447SLen Brown switch (model) { 1714d7899447SLen Brown /* Nehalem compatible, but do not include turbo-ratio limit support */ 1715d7899447SLen Brown case 0x2E: /* Nehalem-EX Xeon - Beckton */ 1716d7899447SLen Brown case 0x2F: /* Westmere-EX Xeon - Eagleton */ 1717d7899447SLen Brown return 0; 1718d7899447SLen Brown default: 1719d7899447SLen Brown return 1; 1720d7899447SLen Brown } 1721d7899447SLen Brown } 17226574a5d5SLen Brown int has_ivt_turbo_ratio_limit(unsigned int family, unsigned int model) 17236574a5d5SLen Brown { 17246574a5d5SLen Brown if (!genuine_intel) 17256574a5d5SLen Brown return 0; 17266574a5d5SLen Brown 17276574a5d5SLen Brown if (family != 6) 17286574a5d5SLen Brown return 0; 17296574a5d5SLen Brown 17306574a5d5SLen Brown switch (model) { 17316574a5d5SLen Brown case 0x3E: /* IVB Xeon */ 1732fcd17211SLen Brown case 0x3F: /* HSW Xeon */ 17336574a5d5SLen Brown return 1; 17346574a5d5SLen Brown default: 17356574a5d5SLen Brown return 0; 17366574a5d5SLen Brown } 17376574a5d5SLen Brown } 1738fcd17211SLen Brown int has_hsw_turbo_ratio_limit(unsigned int family, unsigned int model) 1739fcd17211SLen Brown { 1740fcd17211SLen Brown if (!genuine_intel) 1741fcd17211SLen Brown return 0; 1742fcd17211SLen Brown 1743fcd17211SLen Brown if (family != 6) 1744fcd17211SLen Brown return 0; 1745fcd17211SLen Brown 1746fcd17211SLen Brown switch (model) { 1747fcd17211SLen Brown case 0x3F: /* HSW Xeon */ 1748fcd17211SLen Brown return 1; 1749fcd17211SLen Brown default: 1750fcd17211SLen Brown return 0; 1751fcd17211SLen Brown } 1752fcd17211SLen Brown } 1753fcd17211SLen Brown 1754fcd17211SLen Brown static void 1755fcd17211SLen Brown dump_cstate_pstate_config_info(family, model) 1756fcd17211SLen Brown { 1757fcd17211SLen Brown if (!do_nhm_platform_info) 1758fcd17211SLen Brown return; 1759fcd17211SLen Brown 1760fcd17211SLen Brown dump_nhm_platform_info(); 1761fcd17211SLen Brown 1762fcd17211SLen Brown if (has_hsw_turbo_ratio_limit(family, model)) 1763fcd17211SLen Brown dump_hsw_turbo_ratio_limits(); 1764fcd17211SLen Brown 1765fcd17211SLen Brown if (has_ivt_turbo_ratio_limit(family, model)) 1766fcd17211SLen Brown dump_ivt_turbo_ratio_limits(); 1767fcd17211SLen Brown 1768fcd17211SLen Brown if (has_nhm_turbo_ratio_limit(family, model)) 1769fcd17211SLen Brown dump_nhm_turbo_ratio_limits(); 1770fcd17211SLen Brown 1771fcd17211SLen Brown dump_nhm_cst_cfg(); 1772fcd17211SLen Brown } 1773fcd17211SLen Brown 17746574a5d5SLen Brown 1775889facbeSLen Brown /* 1776889facbeSLen Brown * print_epb() 1777889facbeSLen Brown * Decode the ENERGY_PERF_BIAS MSR 1778889facbeSLen Brown */ 1779889facbeSLen Brown int print_epb(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1780889facbeSLen Brown { 1781889facbeSLen Brown unsigned long long msr; 1782889facbeSLen Brown char *epb_string; 1783889facbeSLen Brown int cpu; 1784889facbeSLen Brown 1785889facbeSLen Brown if (!has_epb) 1786889facbeSLen Brown return 0; 1787889facbeSLen Brown 1788889facbeSLen Brown cpu = t->cpu_id; 1789889facbeSLen Brown 1790889facbeSLen Brown /* EPB is per-package */ 1791889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1792889facbeSLen Brown return 0; 1793889facbeSLen Brown 1794889facbeSLen Brown if (cpu_migrate(cpu)) { 1795889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1796889facbeSLen Brown return -1; 1797889facbeSLen Brown } 1798889facbeSLen Brown 1799889facbeSLen Brown if (get_msr(cpu, MSR_IA32_ENERGY_PERF_BIAS, &msr)) 1800889facbeSLen Brown return 0; 1801889facbeSLen Brown 1802889facbeSLen Brown switch (msr & 0x7) { 1803889facbeSLen Brown case ENERGY_PERF_BIAS_PERFORMANCE: 1804889facbeSLen Brown epb_string = "performance"; 1805889facbeSLen Brown break; 1806889facbeSLen Brown case ENERGY_PERF_BIAS_NORMAL: 1807889facbeSLen Brown epb_string = "balanced"; 1808889facbeSLen Brown break; 1809889facbeSLen Brown case ENERGY_PERF_BIAS_POWERSAVE: 1810889facbeSLen Brown epb_string = "powersave"; 1811889facbeSLen Brown break; 1812889facbeSLen Brown default: 1813889facbeSLen Brown epb_string = "custom"; 1814889facbeSLen Brown break; 1815889facbeSLen Brown } 1816889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_ENERGY_PERF_BIAS: 0x%08llx (%s)\n", cpu, msr, epb_string); 1817889facbeSLen Brown 1818889facbeSLen Brown return 0; 1819889facbeSLen Brown } 1820889facbeSLen Brown 18213a9a941dSLen Brown /* 18223a9a941dSLen Brown * print_perf_limit() 18233a9a941dSLen Brown */ 18243a9a941dSLen Brown int print_perf_limit(struct thread_data *t, struct core_data *c, struct pkg_data *p) 18253a9a941dSLen Brown { 18263a9a941dSLen Brown unsigned long long msr; 18273a9a941dSLen Brown int cpu; 18283a9a941dSLen Brown 18293a9a941dSLen Brown cpu = t->cpu_id; 18303a9a941dSLen Brown 18313a9a941dSLen Brown /* per-package */ 18323a9a941dSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 18333a9a941dSLen Brown return 0; 18343a9a941dSLen Brown 18353a9a941dSLen Brown if (cpu_migrate(cpu)) { 18363a9a941dSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 18373a9a941dSLen Brown return -1; 18383a9a941dSLen Brown } 18393a9a941dSLen Brown 18403a9a941dSLen Brown if (do_core_perf_limit_reasons) { 18413a9a941dSLen Brown get_msr(cpu, MSR_CORE_PERF_LIMIT_REASONS, &msr); 18423a9a941dSLen Brown fprintf(stderr, "cpu%d: MSR_CORE_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr); 18433a9a941dSLen Brown fprintf(stderr, " (Active: %s%s%s%s%s%s%s%s%s%s%s%s%s%s)", 1844e33cbe85SLen Brown (msr & 1 << 15) ? "bit15, " : "", 18453a9a941dSLen Brown (msr & 1 << 14) ? "bit14, " : "", 1846e33cbe85SLen Brown (msr & 1 << 13) ? "Transitions, " : "", 1847e33cbe85SLen Brown (msr & 1 << 12) ? "MultiCoreTurbo, " : "", 1848e33cbe85SLen Brown (msr & 1 << 11) ? "PkgPwrL2, " : "", 1849e33cbe85SLen Brown (msr & 1 << 10) ? "PkgPwrL1, " : "", 1850e33cbe85SLen Brown (msr & 1 << 9) ? "CorePwr, " : "", 1851e33cbe85SLen Brown (msr & 1 << 8) ? "Amps, " : "", 1852e33cbe85SLen Brown (msr & 1 << 6) ? "VR-Therm, " : "", 1853e33cbe85SLen Brown (msr & 1 << 5) ? "Auto-HWP, " : "", 1854e33cbe85SLen Brown (msr & 1 << 4) ? "Graphics, " : "", 1855e33cbe85SLen Brown (msr & 1 << 2) ? "bit2, " : "", 1856e33cbe85SLen Brown (msr & 1 << 1) ? "ThermStatus, " : "", 1857e33cbe85SLen Brown (msr & 1 << 0) ? "PROCHOT, " : ""); 18583a9a941dSLen Brown fprintf(stderr, " (Logged: %s%s%s%s%s%s%s%s%s%s%s%s%s%s)\n", 1859e33cbe85SLen Brown (msr & 1 << 31) ? "bit31, " : "", 18603a9a941dSLen Brown (msr & 1 << 30) ? "bit30, " : "", 1861e33cbe85SLen Brown (msr & 1 << 29) ? "Transitions, " : "", 1862e33cbe85SLen Brown (msr & 1 << 28) ? "MultiCoreTurbo, " : "", 1863e33cbe85SLen Brown (msr & 1 << 27) ? "PkgPwrL2, " : "", 1864e33cbe85SLen Brown (msr & 1 << 26) ? "PkgPwrL1, " : "", 1865e33cbe85SLen Brown (msr & 1 << 25) ? "CorePwr, " : "", 1866e33cbe85SLen Brown (msr & 1 << 24) ? "Amps, " : "", 1867e33cbe85SLen Brown (msr & 1 << 22) ? "VR-Therm, " : "", 1868e33cbe85SLen Brown (msr & 1 << 21) ? "Auto-HWP, " : "", 1869e33cbe85SLen Brown (msr & 1 << 20) ? "Graphics, " : "", 1870e33cbe85SLen Brown (msr & 1 << 18) ? "bit18, " : "", 1871e33cbe85SLen Brown (msr & 1 << 17) ? "ThermStatus, " : "", 1872e33cbe85SLen Brown (msr & 1 << 16) ? "PROCHOT, " : ""); 18733a9a941dSLen Brown 18743a9a941dSLen Brown } 18753a9a941dSLen Brown if (do_gfx_perf_limit_reasons) { 18763a9a941dSLen Brown get_msr(cpu, MSR_GFX_PERF_LIMIT_REASONS, &msr); 18773a9a941dSLen Brown fprintf(stderr, "cpu%d: MSR_GFX_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr); 18783a9a941dSLen Brown fprintf(stderr, " (Active: %s%s%s%s%s%s%s%s)", 18793a9a941dSLen Brown (msr & 1 << 0) ? "PROCHOT, " : "", 18803a9a941dSLen Brown (msr & 1 << 1) ? "ThermStatus, " : "", 18813a9a941dSLen Brown (msr & 1 << 4) ? "Graphics, " : "", 18823a9a941dSLen Brown (msr & 1 << 6) ? "VR-Therm, " : "", 18833a9a941dSLen Brown (msr & 1 << 8) ? "Amps, " : "", 18843a9a941dSLen Brown (msr & 1 << 9) ? "GFXPwr, " : "", 18853a9a941dSLen Brown (msr & 1 << 10) ? "PkgPwrL1, " : "", 18863a9a941dSLen Brown (msr & 1 << 11) ? "PkgPwrL2, " : ""); 18873a9a941dSLen Brown fprintf(stderr, " (Logged: %s%s%s%s%s%s%s%s)\n", 18883a9a941dSLen Brown (msr & 1 << 16) ? "PROCHOT, " : "", 18893a9a941dSLen Brown (msr & 1 << 17) ? "ThermStatus, " : "", 18903a9a941dSLen Brown (msr & 1 << 20) ? "Graphics, " : "", 18913a9a941dSLen Brown (msr & 1 << 22) ? "VR-Therm, " : "", 18923a9a941dSLen Brown (msr & 1 << 24) ? "Amps, " : "", 18933a9a941dSLen Brown (msr & 1 << 25) ? "GFXPwr, " : "", 18943a9a941dSLen Brown (msr & 1 << 26) ? "PkgPwrL1, " : "", 18953a9a941dSLen Brown (msr & 1 << 27) ? "PkgPwrL2, " : ""); 18963a9a941dSLen Brown } 18973a9a941dSLen Brown if (do_ring_perf_limit_reasons) { 18983a9a941dSLen Brown get_msr(cpu, MSR_RING_PERF_LIMIT_REASONS, &msr); 18993a9a941dSLen Brown fprintf(stderr, "cpu%d: MSR_RING_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr); 19003a9a941dSLen Brown fprintf(stderr, " (Active: %s%s%s%s%s%s)", 19013a9a941dSLen Brown (msr & 1 << 0) ? "PROCHOT, " : "", 19023a9a941dSLen Brown (msr & 1 << 1) ? "ThermStatus, " : "", 19033a9a941dSLen Brown (msr & 1 << 6) ? "VR-Therm, " : "", 19043a9a941dSLen Brown (msr & 1 << 8) ? "Amps, " : "", 19053a9a941dSLen Brown (msr & 1 << 10) ? "PkgPwrL1, " : "", 19063a9a941dSLen Brown (msr & 1 << 11) ? "PkgPwrL2, " : ""); 19073a9a941dSLen Brown fprintf(stderr, " (Logged: %s%s%s%s%s%s)\n", 19083a9a941dSLen Brown (msr & 1 << 16) ? "PROCHOT, " : "", 19093a9a941dSLen Brown (msr & 1 << 17) ? "ThermStatus, " : "", 19103a9a941dSLen Brown (msr & 1 << 22) ? "VR-Therm, " : "", 19113a9a941dSLen Brown (msr & 1 << 24) ? "Amps, " : "", 19123a9a941dSLen Brown (msr & 1 << 26) ? "PkgPwrL1, " : "", 19133a9a941dSLen Brown (msr & 1 << 27) ? "PkgPwrL2, " : ""); 19143a9a941dSLen Brown } 19153a9a941dSLen Brown return 0; 19163a9a941dSLen Brown } 19173a9a941dSLen Brown 1918889facbeSLen Brown #define RAPL_POWER_GRANULARITY 0x7FFF /* 15 bit power granularity */ 1919889facbeSLen Brown #define RAPL_TIME_GRANULARITY 0x3F /* 6 bit time granularity */ 1920889facbeSLen Brown 1921144b44b1SLen Brown double get_tdp(model) 1922144b44b1SLen Brown { 1923144b44b1SLen Brown unsigned long long msr; 1924144b44b1SLen Brown 1925144b44b1SLen Brown if (do_rapl & RAPL_PKG_POWER_INFO) 1926144b44b1SLen Brown if (!get_msr(0, MSR_PKG_POWER_INFO, &msr)) 1927144b44b1SLen Brown return ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units; 1928144b44b1SLen Brown 1929144b44b1SLen Brown switch (model) { 1930144b44b1SLen Brown case 0x37: 1931144b44b1SLen Brown case 0x4D: 1932144b44b1SLen Brown return 30.0; 1933144b44b1SLen Brown default: 1934144b44b1SLen Brown return 135.0; 1935144b44b1SLen Brown } 1936144b44b1SLen Brown } 1937144b44b1SLen Brown 1938144b44b1SLen Brown 1939889facbeSLen Brown /* 1940889facbeSLen Brown * rapl_probe() 1941889facbeSLen Brown * 1942144b44b1SLen Brown * sets do_rapl, rapl_power_units, rapl_energy_units, rapl_time_units 1943889facbeSLen Brown */ 1944889facbeSLen Brown void rapl_probe(unsigned int family, unsigned int model) 1945889facbeSLen Brown { 1946889facbeSLen Brown unsigned long long msr; 1947144b44b1SLen Brown unsigned int time_unit; 1948889facbeSLen Brown double tdp; 1949889facbeSLen Brown 1950889facbeSLen Brown if (!genuine_intel) 1951889facbeSLen Brown return; 1952889facbeSLen Brown 1953889facbeSLen Brown if (family != 6) 1954889facbeSLen Brown return; 1955889facbeSLen Brown 1956889facbeSLen Brown switch (model) { 1957889facbeSLen Brown case 0x2A: 1958889facbeSLen Brown case 0x3A: 195970b43400SLen Brown case 0x3C: /* HSW */ 196070b43400SLen Brown case 0x45: /* HSW */ 1961149c2319SLen Brown case 0x46: /* HSW */ 19624e8e863fSLen Brown case 0x3D: /* BDW */ 196348a0631cSLen Brown case 0x47: /* BDW */ 1964144b44b1SLen Brown do_rapl = RAPL_PKG | RAPL_CORES | RAPL_CORE_POLICY | RAPL_GFX | RAPL_PKG_POWER_INFO; 1965889facbeSLen Brown break; 1966*0b2bb692SLen Brown case 0x4E: /* SKL */ 1967*0b2bb692SLen Brown case 0x5E: /* SKL */ 1968*0b2bb692SLen Brown do_rapl = RAPL_PKG | RAPL_DRAM | RAPL_DRAM_PERF_STATUS | RAPL_PKG_PERF_STATUS | RAPL_PKG_POWER_INFO; 1969*0b2bb692SLen Brown break; 1970e6f9bb3cSLen Brown case 0x3F: /* HSX */ 19714e8e863fSLen Brown case 0x4F: /* BDX */ 19724e8e863fSLen Brown case 0x56: /* BDX-DE */ 1973*0b2bb692SLen Brown do_rapl = RAPL_PKG | RAPL_DRAM | RAPL_DRAM_POWER_INFO | RAPL_DRAM_PERF_STATUS | RAPL_PKG_PERF_STATUS | RAPL_PKG_POWER_INFO; 1974e6f9bb3cSLen Brown break; 1975889facbeSLen Brown case 0x2D: 1976889facbeSLen Brown case 0x3E: 1977*0b2bb692SLen Brown do_rapl = RAPL_PKG | RAPL_CORES | RAPL_CORE_POLICY | RAPL_DRAM | RAPL_DRAM_POWER_INFO | RAPL_PKG_PERF_STATUS | RAPL_DRAM_PERF_STATUS | RAPL_PKG_POWER_INFO; 1978144b44b1SLen Brown break; 1979144b44b1SLen Brown case 0x37: /* BYT */ 1980144b44b1SLen Brown case 0x4D: /* AVN */ 1981144b44b1SLen Brown do_rapl = RAPL_PKG | RAPL_CORES ; 1982889facbeSLen Brown break; 1983889facbeSLen Brown default: 1984889facbeSLen Brown return; 1985889facbeSLen Brown } 1986889facbeSLen Brown 1987889facbeSLen Brown /* units on package 0, verify later other packages match */ 1988889facbeSLen Brown if (get_msr(0, MSR_RAPL_POWER_UNIT, &msr)) 1989889facbeSLen Brown return; 1990889facbeSLen Brown 1991889facbeSLen Brown rapl_power_units = 1.0 / (1 << (msr & 0xF)); 1992144b44b1SLen Brown if (model == 0x37) 1993144b44b1SLen Brown rapl_energy_units = 1.0 * (1 << (msr >> 8 & 0x1F)) / 1000000; 1994144b44b1SLen Brown else 1995889facbeSLen Brown rapl_energy_units = 1.0 / (1 << (msr >> 8 & 0x1F)); 1996889facbeSLen Brown 1997144b44b1SLen Brown time_unit = msr >> 16 & 0xF; 1998144b44b1SLen Brown if (time_unit == 0) 1999144b44b1SLen Brown time_unit = 0xA; 2000889facbeSLen Brown 2001144b44b1SLen Brown rapl_time_units = 1.0 / (1 << (time_unit)); 2002144b44b1SLen Brown 2003144b44b1SLen Brown tdp = get_tdp(model); 2004889facbeSLen Brown 2005889facbeSLen Brown rapl_joule_counter_range = 0xFFFFFFFF * rapl_energy_units / tdp; 2006d8af6f5fSLen Brown if (debug) 2007144b44b1SLen Brown fprintf(stderr, "RAPL: %.0f sec. Joule Counter Range, at %.0f Watts\n", rapl_joule_counter_range, tdp); 2008889facbeSLen Brown 2009889facbeSLen Brown return; 2010889facbeSLen Brown } 2011889facbeSLen Brown 20123a9a941dSLen Brown void perf_limit_reasons_probe(family, model) 20133a9a941dSLen Brown { 20143a9a941dSLen Brown if (!genuine_intel) 20153a9a941dSLen Brown return; 20163a9a941dSLen Brown 20173a9a941dSLen Brown if (family != 6) 20183a9a941dSLen Brown return; 20193a9a941dSLen Brown 20203a9a941dSLen Brown switch (model) { 20213a9a941dSLen Brown case 0x3C: /* HSW */ 20223a9a941dSLen Brown case 0x45: /* HSW */ 20233a9a941dSLen Brown case 0x46: /* HSW */ 20243a9a941dSLen Brown do_gfx_perf_limit_reasons = 1; 20253a9a941dSLen Brown case 0x3F: /* HSX */ 20263a9a941dSLen Brown do_core_perf_limit_reasons = 1; 20273a9a941dSLen Brown do_ring_perf_limit_reasons = 1; 20283a9a941dSLen Brown default: 20293a9a941dSLen Brown return; 20303a9a941dSLen Brown } 20313a9a941dSLen Brown } 20323a9a941dSLen Brown 2033889facbeSLen Brown int print_thermal(struct thread_data *t, struct core_data *c, struct pkg_data *p) 2034889facbeSLen Brown { 2035889facbeSLen Brown unsigned long long msr; 2036889facbeSLen Brown unsigned int dts; 2037889facbeSLen Brown int cpu; 2038889facbeSLen Brown 2039889facbeSLen Brown if (!(do_dts || do_ptm)) 2040889facbeSLen Brown return 0; 2041889facbeSLen Brown 2042889facbeSLen Brown cpu = t->cpu_id; 2043889facbeSLen Brown 2044889facbeSLen Brown /* DTS is per-core, no need to print for each thread */ 2045889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 2046889facbeSLen Brown return 0; 2047889facbeSLen Brown 2048889facbeSLen Brown if (cpu_migrate(cpu)) { 2049889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 2050889facbeSLen Brown return -1; 2051889facbeSLen Brown } 2052889facbeSLen Brown 2053889facbeSLen Brown if (do_ptm && (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) { 2054889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, &msr)) 2055889facbeSLen Brown return 0; 2056889facbeSLen Brown 2057889facbeSLen Brown dts = (msr >> 16) & 0x7F; 2058889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_PACKAGE_THERM_STATUS: 0x%08llx (%d C)\n", 2059889facbeSLen Brown cpu, msr, tcc_activation_temp - dts); 2060889facbeSLen Brown 2061889facbeSLen Brown #ifdef THERM_DEBUG 2062889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_INTERRUPT, &msr)) 2063889facbeSLen Brown return 0; 2064889facbeSLen Brown 2065889facbeSLen Brown dts = (msr >> 16) & 0x7F; 2066889facbeSLen Brown dts2 = (msr >> 8) & 0x7F; 2067889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_PACKAGE_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n", 2068889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2); 2069889facbeSLen Brown #endif 2070889facbeSLen Brown } 2071889facbeSLen Brown 2072889facbeSLen Brown 2073889facbeSLen Brown if (do_dts) { 2074889facbeSLen Brown unsigned int resolution; 2075889facbeSLen Brown 2076889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr)) 2077889facbeSLen Brown return 0; 2078889facbeSLen Brown 2079889facbeSLen Brown dts = (msr >> 16) & 0x7F; 2080889facbeSLen Brown resolution = (msr >> 27) & 0xF; 2081889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_THERM_STATUS: 0x%08llx (%d C +/- %d)\n", 2082889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, resolution); 2083889facbeSLen Brown 2084889facbeSLen Brown #ifdef THERM_DEBUG 2085889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_INTERRUPT, &msr)) 2086889facbeSLen Brown return 0; 2087889facbeSLen Brown 2088889facbeSLen Brown dts = (msr >> 16) & 0x7F; 2089889facbeSLen Brown dts2 = (msr >> 8) & 0x7F; 2090889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n", 2091889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2); 2092889facbeSLen Brown #endif 2093889facbeSLen Brown } 2094889facbeSLen Brown 2095889facbeSLen Brown return 0; 2096889facbeSLen Brown } 2097889facbeSLen Brown 2098889facbeSLen Brown void print_power_limit_msr(int cpu, unsigned long long msr, char *label) 2099889facbeSLen Brown { 2100889facbeSLen Brown fprintf(stderr, "cpu%d: %s: %sabled (%f Watts, %f sec, clamp %sabled)\n", 2101889facbeSLen Brown cpu, label, 2102889facbeSLen Brown ((msr >> 15) & 1) ? "EN" : "DIS", 2103889facbeSLen Brown ((msr >> 0) & 0x7FFF) * rapl_power_units, 2104889facbeSLen Brown (1.0 + (((msr >> 22) & 0x3)/4.0)) * (1 << ((msr >> 17) & 0x1F)) * rapl_time_units, 2105889facbeSLen Brown (((msr >> 16) & 1) ? "EN" : "DIS")); 2106889facbeSLen Brown 2107889facbeSLen Brown return; 2108889facbeSLen Brown } 2109889facbeSLen Brown 2110889facbeSLen Brown int print_rapl(struct thread_data *t, struct core_data *c, struct pkg_data *p) 2111889facbeSLen Brown { 2112889facbeSLen Brown unsigned long long msr; 2113889facbeSLen Brown int cpu; 2114889facbeSLen Brown 2115889facbeSLen Brown if (!do_rapl) 2116889facbeSLen Brown return 0; 2117889facbeSLen Brown 2118889facbeSLen Brown /* RAPL counters are per package, so print only for 1st thread/package */ 2119889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 2120889facbeSLen Brown return 0; 2121889facbeSLen Brown 2122889facbeSLen Brown cpu = t->cpu_id; 2123889facbeSLen Brown if (cpu_migrate(cpu)) { 2124889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 2125889facbeSLen Brown return -1; 2126889facbeSLen Brown } 2127889facbeSLen Brown 2128889facbeSLen Brown if (get_msr(cpu, MSR_RAPL_POWER_UNIT, &msr)) 2129889facbeSLen Brown return -1; 2130889facbeSLen Brown 2131d8af6f5fSLen Brown if (debug) { 2132889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_RAPL_POWER_UNIT: 0x%08llx " 2133889facbeSLen Brown "(%f Watts, %f Joules, %f sec.)\n", cpu, msr, 2134144b44b1SLen Brown rapl_power_units, rapl_energy_units, rapl_time_units); 2135889facbeSLen Brown } 2136144b44b1SLen Brown if (do_rapl & RAPL_PKG_POWER_INFO) { 2137144b44b1SLen Brown 2138889facbeSLen Brown if (get_msr(cpu, MSR_PKG_POWER_INFO, &msr)) 2139889facbeSLen Brown return -5; 2140889facbeSLen Brown 2141889facbeSLen Brown 2142889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PKG_POWER_INFO: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n", 2143889facbeSLen Brown cpu, msr, 2144889facbeSLen Brown ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units, 2145889facbeSLen Brown ((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units, 2146889facbeSLen Brown ((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units, 2147889facbeSLen Brown ((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units); 2148889facbeSLen Brown 2149144b44b1SLen Brown } 2150144b44b1SLen Brown if (do_rapl & RAPL_PKG) { 2151144b44b1SLen Brown 2152889facbeSLen Brown if (get_msr(cpu, MSR_PKG_POWER_LIMIT, &msr)) 2153889facbeSLen Brown return -9; 2154889facbeSLen Brown 2155889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PKG_POWER_LIMIT: 0x%08llx (%slocked)\n", 2156889facbeSLen Brown cpu, msr, (msr >> 63) & 1 ? "": "UN"); 2157889facbeSLen Brown 2158889facbeSLen Brown print_power_limit_msr(cpu, msr, "PKG Limit #1"); 2159889facbeSLen Brown fprintf(stderr, "cpu%d: PKG Limit #2: %sabled (%f Watts, %f* sec, clamp %sabled)\n", 2160889facbeSLen Brown cpu, 2161889facbeSLen Brown ((msr >> 47) & 1) ? "EN" : "DIS", 2162889facbeSLen Brown ((msr >> 32) & 0x7FFF) * rapl_power_units, 2163889facbeSLen Brown (1.0 + (((msr >> 54) & 0x3)/4.0)) * (1 << ((msr >> 49) & 0x1F)) * rapl_time_units, 2164889facbeSLen Brown ((msr >> 48) & 1) ? "EN" : "DIS"); 2165889facbeSLen Brown } 2166889facbeSLen Brown 2167*0b2bb692SLen Brown if (do_rapl & RAPL_DRAM_POWER_INFO) { 2168889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_POWER_INFO, &msr)) 2169889facbeSLen Brown return -6; 2170889facbeSLen Brown 2171889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_DRAM_POWER_INFO,: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n", 2172889facbeSLen Brown cpu, msr, 2173889facbeSLen Brown ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units, 2174889facbeSLen Brown ((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units, 2175889facbeSLen Brown ((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units, 2176889facbeSLen Brown ((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units); 2177*0b2bb692SLen Brown } 2178*0b2bb692SLen Brown if (do_rapl & RAPL_DRAM) { 2179889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_POWER_LIMIT, &msr)) 2180889facbeSLen Brown return -9; 2181889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_DRAM_POWER_LIMIT: 0x%08llx (%slocked)\n", 2182889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 2183889facbeSLen Brown 2184889facbeSLen Brown print_power_limit_msr(cpu, msr, "DRAM Limit"); 2185889facbeSLen Brown } 2186144b44b1SLen Brown if (do_rapl & RAPL_CORE_POLICY) { 2187d8af6f5fSLen Brown if (debug) { 2188889facbeSLen Brown if (get_msr(cpu, MSR_PP0_POLICY, &msr)) 2189889facbeSLen Brown return -7; 2190889facbeSLen Brown 2191889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP0_POLICY: %lld\n", cpu, msr & 0xF); 2192144b44b1SLen Brown } 2193144b44b1SLen Brown } 2194144b44b1SLen Brown if (do_rapl & RAPL_CORES) { 2195d8af6f5fSLen Brown if (debug) { 2196889facbeSLen Brown 2197889facbeSLen Brown if (get_msr(cpu, MSR_PP0_POWER_LIMIT, &msr)) 2198889facbeSLen Brown return -9; 2199889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP0_POWER_LIMIT: 0x%08llx (%slocked)\n", 2200889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 2201889facbeSLen Brown print_power_limit_msr(cpu, msr, "Cores Limit"); 2202889facbeSLen Brown } 2203889facbeSLen Brown } 2204889facbeSLen Brown if (do_rapl & RAPL_GFX) { 2205d8af6f5fSLen Brown if (debug) { 2206889facbeSLen Brown if (get_msr(cpu, MSR_PP1_POLICY, &msr)) 2207889facbeSLen Brown return -8; 2208889facbeSLen Brown 2209889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP1_POLICY: %lld\n", cpu, msr & 0xF); 2210889facbeSLen Brown 2211889facbeSLen Brown if (get_msr(cpu, MSR_PP1_POWER_LIMIT, &msr)) 2212889facbeSLen Brown return -9; 2213889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP1_POWER_LIMIT: 0x%08llx (%slocked)\n", 2214889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 2215889facbeSLen Brown print_power_limit_msr(cpu, msr, "GFX Limit"); 2216889facbeSLen Brown } 2217889facbeSLen Brown } 2218889facbeSLen Brown return 0; 2219889facbeSLen Brown } 2220889facbeSLen Brown 2221d7899447SLen Brown /* 2222d7899447SLen Brown * SNB adds support for additional MSRs: 2223d7899447SLen Brown * 2224d7899447SLen Brown * MSR_PKG_C7_RESIDENCY 0x000003fa 2225d7899447SLen Brown * MSR_CORE_C7_RESIDENCY 0x000003fe 2226d7899447SLen Brown * MSR_PKG_C2_RESIDENCY 0x0000060d 2227d7899447SLen Brown */ 2228103a8feaSLen Brown 2229d7899447SLen Brown int has_snb_msrs(unsigned int family, unsigned int model) 2230103a8feaSLen Brown { 2231103a8feaSLen Brown if (!genuine_intel) 2232103a8feaSLen Brown return 0; 2233103a8feaSLen Brown 2234103a8feaSLen Brown switch (model) { 2235103a8feaSLen Brown case 0x2A: 2236103a8feaSLen Brown case 0x2D: 2237650a37f3SLen Brown case 0x3A: /* IVB */ 22381300651bSLen Brown case 0x3E: /* IVB Xeon */ 223970b43400SLen Brown case 0x3C: /* HSW */ 224070b43400SLen Brown case 0x3F: /* HSW */ 224170b43400SLen Brown case 0x45: /* HSW */ 2242149c2319SLen Brown case 0x46: /* HSW */ 22434e8e863fSLen Brown case 0x3D: /* BDW */ 224448a0631cSLen Brown case 0x47: /* BDW */ 22454e8e863fSLen Brown case 0x4F: /* BDX */ 22464e8e863fSLen Brown case 0x56: /* BDX-DE */ 2247*0b2bb692SLen Brown case 0x4E: /* SKL */ 2248*0b2bb692SLen Brown case 0x5E: /* SKL */ 2249103a8feaSLen Brown return 1; 2250103a8feaSLen Brown } 2251103a8feaSLen Brown return 0; 2252103a8feaSLen Brown } 2253103a8feaSLen Brown 2254d7899447SLen Brown /* 2255d7899447SLen Brown * HSW adds support for additional MSRs: 2256d7899447SLen Brown * 2257d7899447SLen Brown * MSR_PKG_C8_RESIDENCY 0x00000630 2258d7899447SLen Brown * MSR_PKG_C9_RESIDENCY 0x00000631 2259d7899447SLen Brown * MSR_PKG_C10_RESIDENCY 0x00000632 2260d7899447SLen Brown */ 2261d7899447SLen Brown int has_hsw_msrs(unsigned int family, unsigned int model) 2262ca58710fSKristen Carlson Accardi { 2263ca58710fSKristen Carlson Accardi if (!genuine_intel) 2264ca58710fSKristen Carlson Accardi return 0; 2265ca58710fSKristen Carlson Accardi 2266ca58710fSKristen Carlson Accardi switch (model) { 22674e8e863fSLen Brown case 0x45: /* HSW */ 22684e8e863fSLen Brown case 0x3D: /* BDW */ 2269*0b2bb692SLen Brown case 0x4E: /* SKL */ 2270*0b2bb692SLen Brown case 0x5E: /* SKL */ 2271ca58710fSKristen Carlson Accardi return 1; 2272ca58710fSKristen Carlson Accardi } 2273ca58710fSKristen Carlson Accardi return 0; 2274ca58710fSKristen Carlson Accardi } 2275ca58710fSKristen Carlson Accardi 2276*0b2bb692SLen Brown /* 2277*0b2bb692SLen Brown * SKL adds support for additional MSRS: 2278*0b2bb692SLen Brown * 2279*0b2bb692SLen Brown * MSR_PKG_WEIGHTED_CORE_C0_RES 0x00000658 2280*0b2bb692SLen Brown * MSR_PKG_ANY_CORE_C0_RES 0x00000659 2281*0b2bb692SLen Brown * MSR_PKG_ANY_GFXE_C0_RES 0x0000065A 2282*0b2bb692SLen Brown * MSR_PKG_BOTH_CORE_GFXE_C0_RES 0x0000065B 2283*0b2bb692SLen Brown */ 2284*0b2bb692SLen Brown int has_skl_msrs(unsigned int family, unsigned int model) 2285*0b2bb692SLen Brown { 2286*0b2bb692SLen Brown if (!genuine_intel) 2287*0b2bb692SLen Brown return 0; 2288*0b2bb692SLen Brown 2289*0b2bb692SLen Brown switch (model) { 2290*0b2bb692SLen Brown case 0x4E: /* SKL */ 2291*0b2bb692SLen Brown case 0x5E: /* SKL */ 2292*0b2bb692SLen Brown return 1; 2293*0b2bb692SLen Brown } 2294*0b2bb692SLen Brown return 0; 2295*0b2bb692SLen Brown } 2296*0b2bb692SLen Brown 2297*0b2bb692SLen Brown 2298ca58710fSKristen Carlson Accardi 2299144b44b1SLen Brown int is_slm(unsigned int family, unsigned int model) 2300144b44b1SLen Brown { 2301144b44b1SLen Brown if (!genuine_intel) 2302144b44b1SLen Brown return 0; 2303144b44b1SLen Brown switch (model) { 2304144b44b1SLen Brown case 0x37: /* BYT */ 2305144b44b1SLen Brown case 0x4D: /* AVN */ 2306144b44b1SLen Brown return 1; 2307144b44b1SLen Brown } 2308144b44b1SLen Brown return 0; 2309144b44b1SLen Brown } 2310144b44b1SLen Brown 2311144b44b1SLen Brown #define SLM_BCLK_FREQS 5 2312144b44b1SLen Brown double slm_freq_table[SLM_BCLK_FREQS] = { 83.3, 100.0, 133.3, 116.7, 80.0}; 2313144b44b1SLen Brown 2314144b44b1SLen Brown double slm_bclk(void) 2315144b44b1SLen Brown { 2316144b44b1SLen Brown unsigned long long msr = 3; 2317144b44b1SLen Brown unsigned int i; 2318144b44b1SLen Brown double freq; 2319144b44b1SLen Brown 2320144b44b1SLen Brown if (get_msr(0, MSR_FSB_FREQ, &msr)) 2321144b44b1SLen Brown fprintf(stderr, "SLM BCLK: unknown\n"); 2322144b44b1SLen Brown 2323144b44b1SLen Brown i = msr & 0xf; 2324144b44b1SLen Brown if (i >= SLM_BCLK_FREQS) { 2325144b44b1SLen Brown fprintf(stderr, "SLM BCLK[%d] invalid\n", i); 2326144b44b1SLen Brown msr = 3; 2327144b44b1SLen Brown } 2328144b44b1SLen Brown freq = slm_freq_table[i]; 2329144b44b1SLen Brown 2330144b44b1SLen Brown fprintf(stderr, "SLM BCLK: %.1f Mhz\n", freq); 2331144b44b1SLen Brown 2332144b44b1SLen Brown return freq; 2333144b44b1SLen Brown } 2334144b44b1SLen Brown 2335103a8feaSLen Brown double discover_bclk(unsigned int family, unsigned int model) 2336103a8feaSLen Brown { 2337d7899447SLen Brown if (has_snb_msrs(family, model)) 2338103a8feaSLen Brown return 100.00; 2339144b44b1SLen Brown else if (is_slm(family, model)) 2340144b44b1SLen Brown return slm_bclk(); 2341103a8feaSLen Brown else 2342103a8feaSLen Brown return 133.33; 2343103a8feaSLen Brown } 2344103a8feaSLen Brown 2345889facbeSLen Brown /* 2346889facbeSLen Brown * MSR_IA32_TEMPERATURE_TARGET indicates the temperature where 2347889facbeSLen Brown * the Thermal Control Circuit (TCC) activates. 2348889facbeSLen Brown * This is usually equal to tjMax. 2349889facbeSLen Brown * 2350889facbeSLen Brown * Older processors do not have this MSR, so there we guess, 2351889facbeSLen Brown * but also allow cmdline over-ride with -T. 2352889facbeSLen Brown * 2353889facbeSLen Brown * Several MSR temperature values are in units of degrees-C 2354889facbeSLen Brown * below this value, including the Digital Thermal Sensor (DTS), 2355889facbeSLen Brown * Package Thermal Management Sensor (PTM), and thermal event thresholds. 2356889facbeSLen Brown */ 2357889facbeSLen Brown int set_temperature_target(struct thread_data *t, struct core_data *c, struct pkg_data *p) 2358889facbeSLen Brown { 2359889facbeSLen Brown unsigned long long msr; 2360889facbeSLen Brown unsigned int target_c_local; 2361889facbeSLen Brown int cpu; 2362889facbeSLen Brown 2363889facbeSLen Brown /* tcc_activation_temp is used only for dts or ptm */ 2364889facbeSLen Brown if (!(do_dts || do_ptm)) 2365889facbeSLen Brown return 0; 2366889facbeSLen Brown 2367889facbeSLen Brown /* this is a per-package concept */ 2368889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 2369889facbeSLen Brown return 0; 2370889facbeSLen Brown 2371889facbeSLen Brown cpu = t->cpu_id; 2372889facbeSLen Brown if (cpu_migrate(cpu)) { 2373889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 2374889facbeSLen Brown return -1; 2375889facbeSLen Brown } 2376889facbeSLen Brown 2377889facbeSLen Brown if (tcc_activation_temp_override != 0) { 2378889facbeSLen Brown tcc_activation_temp = tcc_activation_temp_override; 2379889facbeSLen Brown fprintf(stderr, "cpu%d: Using cmdline TCC Target (%d C)\n", 2380889facbeSLen Brown cpu, tcc_activation_temp); 2381889facbeSLen Brown return 0; 2382889facbeSLen Brown } 2383889facbeSLen Brown 2384889facbeSLen Brown /* Temperature Target MSR is Nehalem and newer only */ 2385d7899447SLen Brown if (!do_nhm_platform_info) 2386889facbeSLen Brown goto guess; 2387889facbeSLen Brown 2388889facbeSLen Brown if (get_msr(0, MSR_IA32_TEMPERATURE_TARGET, &msr)) 2389889facbeSLen Brown goto guess; 2390889facbeSLen Brown 23913482124aSJean Delvare target_c_local = (msr >> 16) & 0xFF; 2392889facbeSLen Brown 2393d8af6f5fSLen Brown if (debug) 2394889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_TEMPERATURE_TARGET: 0x%08llx (%d C)\n", 2395889facbeSLen Brown cpu, msr, target_c_local); 2396889facbeSLen Brown 23973482124aSJean Delvare if (!target_c_local) 2398889facbeSLen Brown goto guess; 2399889facbeSLen Brown 2400889facbeSLen Brown tcc_activation_temp = target_c_local; 2401889facbeSLen Brown 2402889facbeSLen Brown return 0; 2403889facbeSLen Brown 2404889facbeSLen Brown guess: 2405889facbeSLen Brown tcc_activation_temp = TJMAX_DEFAULT; 2406889facbeSLen Brown fprintf(stderr, "cpu%d: Guessing tjMax %d C, Please use -T to specify\n", 2407889facbeSLen Brown cpu, tcc_activation_temp); 2408889facbeSLen Brown 2409889facbeSLen Brown return 0; 2410889facbeSLen Brown } 2411fcd17211SLen Brown void process_cpuid() 2412103a8feaSLen Brown { 2413103a8feaSLen Brown unsigned int eax, ebx, ecx, edx, max_level; 2414103a8feaSLen Brown unsigned int fms, family, model, stepping; 2415103a8feaSLen Brown 2416103a8feaSLen Brown eax = ebx = ecx = edx = 0; 2417103a8feaSLen Brown 24182b92865eSJosh Triplett __get_cpuid(0, &max_level, &ebx, &ecx, &edx); 2419103a8feaSLen Brown 2420103a8feaSLen Brown if (ebx == 0x756e6547 && edx == 0x49656e69 && ecx == 0x6c65746e) 2421103a8feaSLen Brown genuine_intel = 1; 2422103a8feaSLen Brown 2423d8af6f5fSLen Brown if (debug) 2424889facbeSLen Brown fprintf(stderr, "CPUID(0): %.4s%.4s%.4s ", 2425103a8feaSLen Brown (char *)&ebx, (char *)&edx, (char *)&ecx); 2426103a8feaSLen Brown 24272b92865eSJosh Triplett __get_cpuid(1, &fms, &ebx, &ecx, &edx); 2428103a8feaSLen Brown family = (fms >> 8) & 0xf; 2429103a8feaSLen Brown model = (fms >> 4) & 0xf; 2430103a8feaSLen Brown stepping = fms & 0xf; 2431103a8feaSLen Brown if (family == 6 || family == 0xf) 2432103a8feaSLen Brown model += ((fms >> 16) & 0xf) << 4; 2433103a8feaSLen Brown 2434d8af6f5fSLen Brown if (debug) 2435103a8feaSLen Brown fprintf(stderr, "%d CPUID levels; family:model:stepping 0x%x:%x:%x (%d:%d:%d)\n", 2436103a8feaSLen Brown max_level, family, model, stepping, family, model, stepping); 2437103a8feaSLen Brown 2438b2c95d90SJosh Triplett if (!(edx & (1 << 5))) 2439b2c95d90SJosh Triplett errx(1, "CPUID: no MSR"); 2440103a8feaSLen Brown 2441103a8feaSLen Brown /* 2442103a8feaSLen Brown * check max extended function levels of CPUID. 2443103a8feaSLen Brown * This is needed to check for invariant TSC. 2444103a8feaSLen Brown * This check is valid for both Intel and AMD. 2445103a8feaSLen Brown */ 2446103a8feaSLen Brown ebx = ecx = edx = 0; 24472b92865eSJosh Triplett __get_cpuid(0x80000000, &max_level, &ebx, &ecx, &edx); 2448103a8feaSLen Brown 2449d7899447SLen Brown if (max_level >= 0x80000007) { 2450103a8feaSLen Brown 2451103a8feaSLen Brown /* 2452103a8feaSLen Brown * Non-Stop TSC is advertised by CPUID.EAX=0x80000007: EDX.bit8 2453103a8feaSLen Brown * this check is valid for both Intel and AMD 2454103a8feaSLen Brown */ 24552b92865eSJosh Triplett __get_cpuid(0x80000007, &eax, &ebx, &ecx, &edx); 24568209e054SThomas Renninger has_invariant_tsc = edx & (1 << 8); 2457d7899447SLen Brown } 2458103a8feaSLen Brown 2459103a8feaSLen Brown /* 2460103a8feaSLen Brown * APERF/MPERF is advertised by CPUID.EAX=0x6: ECX.bit0 2461103a8feaSLen Brown * this check is valid for both Intel and AMD 2462103a8feaSLen Brown */ 2463103a8feaSLen Brown 24642b92865eSJosh Triplett __get_cpuid(0x6, &eax, &ebx, &ecx, &edx); 24658209e054SThomas Renninger has_aperf = ecx & (1 << 0); 2466889facbeSLen Brown do_dts = eax & (1 << 0); 2467889facbeSLen Brown do_ptm = eax & (1 << 6); 2468889facbeSLen Brown has_epb = ecx & (1 << 3); 2469889facbeSLen Brown 2470d8af6f5fSLen Brown if (debug) 2471a729617cSLen Brown fprintf(stderr, "CPUID(6): %sAPERF, %sDTS, %sPTM, %sEPB\n", 2472a729617cSLen Brown has_aperf ? "" : "No ", 2473a729617cSLen Brown do_dts ? "" : "No ", 2474a729617cSLen Brown do_ptm ? "" : "No ", 2475a729617cSLen Brown has_epb ? "" : "No "); 2476103a8feaSLen Brown 2477ee7e38e3SLen Brown do_nhm_platform_info = do_nhm_cstates = do_smi = probe_nhm_msrs(family, model); 2478d7899447SLen Brown do_snb_cstates = has_snb_msrs(family, model); 2479ee7e38e3SLen Brown do_pc2 = do_snb_cstates && (pkg_cstate_limit >= PCL__2); 2480ee7e38e3SLen Brown do_pc3 = (pkg_cstate_limit >= PCL__3); 2481ee7e38e3SLen Brown do_pc6 = (pkg_cstate_limit >= PCL__6); 2482ee7e38e3SLen Brown do_pc7 = do_snb_cstates && (pkg_cstate_limit >= PCL__7); 2483d7899447SLen Brown do_c8_c9_c10 = has_hsw_msrs(family, model); 2484*0b2bb692SLen Brown do_skl_residency = has_skl_msrs(family, model); 2485144b44b1SLen Brown do_slm_cstates = is_slm(family, model); 2486103a8feaSLen Brown bclk = discover_bclk(family, model); 2487103a8feaSLen Brown 2488889facbeSLen Brown rapl_probe(family, model); 24893a9a941dSLen Brown perf_limit_reasons_probe(family, model); 2490889facbeSLen Brown 2491fcd17211SLen Brown if (debug) 2492fcd17211SLen Brown dump_cstate_pstate_config_info(); 2493fcd17211SLen Brown 2494889facbeSLen Brown return; 2495103a8feaSLen Brown } 2496103a8feaSLen Brown 2497d8af6f5fSLen Brown void help() 2498103a8feaSLen Brown { 2499d8af6f5fSLen Brown fprintf(stderr, 2500d8af6f5fSLen Brown "Usage: turbostat [OPTIONS][(--interval seconds) | COMMAND ...]\n" 2501d8af6f5fSLen Brown "\n" 2502d8af6f5fSLen Brown "Turbostat forks the specified COMMAND and prints statistics\n" 2503d8af6f5fSLen Brown "when COMMAND completes.\n" 2504d8af6f5fSLen Brown "If no COMMAND is specified, turbostat wakes every 5-seconds\n" 2505d8af6f5fSLen Brown "to print statistics, until interrupted.\n" 2506d8af6f5fSLen Brown "--debug run in \"debug\" mode\n" 2507d8af6f5fSLen Brown "--interval sec Override default 5-second measurement interval\n" 2508d8af6f5fSLen Brown "--help print this help message\n" 2509d8af6f5fSLen Brown "--counter msr print 32-bit counter at address \"msr\"\n" 2510d8af6f5fSLen Brown "--Counter msr print 64-bit Counter at address \"msr\"\n" 2511d8af6f5fSLen Brown "--msr msr print 32-bit value at address \"msr\"\n" 2512d8af6f5fSLen Brown "--MSR msr print 64-bit Value at address \"msr\"\n" 2513d8af6f5fSLen Brown "--version print version information\n" 2514d8af6f5fSLen Brown "\n" 2515d8af6f5fSLen Brown "For more help, run \"man turbostat\"\n"); 2516103a8feaSLen Brown } 2517103a8feaSLen Brown 2518103a8feaSLen Brown 2519103a8feaSLen Brown /* 2520103a8feaSLen Brown * in /dev/cpu/ return success for names that are numbers 2521103a8feaSLen Brown * ie. filter out ".", "..", "microcode". 2522103a8feaSLen Brown */ 2523103a8feaSLen Brown int dir_filter(const struct dirent *dirp) 2524103a8feaSLen Brown { 2525103a8feaSLen Brown if (isdigit(dirp->d_name[0])) 2526103a8feaSLen Brown return 1; 2527103a8feaSLen Brown else 2528103a8feaSLen Brown return 0; 2529103a8feaSLen Brown } 2530103a8feaSLen Brown 2531103a8feaSLen Brown int open_dev_cpu_msr(int dummy1) 2532103a8feaSLen Brown { 2533103a8feaSLen Brown return 0; 2534103a8feaSLen Brown } 2535103a8feaSLen Brown 2536c98d5d94SLen Brown void topology_probe() 2537c98d5d94SLen Brown { 2538c98d5d94SLen Brown int i; 2539c98d5d94SLen Brown int max_core_id = 0; 2540c98d5d94SLen Brown int max_package_id = 0; 2541c98d5d94SLen Brown int max_siblings = 0; 2542c98d5d94SLen Brown struct cpu_topology { 2543c98d5d94SLen Brown int core_id; 2544c98d5d94SLen Brown int physical_package_id; 2545c98d5d94SLen Brown } *cpus; 2546c98d5d94SLen Brown 2547c98d5d94SLen Brown /* Initialize num_cpus, max_cpu_num */ 2548c98d5d94SLen Brown topo.num_cpus = 0; 2549c98d5d94SLen Brown topo.max_cpu_num = 0; 2550c98d5d94SLen Brown for_all_proc_cpus(count_cpus); 2551c98d5d94SLen Brown if (!summary_only && topo.num_cpus > 1) 2552c98d5d94SLen Brown show_cpu = 1; 2553c98d5d94SLen Brown 2554d8af6f5fSLen Brown if (debug > 1) 2555c98d5d94SLen Brown fprintf(stderr, "num_cpus %d max_cpu_num %d\n", topo.num_cpus, topo.max_cpu_num); 2556c98d5d94SLen Brown 2557c98d5d94SLen Brown cpus = calloc(1, (topo.max_cpu_num + 1) * sizeof(struct cpu_topology)); 2558b2c95d90SJosh Triplett if (cpus == NULL) 2559b2c95d90SJosh Triplett err(1, "calloc cpus"); 2560c98d5d94SLen Brown 2561c98d5d94SLen Brown /* 2562c98d5d94SLen Brown * Allocate and initialize cpu_present_set 2563c98d5d94SLen Brown */ 2564c98d5d94SLen Brown cpu_present_set = CPU_ALLOC((topo.max_cpu_num + 1)); 2565b2c95d90SJosh Triplett if (cpu_present_set == NULL) 2566b2c95d90SJosh Triplett err(3, "CPU_ALLOC"); 2567c98d5d94SLen Brown cpu_present_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 2568c98d5d94SLen Brown CPU_ZERO_S(cpu_present_setsize, cpu_present_set); 2569c98d5d94SLen Brown for_all_proc_cpus(mark_cpu_present); 2570c98d5d94SLen Brown 2571c98d5d94SLen Brown /* 2572c98d5d94SLen Brown * Allocate and initialize cpu_affinity_set 2573c98d5d94SLen Brown */ 2574c98d5d94SLen Brown cpu_affinity_set = CPU_ALLOC((topo.max_cpu_num + 1)); 2575b2c95d90SJosh Triplett if (cpu_affinity_set == NULL) 2576b2c95d90SJosh Triplett err(3, "CPU_ALLOC"); 2577c98d5d94SLen Brown cpu_affinity_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 2578c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 2579c98d5d94SLen Brown 2580c98d5d94SLen Brown 2581c98d5d94SLen Brown /* 2582c98d5d94SLen Brown * For online cpus 2583c98d5d94SLen Brown * find max_core_id, max_package_id 2584c98d5d94SLen Brown */ 2585c98d5d94SLen Brown for (i = 0; i <= topo.max_cpu_num; ++i) { 2586c98d5d94SLen Brown int siblings; 2587c98d5d94SLen Brown 2588c98d5d94SLen Brown if (cpu_is_not_present(i)) { 2589d8af6f5fSLen Brown if (debug > 1) 2590c98d5d94SLen Brown fprintf(stderr, "cpu%d NOT PRESENT\n", i); 2591c98d5d94SLen Brown continue; 2592c98d5d94SLen Brown } 2593c98d5d94SLen Brown cpus[i].core_id = get_core_id(i); 2594c98d5d94SLen Brown if (cpus[i].core_id > max_core_id) 2595c98d5d94SLen Brown max_core_id = cpus[i].core_id; 2596c98d5d94SLen Brown 2597c98d5d94SLen Brown cpus[i].physical_package_id = get_physical_package_id(i); 2598c98d5d94SLen Brown if (cpus[i].physical_package_id > max_package_id) 2599c98d5d94SLen Brown max_package_id = cpus[i].physical_package_id; 2600c98d5d94SLen Brown 2601c98d5d94SLen Brown siblings = get_num_ht_siblings(i); 2602c98d5d94SLen Brown if (siblings > max_siblings) 2603c98d5d94SLen Brown max_siblings = siblings; 2604d8af6f5fSLen Brown if (debug > 1) 2605c98d5d94SLen Brown fprintf(stderr, "cpu %d pkg %d core %d\n", 2606c98d5d94SLen Brown i, cpus[i].physical_package_id, cpus[i].core_id); 2607c98d5d94SLen Brown } 2608c98d5d94SLen Brown topo.num_cores_per_pkg = max_core_id + 1; 2609d8af6f5fSLen Brown if (debug > 1) 2610c98d5d94SLen Brown fprintf(stderr, "max_core_id %d, sizing for %d cores per package\n", 2611c98d5d94SLen Brown max_core_id, topo.num_cores_per_pkg); 26121cc21f7bSLen Brown if (debug && !summary_only && topo.num_cores_per_pkg > 1) 2613c98d5d94SLen Brown show_core = 1; 2614c98d5d94SLen Brown 2615c98d5d94SLen Brown topo.num_packages = max_package_id + 1; 2616d8af6f5fSLen Brown if (debug > 1) 2617c98d5d94SLen Brown fprintf(stderr, "max_package_id %d, sizing for %d packages\n", 2618c98d5d94SLen Brown max_package_id, topo.num_packages); 26191cc21f7bSLen Brown if (debug && !summary_only && topo.num_packages > 1) 2620c98d5d94SLen Brown show_pkg = 1; 2621c98d5d94SLen Brown 2622c98d5d94SLen Brown topo.num_threads_per_core = max_siblings; 2623d8af6f5fSLen Brown if (debug > 1) 2624c98d5d94SLen Brown fprintf(stderr, "max_siblings %d\n", max_siblings); 2625c98d5d94SLen Brown 2626c98d5d94SLen Brown free(cpus); 2627c98d5d94SLen Brown } 2628c98d5d94SLen Brown 2629c98d5d94SLen Brown void 2630c98d5d94SLen Brown allocate_counters(struct thread_data **t, struct core_data **c, struct pkg_data **p) 2631c98d5d94SLen Brown { 2632c98d5d94SLen Brown int i; 2633c98d5d94SLen Brown 2634c98d5d94SLen Brown *t = calloc(topo.num_threads_per_core * topo.num_cores_per_pkg * 2635c98d5d94SLen Brown topo.num_packages, sizeof(struct thread_data)); 2636c98d5d94SLen Brown if (*t == NULL) 2637c98d5d94SLen Brown goto error; 2638c98d5d94SLen Brown 2639c98d5d94SLen Brown for (i = 0; i < topo.num_threads_per_core * 2640c98d5d94SLen Brown topo.num_cores_per_pkg * topo.num_packages; i++) 2641c98d5d94SLen Brown (*t)[i].cpu_id = -1; 2642c98d5d94SLen Brown 2643c98d5d94SLen Brown *c = calloc(topo.num_cores_per_pkg * topo.num_packages, 2644c98d5d94SLen Brown sizeof(struct core_data)); 2645c98d5d94SLen Brown if (*c == NULL) 2646c98d5d94SLen Brown goto error; 2647c98d5d94SLen Brown 2648c98d5d94SLen Brown for (i = 0; i < topo.num_cores_per_pkg * topo.num_packages; i++) 2649c98d5d94SLen Brown (*c)[i].core_id = -1; 2650c98d5d94SLen Brown 2651c98d5d94SLen Brown *p = calloc(topo.num_packages, sizeof(struct pkg_data)); 2652c98d5d94SLen Brown if (*p == NULL) 2653c98d5d94SLen Brown goto error; 2654c98d5d94SLen Brown 2655c98d5d94SLen Brown for (i = 0; i < topo.num_packages; i++) 2656c98d5d94SLen Brown (*p)[i].package_id = i; 2657c98d5d94SLen Brown 2658c98d5d94SLen Brown return; 2659c98d5d94SLen Brown error: 2660b2c95d90SJosh Triplett err(1, "calloc counters"); 2661c98d5d94SLen Brown } 2662c98d5d94SLen Brown /* 2663c98d5d94SLen Brown * init_counter() 2664c98d5d94SLen Brown * 2665c98d5d94SLen Brown * set cpu_id, core_num, pkg_num 2666c98d5d94SLen Brown * set FIRST_THREAD_IN_CORE and FIRST_CORE_IN_PACKAGE 2667c98d5d94SLen Brown * 2668c98d5d94SLen Brown * increment topo.num_cores when 1st core in pkg seen 2669c98d5d94SLen Brown */ 2670c98d5d94SLen Brown void init_counter(struct thread_data *thread_base, struct core_data *core_base, 2671c98d5d94SLen Brown struct pkg_data *pkg_base, int thread_num, int core_num, 2672c98d5d94SLen Brown int pkg_num, int cpu_id) 2673c98d5d94SLen Brown { 2674c98d5d94SLen Brown struct thread_data *t; 2675c98d5d94SLen Brown struct core_data *c; 2676c98d5d94SLen Brown struct pkg_data *p; 2677c98d5d94SLen Brown 2678c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_num, core_num, pkg_num); 2679c98d5d94SLen Brown c = GET_CORE(core_base, core_num, pkg_num); 2680c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_num); 2681c98d5d94SLen Brown 2682c98d5d94SLen Brown t->cpu_id = cpu_id; 2683c98d5d94SLen Brown if (thread_num == 0) { 2684c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_THREAD_IN_CORE; 2685c98d5d94SLen Brown if (cpu_is_first_core_in_package(cpu_id)) 2686c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_CORE_IN_PACKAGE; 2687c98d5d94SLen Brown } 2688c98d5d94SLen Brown 2689c98d5d94SLen Brown c->core_id = core_num; 2690c98d5d94SLen Brown p->package_id = pkg_num; 2691c98d5d94SLen Brown } 2692c98d5d94SLen Brown 2693c98d5d94SLen Brown 2694c98d5d94SLen Brown int initialize_counters(int cpu_id) 2695c98d5d94SLen Brown { 2696c98d5d94SLen Brown int my_thread_id, my_core_id, my_package_id; 2697c98d5d94SLen Brown 2698c98d5d94SLen Brown my_package_id = get_physical_package_id(cpu_id); 2699c98d5d94SLen Brown my_core_id = get_core_id(cpu_id); 2700c98d5d94SLen Brown 2701c98d5d94SLen Brown if (cpu_is_first_sibling_in_core(cpu_id)) { 2702c98d5d94SLen Brown my_thread_id = 0; 2703c98d5d94SLen Brown topo.num_cores++; 2704c98d5d94SLen Brown } else { 2705c98d5d94SLen Brown my_thread_id = 1; 2706c98d5d94SLen Brown } 2707c98d5d94SLen Brown 2708c98d5d94SLen Brown init_counter(EVEN_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 2709c98d5d94SLen Brown init_counter(ODD_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 2710c98d5d94SLen Brown return 0; 2711c98d5d94SLen Brown } 2712c98d5d94SLen Brown 2713c98d5d94SLen Brown void allocate_output_buffer() 2714c98d5d94SLen Brown { 27153b4d5c7fSAndy Shevchenko output_buffer = calloc(1, (1 + topo.num_cpus) * 1024); 2716c98d5d94SLen Brown outp = output_buffer; 2717b2c95d90SJosh Triplett if (outp == NULL) 2718b2c95d90SJosh Triplett err(-1, "calloc output buffer"); 2719c98d5d94SLen Brown } 2720c98d5d94SLen Brown 2721c98d5d94SLen Brown void setup_all_buffers(void) 2722c98d5d94SLen Brown { 2723c98d5d94SLen Brown topology_probe(); 2724c98d5d94SLen Brown allocate_counters(&thread_even, &core_even, &package_even); 2725c98d5d94SLen Brown allocate_counters(&thread_odd, &core_odd, &package_odd); 2726c98d5d94SLen Brown allocate_output_buffer(); 2727c98d5d94SLen Brown for_all_proc_cpus(initialize_counters); 2728c98d5d94SLen Brown } 27293b4d5c7fSAndy Shevchenko 2730103a8feaSLen Brown void turbostat_init() 2731103a8feaSLen Brown { 2732103a8feaSLen Brown check_dev_msr(); 273398481e79SLen Brown check_permissions(); 2734fcd17211SLen Brown process_cpuid(); 2735103a8feaSLen Brown 2736c98d5d94SLen Brown setup_all_buffers(); 2737103a8feaSLen Brown 2738d8af6f5fSLen Brown if (debug) 2739889facbeSLen Brown for_all_cpus(print_epb, ODD_COUNTERS); 2740889facbeSLen Brown 2741d8af6f5fSLen Brown if (debug) 27423a9a941dSLen Brown for_all_cpus(print_perf_limit, ODD_COUNTERS); 27433a9a941dSLen Brown 2744d8af6f5fSLen Brown if (debug) 2745889facbeSLen Brown for_all_cpus(print_rapl, ODD_COUNTERS); 2746889facbeSLen Brown 2747889facbeSLen Brown for_all_cpus(set_temperature_target, ODD_COUNTERS); 2748889facbeSLen Brown 2749d8af6f5fSLen Brown if (debug) 2750889facbeSLen Brown for_all_cpus(print_thermal, ODD_COUNTERS); 2751103a8feaSLen Brown } 2752103a8feaSLen Brown 2753103a8feaSLen Brown int fork_it(char **argv) 2754103a8feaSLen Brown { 2755103a8feaSLen Brown pid_t child_pid; 2756d91bb17cSLen Brown int status; 2757d15cf7c1SLen Brown 2758d91bb17cSLen Brown status = for_all_cpus(get_counters, EVEN_COUNTERS); 2759d91bb17cSLen Brown if (status) 2760d91bb17cSLen Brown exit(status); 2761d15cf7c1SLen Brown /* clear affinity side-effect of get_counters() */ 2762d15cf7c1SLen Brown sched_setaffinity(0, cpu_present_setsize, cpu_present_set); 2763103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 2764103a8feaSLen Brown 2765103a8feaSLen Brown child_pid = fork(); 2766103a8feaSLen Brown if (!child_pid) { 2767103a8feaSLen Brown /* child */ 2768103a8feaSLen Brown execvp(argv[0], argv); 2769103a8feaSLen Brown } else { 2770103a8feaSLen Brown 2771103a8feaSLen Brown /* parent */ 2772b2c95d90SJosh Triplett if (child_pid == -1) 2773b2c95d90SJosh Triplett err(1, "fork"); 2774103a8feaSLen Brown 2775103a8feaSLen Brown signal(SIGINT, SIG_IGN); 2776103a8feaSLen Brown signal(SIGQUIT, SIG_IGN); 2777b2c95d90SJosh Triplett if (waitpid(child_pid, &status, 0) == -1) 2778b2c95d90SJosh Triplett err(status, "waitpid"); 2779103a8feaSLen Brown } 2780c98d5d94SLen Brown /* 2781c98d5d94SLen Brown * n.b. fork_it() does not check for errors from for_all_cpus() 2782c98d5d94SLen Brown * because re-starting is problematic when forking 2783c98d5d94SLen Brown */ 2784c98d5d94SLen Brown for_all_cpus(get_counters, ODD_COUNTERS); 2785103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 2786103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 2787c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 2788c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 2789c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 2790c98d5d94SLen Brown flush_stderr(); 2791103a8feaSLen Brown 27926eab04a8SJustin P. Mattock fprintf(stderr, "%.6f sec\n", tv_delta.tv_sec + tv_delta.tv_usec/1000000.0); 2793103a8feaSLen Brown 2794d91bb17cSLen Brown return status; 2795103a8feaSLen Brown } 2796103a8feaSLen Brown 27973b4d5c7fSAndy Shevchenko int get_and_dump_counters(void) 27983b4d5c7fSAndy Shevchenko { 27993b4d5c7fSAndy Shevchenko int status; 28003b4d5c7fSAndy Shevchenko 28013b4d5c7fSAndy Shevchenko status = for_all_cpus(get_counters, ODD_COUNTERS); 28023b4d5c7fSAndy Shevchenko if (status) 28033b4d5c7fSAndy Shevchenko return status; 28043b4d5c7fSAndy Shevchenko 28053b4d5c7fSAndy Shevchenko status = for_all_cpus(dump_counters, ODD_COUNTERS); 28063b4d5c7fSAndy Shevchenko if (status) 28073b4d5c7fSAndy Shevchenko return status; 28083b4d5c7fSAndy Shevchenko 28093b4d5c7fSAndy Shevchenko flush_stdout(); 28103b4d5c7fSAndy Shevchenko 28113b4d5c7fSAndy Shevchenko return status; 28123b4d5c7fSAndy Shevchenko } 28133b4d5c7fSAndy Shevchenko 2814d8af6f5fSLen Brown void print_version() { 2815a21d38c8SLen Brown fprintf(stderr, "turbostat version 4.3 24 Mar, 2015" 2816d8af6f5fSLen Brown " - Len Brown <lenb@kernel.org>\n"); 2817d8af6f5fSLen Brown } 2818d8af6f5fSLen Brown 2819103a8feaSLen Brown void cmdline(int argc, char **argv) 2820103a8feaSLen Brown { 2821103a8feaSLen Brown int opt; 2822d8af6f5fSLen Brown int option_index = 0; 2823d8af6f5fSLen Brown static struct option long_options[] = { 2824d8af6f5fSLen Brown {"Counter", required_argument, 0, 'C'}, 2825d8af6f5fSLen Brown {"counter", required_argument, 0, 'c'}, 2826d8af6f5fSLen Brown {"Dump", no_argument, 0, 'D'}, 2827d8af6f5fSLen Brown {"debug", no_argument, 0, 'd'}, 2828d8af6f5fSLen Brown {"interval", required_argument, 0, 'i'}, 2829d8af6f5fSLen Brown {"help", no_argument, 0, 'h'}, 2830d8af6f5fSLen Brown {"Joules", no_argument, 0, 'J'}, 2831d8af6f5fSLen Brown {"MSR", required_argument, 0, 'M'}, 2832d8af6f5fSLen Brown {"msr", required_argument, 0, 'm'}, 2833d8af6f5fSLen Brown {"Package", no_argument, 0, 'p'}, 2834d8af6f5fSLen Brown {"processor", no_argument, 0, 'p'}, 2835d8af6f5fSLen Brown {"Summary", no_argument, 0, 'S'}, 2836d8af6f5fSLen Brown {"TCC", required_argument, 0, 'T'}, 2837d8af6f5fSLen Brown {"version", no_argument, 0, 'v' }, 2838d8af6f5fSLen Brown {0, 0, 0, 0 } 2839d8af6f5fSLen Brown }; 2840103a8feaSLen Brown 2841103a8feaSLen Brown progname = argv[0]; 2842103a8feaSLen Brown 2843d8af6f5fSLen Brown while ((opt = getopt_long_only(argc, argv, "C:c:Ddhi:JM:m:PpST:v", 2844d8af6f5fSLen Brown long_options, &option_index)) != -1) { 2845103a8feaSLen Brown switch (opt) { 2846d8af6f5fSLen Brown case 'C': 2847d8af6f5fSLen Brown sscanf(optarg, "%x", &extra_delta_offset64); 2848103a8feaSLen Brown break; 2849f9240813SLen Brown case 'c': 28508e180f3cSLen Brown sscanf(optarg, "%x", &extra_delta_offset32); 28518e180f3cSLen Brown break; 2852d8af6f5fSLen Brown case 'D': 2853d8af6f5fSLen Brown dump_only++; 28548e180f3cSLen Brown break; 2855d8af6f5fSLen Brown case 'd': 2856d8af6f5fSLen Brown debug++; 28572f32edf1SLen Brown break; 2858d8af6f5fSLen Brown case 'h': 2859d8af6f5fSLen Brown default: 2860d8af6f5fSLen Brown help(); 2861d8af6f5fSLen Brown exit(1); 2862d8af6f5fSLen Brown case 'i': 2863d8af6f5fSLen Brown interval_sec = atoi(optarg); 2864889facbeSLen Brown break; 28655c56be9aSDirk Brandewie case 'J': 28665c56be9aSDirk Brandewie rapl_joules++; 28675c56be9aSDirk Brandewie break; 2868d8af6f5fSLen Brown case 'M': 2869d8af6f5fSLen Brown sscanf(optarg, "%x", &extra_msr_offset64); 2870d8af6f5fSLen Brown break; 2871d8af6f5fSLen Brown case 'm': 2872d8af6f5fSLen Brown sscanf(optarg, "%x", &extra_msr_offset32); 2873d8af6f5fSLen Brown break; 2874d8af6f5fSLen Brown case 'P': 2875d8af6f5fSLen Brown show_pkg_only++; 2876d8af6f5fSLen Brown break; 2877d8af6f5fSLen Brown case 'p': 2878d8af6f5fSLen Brown show_core_only++; 2879d8af6f5fSLen Brown break; 2880d8af6f5fSLen Brown case 'S': 2881d8af6f5fSLen Brown summary_only++; 2882d8af6f5fSLen Brown break; 2883d8af6f5fSLen Brown case 'T': 2884d8af6f5fSLen Brown tcc_activation_temp_override = atoi(optarg); 2885d8af6f5fSLen Brown break; 2886d8af6f5fSLen Brown case 'v': 2887d8af6f5fSLen Brown print_version(); 2888d8af6f5fSLen Brown exit(0); 2889d8af6f5fSLen Brown break; 2890103a8feaSLen Brown } 2891103a8feaSLen Brown } 2892103a8feaSLen Brown } 2893103a8feaSLen Brown 2894103a8feaSLen Brown int main(int argc, char **argv) 2895103a8feaSLen Brown { 2896103a8feaSLen Brown cmdline(argc, argv); 2897103a8feaSLen Brown 2898d8af6f5fSLen Brown if (debug) 2899d8af6f5fSLen Brown print_version(); 2900103a8feaSLen Brown 2901103a8feaSLen Brown turbostat_init(); 2902103a8feaSLen Brown 29033b4d5c7fSAndy Shevchenko /* dump counters and exit */ 29043b4d5c7fSAndy Shevchenko if (dump_only) 29053b4d5c7fSAndy Shevchenko return get_and_dump_counters(); 29063b4d5c7fSAndy Shevchenko 2907103a8feaSLen Brown /* 2908103a8feaSLen Brown * if any params left, it must be a command to fork 2909103a8feaSLen Brown */ 2910103a8feaSLen Brown if (argc - optind) 2911103a8feaSLen Brown return fork_it(argv + optind); 2912103a8feaSLen Brown else 2913103a8feaSLen Brown turbostat_loop(); 2914103a8feaSLen Brown 2915103a8feaSLen Brown return 0; 2916103a8feaSLen Brown } 2917