1103a8feaSLen Brown /* 2103a8feaSLen Brown * turbostat -- show CPU frequency and C-state residency 3103a8feaSLen Brown * on modern Intel turbo-capable processors. 4103a8feaSLen Brown * 5144b44b1SLen Brown * Copyright (c) 2013 Intel Corporation. 6103a8feaSLen Brown * Len Brown <len.brown@intel.com> 7103a8feaSLen Brown * 8103a8feaSLen Brown * This program is free software; you can redistribute it and/or modify it 9103a8feaSLen Brown * under the terms and conditions of the GNU General Public License, 10103a8feaSLen Brown * version 2, as published by the Free Software Foundation. 11103a8feaSLen Brown * 12103a8feaSLen Brown * This program is distributed in the hope it will be useful, but WITHOUT 13103a8feaSLen Brown * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 14103a8feaSLen Brown * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 15103a8feaSLen Brown * more details. 16103a8feaSLen Brown * 17103a8feaSLen Brown * You should have received a copy of the GNU General Public License along with 18103a8feaSLen Brown * this program; if not, write to the Free Software Foundation, Inc., 19103a8feaSLen Brown * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA. 
20103a8feaSLen Brown */ 21103a8feaSLen Brown 2288c3281fSLen Brown #define _GNU_SOURCE 23b731f311SJosh Triplett #include MSRHEADER 2495aebc44SJosh Triplett #include <stdarg.h> 25103a8feaSLen Brown #include <stdio.h> 26b2c95d90SJosh Triplett #include <err.h> 27103a8feaSLen Brown #include <unistd.h> 28103a8feaSLen Brown #include <sys/types.h> 29103a8feaSLen Brown #include <sys/wait.h> 30103a8feaSLen Brown #include <sys/stat.h> 31103a8feaSLen Brown #include <sys/resource.h> 32103a8feaSLen Brown #include <fcntl.h> 33103a8feaSLen Brown #include <signal.h> 34103a8feaSLen Brown #include <sys/time.h> 35103a8feaSLen Brown #include <stdlib.h> 36103a8feaSLen Brown #include <dirent.h> 37103a8feaSLen Brown #include <string.h> 38103a8feaSLen Brown #include <ctype.h> 3988c3281fSLen Brown #include <sched.h> 402b92865eSJosh Triplett #include <cpuid.h> 4198481e79SLen Brown #include <linux/capability.h> 4298481e79SLen Brown #include <errno.h> 43103a8feaSLen Brown 44103a8feaSLen Brown char *proc_stat = "/proc/stat"; 45103a8feaSLen Brown unsigned int interval_sec = 5; /* set with -i interval_sec */ 46103a8feaSLen Brown unsigned int verbose; /* set with -v */ 47889facbeSLen Brown unsigned int rapl_verbose; /* set with -R */ 485c56be9aSDirk Brandewie unsigned int rapl_joules; /* set with -J */ 49889facbeSLen Brown unsigned int thermal_verbose; /* set with -T */ 50f591c38bSAndy Shevchenko unsigned int summary_only; /* set with -S */ 513b4d5c7fSAndy Shevchenko unsigned int dump_only; /* set with -s */ 52103a8feaSLen Brown unsigned int skip_c0; 53103a8feaSLen Brown unsigned int skip_c1; 54103a8feaSLen Brown unsigned int do_nhm_cstates; 55103a8feaSLen Brown unsigned int do_snb_cstates; 56ca58710fSKristen Carlson Accardi unsigned int do_c8_c9_c10; 57144b44b1SLen Brown unsigned int do_slm_cstates; 58144b44b1SLen Brown unsigned int use_c1_residency_msr; 59103a8feaSLen Brown unsigned int has_aperf; 60889facbeSLen Brown unsigned int has_epb; 61fc04cc67SLen Brown unsigned int units = 1000000; /* 
MHz etc */ 62103a8feaSLen Brown unsigned int genuine_intel; 63103a8feaSLen Brown unsigned int has_invariant_tsc; 64103a8feaSLen Brown unsigned int do_nehalem_platform_info; 65103a8feaSLen Brown unsigned int do_nehalem_turbo_ratio_limit; 666574a5d5SLen Brown unsigned int do_ivt_turbo_ratio_limit; 672f32edf1SLen Brown unsigned int extra_msr_offset32; 682f32edf1SLen Brown unsigned int extra_msr_offset64; 698e180f3cSLen Brown unsigned int extra_delta_offset32; 708e180f3cSLen Brown unsigned int extra_delta_offset64; 711ed51011SLen Brown int do_smi; 72103a8feaSLen Brown double bclk; 73103a8feaSLen Brown unsigned int show_pkg; 74103a8feaSLen Brown unsigned int show_core; 75103a8feaSLen Brown unsigned int show_cpu; 76c98d5d94SLen Brown unsigned int show_pkg_only; 77c98d5d94SLen Brown unsigned int show_core_only; 78c98d5d94SLen Brown char *output_buffer, *outp; 79889facbeSLen Brown unsigned int do_rapl; 80889facbeSLen Brown unsigned int do_dts; 81889facbeSLen Brown unsigned int do_ptm; 82889facbeSLen Brown unsigned int tcc_activation_temp; 83889facbeSLen Brown unsigned int tcc_activation_temp_override; 84889facbeSLen Brown double rapl_power_units, rapl_energy_units, rapl_time_units; 85889facbeSLen Brown double rapl_joule_counter_range; 86*3a9a941dSLen Brown unsigned int do_core_perf_limit_reasons; 87*3a9a941dSLen Brown unsigned int do_gfx_perf_limit_reasons; 88*3a9a941dSLen Brown unsigned int do_ring_perf_limit_reasons; 89889facbeSLen Brown 90889facbeSLen Brown #define RAPL_PKG (1 << 0) 91e6f9bb3cSLen Brown /* 0x610 MSR_PKG_POWER_LIMIT */ 92e6f9bb3cSLen Brown /* 0x611 MSR_PKG_ENERGY_STATUS */ 93e6f9bb3cSLen Brown #define RAPL_PKG_PERF_STATUS (1 << 1) 94e6f9bb3cSLen Brown /* 0x613 MSR_PKG_PERF_STATUS */ 95e6f9bb3cSLen Brown #define RAPL_PKG_POWER_INFO (1 << 2) 96e6f9bb3cSLen Brown /* 0x614 MSR_PKG_POWER_INFO */ 97e6f9bb3cSLen Brown 98889facbeSLen Brown #define RAPL_DRAM (1 << 3) 99e6f9bb3cSLen Brown /* 0x618 MSR_DRAM_POWER_LIMIT */ 100e6f9bb3cSLen Brown /* 0x619 
MSR_DRAM_ENERGY_STATUS */ 101e6f9bb3cSLen Brown /* 0x61c MSR_DRAM_POWER_INFO */ 102e6f9bb3cSLen Brown #define RAPL_DRAM_PERF_STATUS (1 << 4) 103e6f9bb3cSLen Brown /* 0x61b MSR_DRAM_PERF_STATUS */ 104e6f9bb3cSLen Brown 105e6f9bb3cSLen Brown #define RAPL_CORES (1 << 5) 106e6f9bb3cSLen Brown /* 0x638 MSR_PP0_POWER_LIMIT */ 107e6f9bb3cSLen Brown /* 0x639 MSR_PP0_ENERGY_STATUS */ 108e6f9bb3cSLen Brown #define RAPL_CORE_POLICY (1 << 6) 109e6f9bb3cSLen Brown /* 0x63a MSR_PP0_POLICY */ 110e6f9bb3cSLen Brown 111e6f9bb3cSLen Brown 112e6f9bb3cSLen Brown #define RAPL_GFX (1 << 7) 113e6f9bb3cSLen Brown /* 0x640 MSR_PP1_POWER_LIMIT */ 114e6f9bb3cSLen Brown /* 0x641 MSR_PP1_ENERGY_STATUS */ 115e6f9bb3cSLen Brown /* 0x642 MSR_PP1_POLICY */ 116889facbeSLen Brown #define TJMAX_DEFAULT 100 117889facbeSLen Brown 118889facbeSLen Brown #define MAX(a, b) ((a) > (b) ? (a) : (b)) 119103a8feaSLen Brown 120103a8feaSLen Brown int aperf_mperf_unstable; 121103a8feaSLen Brown int backwards_count; 122103a8feaSLen Brown char *progname; 123103a8feaSLen Brown 124c98d5d94SLen Brown cpu_set_t *cpu_present_set, *cpu_affinity_set; 125c98d5d94SLen Brown size_t cpu_present_setsize, cpu_affinity_setsize; 126c98d5d94SLen Brown 127c98d5d94SLen Brown struct thread_data { 128c98d5d94SLen Brown unsigned long long tsc; 129c98d5d94SLen Brown unsigned long long aperf; 130c98d5d94SLen Brown unsigned long long mperf; 131144b44b1SLen Brown unsigned long long c1; 1322f32edf1SLen Brown unsigned long long extra_msr64; 1338e180f3cSLen Brown unsigned long long extra_delta64; 1348e180f3cSLen Brown unsigned long long extra_msr32; 1358e180f3cSLen Brown unsigned long long extra_delta32; 1361ed51011SLen Brown unsigned int smi_count; 137c98d5d94SLen Brown unsigned int cpu_id; 138c98d5d94SLen Brown unsigned int flags; 139c98d5d94SLen Brown #define CPU_IS_FIRST_THREAD_IN_CORE 0x2 140c98d5d94SLen Brown #define CPU_IS_FIRST_CORE_IN_PACKAGE 0x4 141c98d5d94SLen Brown } *thread_even, *thread_odd; 142c98d5d94SLen Brown 143c98d5d94SLen 
Brown struct core_data { 144c98d5d94SLen Brown unsigned long long c3; 145c98d5d94SLen Brown unsigned long long c6; 146c98d5d94SLen Brown unsigned long long c7; 147889facbeSLen Brown unsigned int core_temp_c; 148c98d5d94SLen Brown unsigned int core_id; 149c98d5d94SLen Brown } *core_even, *core_odd; 150c98d5d94SLen Brown 151c98d5d94SLen Brown struct pkg_data { 152c98d5d94SLen Brown unsigned long long pc2; 153c98d5d94SLen Brown unsigned long long pc3; 154c98d5d94SLen Brown unsigned long long pc6; 155c98d5d94SLen Brown unsigned long long pc7; 156ca58710fSKristen Carlson Accardi unsigned long long pc8; 157ca58710fSKristen Carlson Accardi unsigned long long pc9; 158ca58710fSKristen Carlson Accardi unsigned long long pc10; 159c98d5d94SLen Brown unsigned int package_id; 160889facbeSLen Brown unsigned int energy_pkg; /* MSR_PKG_ENERGY_STATUS */ 161889facbeSLen Brown unsigned int energy_dram; /* MSR_DRAM_ENERGY_STATUS */ 162889facbeSLen Brown unsigned int energy_cores; /* MSR_PP0_ENERGY_STATUS */ 163889facbeSLen Brown unsigned int energy_gfx; /* MSR_PP1_ENERGY_STATUS */ 164889facbeSLen Brown unsigned int rapl_pkg_perf_status; /* MSR_PKG_PERF_STATUS */ 165889facbeSLen Brown unsigned int rapl_dram_perf_status; /* MSR_DRAM_PERF_STATUS */ 166889facbeSLen Brown unsigned int pkg_temp_c; 167889facbeSLen Brown 168c98d5d94SLen Brown } *package_even, *package_odd; 169c98d5d94SLen Brown 170c98d5d94SLen Brown #define ODD_COUNTERS thread_odd, core_odd, package_odd 171c98d5d94SLen Brown #define EVEN_COUNTERS thread_even, core_even, package_even 172c98d5d94SLen Brown 173c98d5d94SLen Brown #define GET_THREAD(thread_base, thread_no, core_no, pkg_no) \ 174c98d5d94SLen Brown (thread_base + (pkg_no) * topo.num_cores_per_pkg * \ 175c98d5d94SLen Brown topo.num_threads_per_core + \ 176c98d5d94SLen Brown (core_no) * topo.num_threads_per_core + (thread_no)) 177c98d5d94SLen Brown #define GET_CORE(core_base, core_no, pkg_no) \ 178c98d5d94SLen Brown (core_base + (pkg_no) * topo.num_cores_per_pkg + 
(core_no)) 179c98d5d94SLen Brown #define GET_PKG(pkg_base, pkg_no) (pkg_base + pkg_no) 180c98d5d94SLen Brown 181c98d5d94SLen Brown struct system_summary { 182c98d5d94SLen Brown struct thread_data threads; 183c98d5d94SLen Brown struct core_data cores; 184c98d5d94SLen Brown struct pkg_data packages; 185c98d5d94SLen Brown } sum, average; 186c98d5d94SLen Brown 187c98d5d94SLen Brown 188c98d5d94SLen Brown struct topo_params { 189c98d5d94SLen Brown int num_packages; 190103a8feaSLen Brown int num_cpus; 191c98d5d94SLen Brown int num_cores; 192c98d5d94SLen Brown int max_cpu_num; 193c98d5d94SLen Brown int num_cores_per_pkg; 194c98d5d94SLen Brown int num_threads_per_core; 195c98d5d94SLen Brown } topo; 196103a8feaSLen Brown 197c98d5d94SLen Brown struct timeval tv_even, tv_odd, tv_delta; 198103a8feaSLen Brown 199c98d5d94SLen Brown void setup_all_buffers(void); 200103a8feaSLen Brown 201c98d5d94SLen Brown int cpu_is_not_present(int cpu) 202d15cf7c1SLen Brown { 203c98d5d94SLen Brown return !CPU_ISSET_S(cpu, cpu_present_setsize, cpu_present_set); 204c98d5d94SLen Brown } 205c98d5d94SLen Brown /* 206c98d5d94SLen Brown * run func(thread, core, package) in topology order 207c98d5d94SLen Brown * skip non-present cpus 208c98d5d94SLen Brown */ 209c98d5d94SLen Brown 210c98d5d94SLen Brown int for_all_cpus(int (func)(struct thread_data *, struct core_data *, struct pkg_data *), 211c98d5d94SLen Brown struct thread_data *thread_base, struct core_data *core_base, struct pkg_data *pkg_base) 212c98d5d94SLen Brown { 213c98d5d94SLen Brown int retval, pkg_no, core_no, thread_no; 214c98d5d94SLen Brown 215c98d5d94SLen Brown for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) { 216c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 217c98d5d94SLen Brown for (thread_no = 0; thread_no < 218c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 219c98d5d94SLen Brown struct thread_data *t; 220c98d5d94SLen Brown struct core_data *c; 221c98d5d94SLen Brown struct 
pkg_data *p; 222c98d5d94SLen Brown 223c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 224c98d5d94SLen Brown 225c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 226c98d5d94SLen Brown continue; 227c98d5d94SLen Brown 228c98d5d94SLen Brown c = GET_CORE(core_base, core_no, pkg_no); 229c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 230c98d5d94SLen Brown 231c98d5d94SLen Brown retval = func(t, c, p); 232c98d5d94SLen Brown if (retval) 233c98d5d94SLen Brown return retval; 234c98d5d94SLen Brown } 235c98d5d94SLen Brown } 236c98d5d94SLen Brown } 237d15cf7c1SLen Brown return 0; 238d15cf7c1SLen Brown } 239d15cf7c1SLen Brown 24088c3281fSLen Brown int cpu_migrate(int cpu) 24188c3281fSLen Brown { 242c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 243c98d5d94SLen Brown CPU_SET_S(cpu, cpu_affinity_setsize, cpu_affinity_set); 244c98d5d94SLen Brown if (sched_setaffinity(0, cpu_affinity_setsize, cpu_affinity_set) == -1) 24588c3281fSLen Brown return -1; 24688c3281fSLen Brown else 24788c3281fSLen Brown return 0; 24888c3281fSLen Brown } 24988c3281fSLen Brown 25015aaa346SLen Brown int get_msr(int cpu, off_t offset, unsigned long long *msr) 251103a8feaSLen Brown { 252103a8feaSLen Brown ssize_t retval; 253103a8feaSLen Brown char pathname[32]; 254103a8feaSLen Brown int fd; 255103a8feaSLen Brown 256103a8feaSLen Brown sprintf(pathname, "/dev/cpu/%d/msr", cpu); 257103a8feaSLen Brown fd = open(pathname, O_RDONLY); 25815aaa346SLen Brown if (fd < 0) 25998481e79SLen Brown err(-1, "%s open failed, try chown or chmod +r /dev/cpu/*/msr, or run as root", pathname); 260103a8feaSLen Brown 26115aaa346SLen Brown retval = pread(fd, msr, sizeof *msr, offset); 262103a8feaSLen Brown close(fd); 26315aaa346SLen Brown 26498481e79SLen Brown if (retval != sizeof *msr) 26598481e79SLen Brown err(-1, "%s offset 0x%llx read failed", pathname, (unsigned long long)offset); 26615aaa346SLen Brown 26715aaa346SLen Brown return 0; 268103a8feaSLen Brown } 269103a8feaSLen 
Brown 270fc04cc67SLen Brown /* 271fc04cc67SLen Brown * Example Format w/ field column widths: 272fc04cc67SLen Brown * 273fc04cc67SLen Brown * Package Core CPU Avg_MHz Bzy_MHz TSC_MHz SMI %Busy CPU_%c1 CPU_%c3 CPU_%c6 CPU_%c7 CoreTmp PkgTmp Pkg%pc2 Pkg%pc3 Pkg%pc6 Pkg%pc7 PkgWatt CorWatt GFXWatt 274e7c95ff3SLen Brown * 123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678123456781234567812345678 275fc04cc67SLen Brown */ 276fc04cc67SLen Brown 277a829eb4dSLen Brown void print_header(void) 278103a8feaSLen Brown { 279103a8feaSLen Brown if (show_pkg) 280fc04cc67SLen Brown outp += sprintf(outp, " Package"); 281103a8feaSLen Brown if (show_core) 282fc04cc67SLen Brown outp += sprintf(outp, " Core"); 283103a8feaSLen Brown if (show_cpu) 284c98d5d94SLen Brown outp += sprintf(outp, " CPU"); 285103a8feaSLen Brown if (has_aperf) 286fc04cc67SLen Brown outp += sprintf(outp, " Avg_MHz"); 287fc04cc67SLen Brown if (do_nhm_cstates) 288fc04cc67SLen Brown outp += sprintf(outp, " %%Busy"); 289fc04cc67SLen Brown if (has_aperf) 290fc04cc67SLen Brown outp += sprintf(outp, " Bzy_MHz"); 291fc04cc67SLen Brown outp += sprintf(outp, " TSC_MHz"); 2921ed51011SLen Brown if (do_smi) 2931ed51011SLen Brown outp += sprintf(outp, " SMI"); 2948e180f3cSLen Brown if (extra_delta_offset32) 295f9240813SLen Brown outp += sprintf(outp, " count 0x%03X", extra_delta_offset32); 2968e180f3cSLen Brown if (extra_delta_offset64) 297f9240813SLen Brown outp += sprintf(outp, " COUNT 0x%03X", extra_delta_offset64); 2982f32edf1SLen Brown if (extra_msr_offset32) 2998e180f3cSLen Brown outp += sprintf(outp, " MSR 0x%03X", extra_msr_offset32); 3002f32edf1SLen Brown if (extra_msr_offset64) 3018e180f3cSLen Brown outp += sprintf(outp, " MSR 0x%03X", extra_msr_offset64); 302103a8feaSLen Brown if (do_nhm_cstates) 303fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c1"); 304144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 
305fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c3"); 306103a8feaSLen Brown if (do_nhm_cstates) 307fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c6"); 308103a8feaSLen Brown if (do_snb_cstates) 309fc04cc67SLen Brown outp += sprintf(outp, " CPU%%c7"); 310889facbeSLen Brown 311889facbeSLen Brown if (do_dts) 312fc04cc67SLen Brown outp += sprintf(outp, " CoreTmp"); 313889facbeSLen Brown if (do_ptm) 314fc04cc67SLen Brown outp += sprintf(outp, " PkgTmp"); 315889facbeSLen Brown 316103a8feaSLen Brown if (do_snb_cstates) 317fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc2"); 318144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 319fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc3"); 320144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 321fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc6"); 322103a8feaSLen Brown if (do_snb_cstates) 323fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc7"); 324ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 325fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc8"); 326fc04cc67SLen Brown outp += sprintf(outp, " Pkg%%pc9"); 327fc04cc67SLen Brown outp += sprintf(outp, " Pk%%pc10"); 328ca58710fSKristen Carlson Accardi } 329103a8feaSLen Brown 3305c56be9aSDirk Brandewie if (do_rapl && !rapl_joules) { 331889facbeSLen Brown if (do_rapl & RAPL_PKG) 332fc04cc67SLen Brown outp += sprintf(outp, " PkgWatt"); 333889facbeSLen Brown if (do_rapl & RAPL_CORES) 334fc04cc67SLen Brown outp += sprintf(outp, " CorWatt"); 335889facbeSLen Brown if (do_rapl & RAPL_GFX) 336fc04cc67SLen Brown outp += sprintf(outp, " GFXWatt"); 337889facbeSLen Brown if (do_rapl & RAPL_DRAM) 338fc04cc67SLen Brown outp += sprintf(outp, " RAMWatt"); 339889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) 340889facbeSLen Brown outp += sprintf(outp, " PKG_%%"); 341889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) 342889facbeSLen Brown outp += sprintf(outp, " RAM_%%"); 3435c56be9aSDirk Brandewie } else { 3445c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG) 
3455c56be9aSDirk Brandewie outp += sprintf(outp, " Pkg_J"); 3465c56be9aSDirk Brandewie if (do_rapl & RAPL_CORES) 3475c56be9aSDirk Brandewie outp += sprintf(outp, " Cor_J"); 3485c56be9aSDirk Brandewie if (do_rapl & RAPL_GFX) 3495c56be9aSDirk Brandewie outp += sprintf(outp, " GFX_J"); 3505c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM) 3515c56be9aSDirk Brandewie outp += sprintf(outp, " RAM_W"); 3525c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG_PERF_STATUS) 3535c56be9aSDirk Brandewie outp += sprintf(outp, " PKG_%%"); 3545c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM_PERF_STATUS) 3555c56be9aSDirk Brandewie outp += sprintf(outp, " RAM_%%"); 3565c56be9aSDirk Brandewie outp += sprintf(outp, " time"); 357889facbeSLen Brown 3585c56be9aSDirk Brandewie } 359c98d5d94SLen Brown outp += sprintf(outp, "\n"); 360103a8feaSLen Brown } 361103a8feaSLen Brown 362c98d5d94SLen Brown int dump_counters(struct thread_data *t, struct core_data *c, 363c98d5d94SLen Brown struct pkg_data *p) 364103a8feaSLen Brown { 3653b4d5c7fSAndy Shevchenko outp += sprintf(outp, "t %p, c %p, p %p\n", t, c, p); 366c98d5d94SLen Brown 367c98d5d94SLen Brown if (t) { 3683b4d5c7fSAndy Shevchenko outp += sprintf(outp, "CPU: %d flags 0x%x\n", 3693b4d5c7fSAndy Shevchenko t->cpu_id, t->flags); 3703b4d5c7fSAndy Shevchenko outp += sprintf(outp, "TSC: %016llX\n", t->tsc); 3713b4d5c7fSAndy Shevchenko outp += sprintf(outp, "aperf: %016llX\n", t->aperf); 3723b4d5c7fSAndy Shevchenko outp += sprintf(outp, "mperf: %016llX\n", t->mperf); 3733b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c1: %016llX\n", t->c1); 3743b4d5c7fSAndy Shevchenko outp += sprintf(outp, "msr0x%x: %08llX\n", 3758e180f3cSLen Brown extra_delta_offset32, t->extra_delta32); 3763b4d5c7fSAndy Shevchenko outp += sprintf(outp, "msr0x%x: %016llX\n", 3778e180f3cSLen Brown extra_delta_offset64, t->extra_delta64); 3783b4d5c7fSAndy Shevchenko outp += sprintf(outp, "msr0x%x: %08llX\n", 3792f32edf1SLen Brown extra_msr_offset32, t->extra_msr32); 3803b4d5c7fSAndy 
Shevchenko outp += sprintf(outp, "msr0x%x: %016llX\n", 3812f32edf1SLen Brown extra_msr_offset64, t->extra_msr64); 3821ed51011SLen Brown if (do_smi) 3833b4d5c7fSAndy Shevchenko outp += sprintf(outp, "SMI: %08X\n", t->smi_count); 384103a8feaSLen Brown } 385103a8feaSLen Brown 386c98d5d94SLen Brown if (c) { 3873b4d5c7fSAndy Shevchenko outp += sprintf(outp, "core: %d\n", c->core_id); 3883b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c3: %016llX\n", c->c3); 3893b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c6: %016llX\n", c->c6); 3903b4d5c7fSAndy Shevchenko outp += sprintf(outp, "c7: %016llX\n", c->c7); 3913b4d5c7fSAndy Shevchenko outp += sprintf(outp, "DTS: %dC\n", c->core_temp_c); 392c98d5d94SLen Brown } 393103a8feaSLen Brown 394c98d5d94SLen Brown if (p) { 3953b4d5c7fSAndy Shevchenko outp += sprintf(outp, "package: %d\n", p->package_id); 3963b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc2: %016llX\n", p->pc2); 3973b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc3: %016llX\n", p->pc3); 3983b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc6: %016llX\n", p->pc6); 3993b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc7: %016llX\n", p->pc7); 4003b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc8: %016llX\n", p->pc8); 4013b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc9: %016llX\n", p->pc9); 4023b4d5c7fSAndy Shevchenko outp += sprintf(outp, "pc10: %016llX\n", p->pc10); 4033b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules PKG: %0X\n", p->energy_pkg); 4043b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules COR: %0X\n", p->energy_cores); 4053b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules GFX: %0X\n", p->energy_gfx); 4063b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Joules RAM: %0X\n", p->energy_dram); 4073b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Throttle PKG: %0X\n", 4083b4d5c7fSAndy Shevchenko p->rapl_pkg_perf_status); 4093b4d5c7fSAndy Shevchenko outp += sprintf(outp, "Throttle RAM: %0X\n", 4103b4d5c7fSAndy Shevchenko p->rapl_dram_perf_status); 
4113b4d5c7fSAndy Shevchenko outp += sprintf(outp, "PTM: %dC\n", p->pkg_temp_c); 412c98d5d94SLen Brown } 4133b4d5c7fSAndy Shevchenko 4143b4d5c7fSAndy Shevchenko outp += sprintf(outp, "\n"); 4153b4d5c7fSAndy Shevchenko 416c98d5d94SLen Brown return 0; 417103a8feaSLen Brown } 418103a8feaSLen Brown 419e23da037SLen Brown /* 420e23da037SLen Brown * column formatting convention & formats 421e23da037SLen Brown */ 422c98d5d94SLen Brown int format_counters(struct thread_data *t, struct core_data *c, 423c98d5d94SLen Brown struct pkg_data *p) 424103a8feaSLen Brown { 425103a8feaSLen Brown double interval_float; 426fc04cc67SLen Brown char *fmt8; 427103a8feaSLen Brown 428c98d5d94SLen Brown /* if showing only 1st thread in core and this isn't one, bail out */ 429c98d5d94SLen Brown if (show_core_only && !(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 430c98d5d94SLen Brown return 0; 431c98d5d94SLen Brown 432c98d5d94SLen Brown /* if showing only 1st thread in pkg and this isn't one, bail out */ 433c98d5d94SLen Brown if (show_pkg_only && !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 434c98d5d94SLen Brown return 0; 435c98d5d94SLen Brown 436103a8feaSLen Brown interval_float = tv_delta.tv_sec + tv_delta.tv_usec/1000000.0; 437103a8feaSLen Brown 438c98d5d94SLen Brown /* topo columns, print blanks on 1st (average) line */ 439c98d5d94SLen Brown if (t == &average.threads) { 440103a8feaSLen Brown if (show_pkg) 441fc04cc67SLen Brown outp += sprintf(outp, " -"); 442103a8feaSLen Brown if (show_core) 443fc04cc67SLen Brown outp += sprintf(outp, " -"); 444103a8feaSLen Brown if (show_cpu) 445fc04cc67SLen Brown outp += sprintf(outp, " -"); 446103a8feaSLen Brown } else { 447c98d5d94SLen Brown if (show_pkg) { 448c98d5d94SLen Brown if (p) 449fc04cc67SLen Brown outp += sprintf(outp, "%8d", p->package_id); 450c98d5d94SLen Brown else 451fc04cc67SLen Brown outp += sprintf(outp, " -"); 452c98d5d94SLen Brown } 453c98d5d94SLen Brown if (show_core) { 454c98d5d94SLen Brown if (c) 455fc04cc67SLen Brown outp += 
sprintf(outp, "%8d", c->core_id); 456c98d5d94SLen Brown else 457fc04cc67SLen Brown outp += sprintf(outp, " -"); 458c98d5d94SLen Brown } 459103a8feaSLen Brown if (show_cpu) 460fc04cc67SLen Brown outp += sprintf(outp, "%8d", t->cpu_id); 461103a8feaSLen Brown } 462fc04cc67SLen Brown 463fc04cc67SLen Brown /* AvgMHz */ 464fc04cc67SLen Brown if (has_aperf) 465fc04cc67SLen Brown outp += sprintf(outp, "%8.0f", 466fc04cc67SLen Brown 1.0 / units * t->aperf / interval_float); 467fc04cc67SLen Brown 468103a8feaSLen Brown /* %c0 */ 469103a8feaSLen Brown if (do_nhm_cstates) { 470103a8feaSLen Brown if (!skip_c0) 471fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * t->mperf/t->tsc); 472103a8feaSLen Brown else 473fc04cc67SLen Brown outp += sprintf(outp, "********"); 474103a8feaSLen Brown } 475103a8feaSLen Brown 476fc04cc67SLen Brown /* BzyMHz */ 477fc04cc67SLen Brown if (has_aperf) 478fc04cc67SLen Brown outp += sprintf(outp, "%8.0f", 479fc04cc67SLen Brown 1.0 * t->tsc / units * t->aperf / t->mperf / interval_float); 480103a8feaSLen Brown 481103a8feaSLen Brown /* TSC */ 482fc04cc67SLen Brown outp += sprintf(outp, "%8.0f", 1.0 * t->tsc/units/interval_float); 483103a8feaSLen Brown 4841ed51011SLen Brown /* SMI */ 4851ed51011SLen Brown if (do_smi) 486fc04cc67SLen Brown outp += sprintf(outp, "%8d", t->smi_count); 4871ed51011SLen Brown 4888e180f3cSLen Brown /* delta */ 4898e180f3cSLen Brown if (extra_delta_offset32) 4908e180f3cSLen Brown outp += sprintf(outp, " %11llu", t->extra_delta32); 4918e180f3cSLen Brown 4928e180f3cSLen Brown /* DELTA */ 4938e180f3cSLen Brown if (extra_delta_offset64) 4948e180f3cSLen Brown outp += sprintf(outp, " %11llu", t->extra_delta64); 4952f32edf1SLen Brown /* msr */ 4962f32edf1SLen Brown if (extra_msr_offset32) 4978e180f3cSLen Brown outp += sprintf(outp, " 0x%08llx", t->extra_msr32); 4982f32edf1SLen Brown 499130ff304SLen Brown /* MSR */ 5002f32edf1SLen Brown if (extra_msr_offset64) 5012f32edf1SLen Brown outp += sprintf(outp, " 0x%016llx", 
t->extra_msr64); 502130ff304SLen Brown 503103a8feaSLen Brown if (do_nhm_cstates) { 504103a8feaSLen Brown if (!skip_c1) 505fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * t->c1/t->tsc); 506103a8feaSLen Brown else 507fc04cc67SLen Brown outp += sprintf(outp, "********"); 508103a8feaSLen Brown } 509c98d5d94SLen Brown 510c98d5d94SLen Brown /* print per-core data only for 1st thread in core */ 511c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 512c98d5d94SLen Brown goto done; 513c98d5d94SLen Brown 514144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 515fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * c->c3/t->tsc); 516103a8feaSLen Brown if (do_nhm_cstates) 517fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * c->c6/t->tsc); 518103a8feaSLen Brown if (do_snb_cstates) 519fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * c->c7/t->tsc); 520c98d5d94SLen Brown 521889facbeSLen Brown if (do_dts) 522fc04cc67SLen Brown outp += sprintf(outp, "%8d", c->core_temp_c); 523889facbeSLen Brown 524c98d5d94SLen Brown /* print per-package data only for 1st core in package */ 525c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 526c98d5d94SLen Brown goto done; 527c98d5d94SLen Brown 528889facbeSLen Brown if (do_ptm) 529fc04cc67SLen Brown outp += sprintf(outp, "%8d", p->pkg_temp_c); 530889facbeSLen Brown 531103a8feaSLen Brown if (do_snb_cstates) 532fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc2/t->tsc); 533144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 534fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc3/t->tsc); 535144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 536fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc6/t->tsc); 537103a8feaSLen Brown if (do_snb_cstates) 538fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc7/t->tsc); 539ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 540fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 
100.0 * p->pc8/t->tsc); 541fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc9/t->tsc); 542fc04cc67SLen Brown outp += sprintf(outp, "%8.2f", 100.0 * p->pc10/t->tsc); 543ca58710fSKristen Carlson Accardi } 544889facbeSLen Brown 545889facbeSLen Brown /* 546889facbeSLen Brown * If measurement interval exceeds minimum RAPL Joule Counter range, 547889facbeSLen Brown * indicate that results are suspect by printing "**" in fraction place. 548889facbeSLen Brown */ 549fc04cc67SLen Brown if (interval_float < rapl_joule_counter_range) 550fc04cc67SLen Brown fmt8 = "%8.2f"; 551fc04cc67SLen Brown else 552fc04cc67SLen Brown fmt8 = " %6.0f**"; 553889facbeSLen Brown 5545c56be9aSDirk Brandewie if (do_rapl && !rapl_joules) { 555889facbeSLen Brown if (do_rapl & RAPL_PKG) 556fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_pkg * rapl_energy_units / interval_float); 557889facbeSLen Brown if (do_rapl & RAPL_CORES) 558fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_cores * rapl_energy_units / interval_float); 559889facbeSLen Brown if (do_rapl & RAPL_GFX) 560fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_gfx * rapl_energy_units / interval_float); 561889facbeSLen Brown if (do_rapl & RAPL_DRAM) 562fc04cc67SLen Brown outp += sprintf(outp, fmt8, p->energy_dram * rapl_energy_units / interval_float); 563889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) 564fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_pkg_perf_status * rapl_time_units / interval_float); 565889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) 566fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_dram_perf_status * rapl_time_units / interval_float); 5675c56be9aSDirk Brandewie } else { 5685c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG) 569fc04cc67SLen Brown outp += sprintf(outp, fmt8, 5705c56be9aSDirk Brandewie p->energy_pkg * rapl_energy_units); 5715c56be9aSDirk Brandewie if (do_rapl & RAPL_CORES) 572fc04cc67SLen Brown outp += sprintf(outp, fmt8, 
5735c56be9aSDirk Brandewie p->energy_cores * rapl_energy_units); 5745c56be9aSDirk Brandewie if (do_rapl & RAPL_GFX) 575fc04cc67SLen Brown outp += sprintf(outp, fmt8, 5765c56be9aSDirk Brandewie p->energy_gfx * rapl_energy_units); 5775c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM) 578fc04cc67SLen Brown outp += sprintf(outp, fmt8, 5795c56be9aSDirk Brandewie p->energy_dram * rapl_energy_units); 5805c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG_PERF_STATUS) 581fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_pkg_perf_status * rapl_time_units / interval_float); 5825c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM_PERF_STATUS) 583fc04cc67SLen Brown outp += sprintf(outp, fmt8, 100.0 * p->rapl_dram_perf_status * rapl_time_units / interval_float); 584fc04cc67SLen Brown outp += sprintf(outp, fmt8, interval_float); 585889facbeSLen Brown 5865c56be9aSDirk Brandewie } 587c98d5d94SLen Brown done: 588c98d5d94SLen Brown outp += sprintf(outp, "\n"); 589c98d5d94SLen Brown 590c98d5d94SLen Brown return 0; 591103a8feaSLen Brown } 592103a8feaSLen Brown 593c98d5d94SLen Brown void flush_stdout() 594103a8feaSLen Brown { 595c98d5d94SLen Brown fputs(output_buffer, stdout); 596ddac0d68SLen Brown fflush(stdout); 597c98d5d94SLen Brown outp = output_buffer; 598c98d5d94SLen Brown } 599c98d5d94SLen Brown void flush_stderr() 600c98d5d94SLen Brown { 601c98d5d94SLen Brown fputs(output_buffer, stderr); 602c98d5d94SLen Brown outp = output_buffer; 603c98d5d94SLen Brown } 604c98d5d94SLen Brown void format_all_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 605c98d5d94SLen Brown { 606e23da037SLen Brown static int printed; 607103a8feaSLen Brown 608e23da037SLen Brown if (!printed || !summary_only) 609103a8feaSLen Brown print_header(); 610103a8feaSLen Brown 611c98d5d94SLen Brown if (topo.num_cpus > 1) 612c98d5d94SLen Brown format_counters(&average.threads, &average.cores, 613c98d5d94SLen Brown &average.packages); 614103a8feaSLen Brown 615e23da037SLen Brown printed = 1; 
616e23da037SLen Brown 617e23da037SLen Brown if (summary_only) 618e23da037SLen Brown return; 619e23da037SLen Brown 620c98d5d94SLen Brown for_all_cpus(format_counters, t, c, p); 621103a8feaSLen Brown } 622103a8feaSLen Brown 623889facbeSLen Brown #define DELTA_WRAP32(new, old) \ 624889facbeSLen Brown if (new > old) { \ 625889facbeSLen Brown old = new - old; \ 626889facbeSLen Brown } else { \ 627889facbeSLen Brown old = 0x100000000 + new - old; \ 628889facbeSLen Brown } 629889facbeSLen Brown 630c98d5d94SLen Brown void 631c98d5d94SLen Brown delta_package(struct pkg_data *new, struct pkg_data *old) 632103a8feaSLen Brown { 633c98d5d94SLen Brown old->pc2 = new->pc2 - old->pc2; 634c98d5d94SLen Brown old->pc3 = new->pc3 - old->pc3; 635c98d5d94SLen Brown old->pc6 = new->pc6 - old->pc6; 636c98d5d94SLen Brown old->pc7 = new->pc7 - old->pc7; 637ca58710fSKristen Carlson Accardi old->pc8 = new->pc8 - old->pc8; 638ca58710fSKristen Carlson Accardi old->pc9 = new->pc9 - old->pc9; 639ca58710fSKristen Carlson Accardi old->pc10 = new->pc10 - old->pc10; 640889facbeSLen Brown old->pkg_temp_c = new->pkg_temp_c; 641889facbeSLen Brown 642889facbeSLen Brown DELTA_WRAP32(new->energy_pkg, old->energy_pkg); 643889facbeSLen Brown DELTA_WRAP32(new->energy_cores, old->energy_cores); 644889facbeSLen Brown DELTA_WRAP32(new->energy_gfx, old->energy_gfx); 645889facbeSLen Brown DELTA_WRAP32(new->energy_dram, old->energy_dram); 646889facbeSLen Brown DELTA_WRAP32(new->rapl_pkg_perf_status, old->rapl_pkg_perf_status); 647889facbeSLen Brown DELTA_WRAP32(new->rapl_dram_perf_status, old->rapl_dram_perf_status); 648103a8feaSLen Brown } 649103a8feaSLen Brown 650c98d5d94SLen Brown void 651c98d5d94SLen Brown delta_core(struct core_data *new, struct core_data *old) 652c98d5d94SLen Brown { 653c98d5d94SLen Brown old->c3 = new->c3 - old->c3; 654c98d5d94SLen Brown old->c6 = new->c6 - old->c6; 655c98d5d94SLen Brown old->c7 = new->c7 - old->c7; 656889facbeSLen Brown old->core_temp_c = new->core_temp_c; 657103a8feaSLen 
Brown } 658c98d5d94SLen Brown 659c3ae331dSLen Brown /* 660c3ae331dSLen Brown * old = new - old 661c3ae331dSLen Brown */ 662c98d5d94SLen Brown void 663c98d5d94SLen Brown delta_thread(struct thread_data *new, struct thread_data *old, 664c98d5d94SLen Brown struct core_data *core_delta) 665c98d5d94SLen Brown { 666c98d5d94SLen Brown old->tsc = new->tsc - old->tsc; 667c98d5d94SLen Brown 668103a8feaSLen Brown /* check for TSC < 1 Mcycles over interval */ 669b2c95d90SJosh Triplett if (old->tsc < (1000 * 1000)) 670b2c95d90SJosh Triplett errx(-3, "Insanely slow TSC rate, TSC stops in idle?\n" 671b2c95d90SJosh Triplett "You can disable all c-states by booting with \"idle=poll\"\n" 672b2c95d90SJosh Triplett "or just the deep ones with \"processor.max_cstate=1\""); 673103a8feaSLen Brown 674c98d5d94SLen Brown old->c1 = new->c1 - old->c1; 675c98d5d94SLen Brown 676c98d5d94SLen Brown if ((new->aperf > old->aperf) && (new->mperf > old->mperf)) { 677c98d5d94SLen Brown old->aperf = new->aperf - old->aperf; 678c98d5d94SLen Brown old->mperf = new->mperf - old->mperf; 679c98d5d94SLen Brown } else { 680c98d5d94SLen Brown 681103a8feaSLen Brown if (!aperf_mperf_unstable) { 682103a8feaSLen Brown fprintf(stderr, "%s: APERF or MPERF went backwards *\n", progname); 683103a8feaSLen Brown fprintf(stderr, "* Frequency results do not cover entire interval *\n"); 684103a8feaSLen Brown fprintf(stderr, "* fix this by running Linux-2.6.30 or later *\n"); 685103a8feaSLen Brown 686103a8feaSLen Brown aperf_mperf_unstable = 1; 687103a8feaSLen Brown } 688103a8feaSLen Brown /* 689103a8feaSLen Brown * mperf delta is likely a huge "positive" number 690103a8feaSLen Brown * can not use it for calculating c0 time 691103a8feaSLen Brown */ 692103a8feaSLen Brown skip_c0 = 1; 693103a8feaSLen Brown skip_c1 = 1; 694103a8feaSLen Brown } 695103a8feaSLen Brown 696c98d5d94SLen Brown 697144b44b1SLen Brown if (use_c1_residency_msr) { 698144b44b1SLen Brown /* 699144b44b1SLen Brown * Some models have a dedicated C1 residency 
MSR, 700144b44b1SLen Brown * which should be more accurate than the derivation below. 701144b44b1SLen Brown */ 702144b44b1SLen Brown } else { 703103a8feaSLen Brown /* 704c3ae331dSLen Brown * As counter collection is not atomic, 705c3ae331dSLen Brown * it is possible for mperf's non-halted cycles + idle states 706103a8feaSLen Brown * to exceed TSC's all cycles: show c1 = 0% in that case. 707103a8feaSLen Brown */ 708c3ae331dSLen Brown if ((old->mperf + core_delta->c3 + core_delta->c6 + core_delta->c7) > old->tsc) 709c98d5d94SLen Brown old->c1 = 0; 710c98d5d94SLen Brown else { 711c98d5d94SLen Brown /* normal case, derive c1 */ 712c98d5d94SLen Brown old->c1 = old->tsc - old->mperf - core_delta->c3 713c98d5d94SLen Brown - core_delta->c6 - core_delta->c7; 714c98d5d94SLen Brown } 715144b44b1SLen Brown } 716c3ae331dSLen Brown 717c98d5d94SLen Brown if (old->mperf == 0) { 718c3ae331dSLen Brown if (verbose > 1) fprintf(stderr, "cpu%d MPERF 0!\n", old->cpu_id); 719c98d5d94SLen Brown old->mperf = 1; /* divide by 0 protection */ 720c98d5d94SLen Brown } 721103a8feaSLen Brown 7228e180f3cSLen Brown old->extra_delta32 = new->extra_delta32 - old->extra_delta32; 7238e180f3cSLen Brown old->extra_delta32 &= 0xFFFFFFFF; 7248e180f3cSLen Brown 7258e180f3cSLen Brown old->extra_delta64 = new->extra_delta64 - old->extra_delta64; 7268e180f3cSLen Brown 727103a8feaSLen Brown /* 7288e180f3cSLen Brown * Extra MSR is just a snapshot, simply copy latest w/o subtracting 729103a8feaSLen Brown */ 7302f32edf1SLen Brown old->extra_msr32 = new->extra_msr32; 7312f32edf1SLen Brown old->extra_msr64 = new->extra_msr64; 7321ed51011SLen Brown 7331ed51011SLen Brown if (do_smi) 7341ed51011SLen Brown old->smi_count = new->smi_count - old->smi_count; 735103a8feaSLen Brown } 736c98d5d94SLen Brown 737c98d5d94SLen Brown int delta_cpu(struct thread_data *t, struct core_data *c, 738c98d5d94SLen Brown struct pkg_data *p, struct thread_data *t2, 739c98d5d94SLen Brown struct core_data *c2, struct pkg_data *p2) 
740c98d5d94SLen Brown { 741c98d5d94SLen Brown /* calculate core delta only for 1st thread in core */ 742c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_THREAD_IN_CORE) 743c98d5d94SLen Brown delta_core(c, c2); 744c98d5d94SLen Brown 745c98d5d94SLen Brown /* always calculate thread delta */ 746c98d5d94SLen Brown delta_thread(t, t2, c2); /* c2 is core delta */ 747c98d5d94SLen Brown 748c98d5d94SLen Brown /* calculate package delta only for 1st core in package */ 749c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE) 750c98d5d94SLen Brown delta_package(p, p2); 751c98d5d94SLen Brown 752103a8feaSLen Brown return 0; 753103a8feaSLen Brown } 754103a8feaSLen Brown 755c98d5d94SLen Brown void clear_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 756103a8feaSLen Brown { 757c98d5d94SLen Brown t->tsc = 0; 758c98d5d94SLen Brown t->aperf = 0; 759c98d5d94SLen Brown t->mperf = 0; 760c98d5d94SLen Brown t->c1 = 0; 761103a8feaSLen Brown 7621ed51011SLen Brown t->smi_count = 0; 7638e180f3cSLen Brown t->extra_delta32 = 0; 7648e180f3cSLen Brown t->extra_delta64 = 0; 7658e180f3cSLen Brown 766c98d5d94SLen Brown /* tells format_counters to dump all fields from this set */ 767c98d5d94SLen Brown t->flags = CPU_IS_FIRST_THREAD_IN_CORE | CPU_IS_FIRST_CORE_IN_PACKAGE; 768c98d5d94SLen Brown 769c98d5d94SLen Brown c->c3 = 0; 770c98d5d94SLen Brown c->c6 = 0; 771c98d5d94SLen Brown c->c7 = 0; 772889facbeSLen Brown c->core_temp_c = 0; 773c98d5d94SLen Brown 774c98d5d94SLen Brown p->pc2 = 0; 775c98d5d94SLen Brown p->pc3 = 0; 776c98d5d94SLen Brown p->pc6 = 0; 777c98d5d94SLen Brown p->pc7 = 0; 778ca58710fSKristen Carlson Accardi p->pc8 = 0; 779ca58710fSKristen Carlson Accardi p->pc9 = 0; 780ca58710fSKristen Carlson Accardi p->pc10 = 0; 781889facbeSLen Brown 782889facbeSLen Brown p->energy_pkg = 0; 783889facbeSLen Brown p->energy_dram = 0; 784889facbeSLen Brown p->energy_cores = 0; 785889facbeSLen Brown p->energy_gfx = 0; 786889facbeSLen Brown p->rapl_pkg_perf_status = 0; 
787889facbeSLen Brown p->rapl_dram_perf_status = 0; 788889facbeSLen Brown p->pkg_temp_c = 0; 789103a8feaSLen Brown } 790c98d5d94SLen Brown int sum_counters(struct thread_data *t, struct core_data *c, 791c98d5d94SLen Brown struct pkg_data *p) 792103a8feaSLen Brown { 793c98d5d94SLen Brown average.threads.tsc += t->tsc; 794c98d5d94SLen Brown average.threads.aperf += t->aperf; 795c98d5d94SLen Brown average.threads.mperf += t->mperf; 796c98d5d94SLen Brown average.threads.c1 += t->c1; 79715aaa346SLen Brown 7988e180f3cSLen Brown average.threads.extra_delta32 += t->extra_delta32; 7998e180f3cSLen Brown average.threads.extra_delta64 += t->extra_delta64; 8008e180f3cSLen Brown 801c98d5d94SLen Brown /* sum per-core values only for 1st thread in core */ 802c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 803c98d5d94SLen Brown return 0; 804c98d5d94SLen Brown 805c98d5d94SLen Brown average.cores.c3 += c->c3; 806c98d5d94SLen Brown average.cores.c6 += c->c6; 807c98d5d94SLen Brown average.cores.c7 += c->c7; 808c98d5d94SLen Brown 809889facbeSLen Brown average.cores.core_temp_c = MAX(average.cores.core_temp_c, c->core_temp_c); 810889facbeSLen Brown 811c98d5d94SLen Brown /* sum per-pkg values only for 1st core in pkg */ 812c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 813c98d5d94SLen Brown return 0; 814c98d5d94SLen Brown 815c98d5d94SLen Brown average.packages.pc2 += p->pc2; 816c98d5d94SLen Brown average.packages.pc3 += p->pc3; 817c98d5d94SLen Brown average.packages.pc6 += p->pc6; 818c98d5d94SLen Brown average.packages.pc7 += p->pc7; 819ca58710fSKristen Carlson Accardi average.packages.pc8 += p->pc8; 820ca58710fSKristen Carlson Accardi average.packages.pc9 += p->pc9; 821ca58710fSKristen Carlson Accardi average.packages.pc10 += p->pc10; 822c98d5d94SLen Brown 823889facbeSLen Brown average.packages.energy_pkg += p->energy_pkg; 824889facbeSLen Brown average.packages.energy_dram += p->energy_dram; 825889facbeSLen Brown average.packages.energy_cores += 
p->energy_cores; 826889facbeSLen Brown average.packages.energy_gfx += p->energy_gfx; 827889facbeSLen Brown 828889facbeSLen Brown average.packages.pkg_temp_c = MAX(average.packages.pkg_temp_c, p->pkg_temp_c); 829889facbeSLen Brown 830889facbeSLen Brown average.packages.rapl_pkg_perf_status += p->rapl_pkg_perf_status; 831889facbeSLen Brown average.packages.rapl_dram_perf_status += p->rapl_dram_perf_status; 832c98d5d94SLen Brown return 0; 833c98d5d94SLen Brown } 834c98d5d94SLen Brown /* 835c98d5d94SLen Brown * sum the counters for all cpus in the system 836c98d5d94SLen Brown * compute the weighted average 837c98d5d94SLen Brown */ 838c98d5d94SLen Brown void compute_average(struct thread_data *t, struct core_data *c, 839c98d5d94SLen Brown struct pkg_data *p) 840c98d5d94SLen Brown { 841c98d5d94SLen Brown clear_counters(&average.threads, &average.cores, &average.packages); 842c98d5d94SLen Brown 843c98d5d94SLen Brown for_all_cpus(sum_counters, t, c, p); 844c98d5d94SLen Brown 845c98d5d94SLen Brown average.threads.tsc /= topo.num_cpus; 846c98d5d94SLen Brown average.threads.aperf /= topo.num_cpus; 847c98d5d94SLen Brown average.threads.mperf /= topo.num_cpus; 848c98d5d94SLen Brown average.threads.c1 /= topo.num_cpus; 849c98d5d94SLen Brown 8508e180f3cSLen Brown average.threads.extra_delta32 /= topo.num_cpus; 8518e180f3cSLen Brown average.threads.extra_delta32 &= 0xFFFFFFFF; 8528e180f3cSLen Brown 8538e180f3cSLen Brown average.threads.extra_delta64 /= topo.num_cpus; 8548e180f3cSLen Brown 855c98d5d94SLen Brown average.cores.c3 /= topo.num_cores; 856c98d5d94SLen Brown average.cores.c6 /= topo.num_cores; 857c98d5d94SLen Brown average.cores.c7 /= topo.num_cores; 858c98d5d94SLen Brown 859c98d5d94SLen Brown average.packages.pc2 /= topo.num_packages; 860c98d5d94SLen Brown average.packages.pc3 /= topo.num_packages; 861c98d5d94SLen Brown average.packages.pc6 /= topo.num_packages; 862c98d5d94SLen Brown average.packages.pc7 /= topo.num_packages; 863ca58710fSKristen Carlson Accardi 
864ca58710fSKristen Carlson Accardi average.packages.pc8 /= topo.num_packages; 865ca58710fSKristen Carlson Accardi average.packages.pc9 /= topo.num_packages; 866ca58710fSKristen Carlson Accardi average.packages.pc10 /= topo.num_packages; 867c98d5d94SLen Brown } 868c98d5d94SLen Brown 869c98d5d94SLen Brown static unsigned long long rdtsc(void) 870c98d5d94SLen Brown { 871c98d5d94SLen Brown unsigned int low, high; 872c98d5d94SLen Brown 873c98d5d94SLen Brown asm volatile("rdtsc" : "=a" (low), "=d" (high)); 874c98d5d94SLen Brown 875c98d5d94SLen Brown return low | ((unsigned long long)high) << 32; 876c98d5d94SLen Brown } 877c98d5d94SLen Brown 878c98d5d94SLen Brown 879c98d5d94SLen Brown /* 880c98d5d94SLen Brown * get_counters(...) 881c98d5d94SLen Brown * migrate to cpu 882c98d5d94SLen Brown * acquire and record local counters for that cpu 883c98d5d94SLen Brown */ 884c98d5d94SLen Brown int get_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 885c98d5d94SLen Brown { 886c98d5d94SLen Brown int cpu = t->cpu_id; 887889facbeSLen Brown unsigned long long msr; 888c98d5d94SLen Brown 889e52966c0SLen Brown if (cpu_migrate(cpu)) { 890e52966c0SLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 89115aaa346SLen Brown return -1; 892e52966c0SLen Brown } 89315aaa346SLen Brown 894c98d5d94SLen Brown t->tsc = rdtsc(); /* we are running on local CPU of interest */ 89515aaa346SLen Brown 89615aaa346SLen Brown if (has_aperf) { 8979c63a650SLen Brown if (get_msr(cpu, MSR_IA32_APERF, &t->aperf)) 898c98d5d94SLen Brown return -3; 8999c63a650SLen Brown if (get_msr(cpu, MSR_IA32_MPERF, &t->mperf)) 900c98d5d94SLen Brown return -4; 90188c3281fSLen Brown } 90288c3281fSLen Brown 9031ed51011SLen Brown if (do_smi) { 9041ed51011SLen Brown if (get_msr(cpu, MSR_SMI_COUNT, &msr)) 9051ed51011SLen Brown return -5; 9061ed51011SLen Brown t->smi_count = msr & 0xFFFFFFFF; 9071ed51011SLen Brown } 9088e180f3cSLen Brown if (extra_delta_offset32) { 909889facbeSLen Brown if (get_msr(cpu, 
extra_delta_offset32, &msr)) 9102f32edf1SLen Brown return -5; 911889facbeSLen Brown t->extra_delta32 = msr & 0xFFFFFFFF; 9128e180f3cSLen Brown } 9138e180f3cSLen Brown 9148e180f3cSLen Brown if (extra_delta_offset64) 9158e180f3cSLen Brown if (get_msr(cpu, extra_delta_offset64, &t->extra_delta64)) 9168e180f3cSLen Brown return -5; 9178e180f3cSLen Brown 9188e180f3cSLen Brown if (extra_msr_offset32) { 919889facbeSLen Brown if (get_msr(cpu, extra_msr_offset32, &msr)) 9208e180f3cSLen Brown return -5; 921889facbeSLen Brown t->extra_msr32 = msr & 0xFFFFFFFF; 9228e180f3cSLen Brown } 9232f32edf1SLen Brown 9242f32edf1SLen Brown if (extra_msr_offset64) 9252f32edf1SLen Brown if (get_msr(cpu, extra_msr_offset64, &t->extra_msr64)) 926c98d5d94SLen Brown return -5; 927c98d5d94SLen Brown 928144b44b1SLen Brown if (use_c1_residency_msr) { 929144b44b1SLen Brown if (get_msr(cpu, MSR_CORE_C1_RES, &t->c1)) 930144b44b1SLen Brown return -6; 931144b44b1SLen Brown } 932144b44b1SLen Brown 933c98d5d94SLen Brown /* collect core counters only for 1st thread in core */ 934c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 935c98d5d94SLen Brown return 0; 936c98d5d94SLen Brown 937144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) { 938c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C3_RESIDENCY, &c->c3)) 939c98d5d94SLen Brown return -6; 940144b44b1SLen Brown } 941144b44b1SLen Brown 942144b44b1SLen Brown if (do_nhm_cstates) { 943c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C6_RESIDENCY, &c->c6)) 944c98d5d94SLen Brown return -7; 945103a8feaSLen Brown } 94615aaa346SLen Brown 94715aaa346SLen Brown if (do_snb_cstates) 948c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C7_RESIDENCY, &c->c7)) 949c98d5d94SLen Brown return -8; 950c98d5d94SLen Brown 951889facbeSLen Brown if (do_dts) { 952889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr)) 953889facbeSLen Brown return -9; 954889facbeSLen Brown c->core_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F); 955889facbeSLen Brown } 
956889facbeSLen Brown 957889facbeSLen Brown 958c98d5d94SLen Brown /* collect package counters only for 1st core in package */ 959c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 960c98d5d94SLen Brown return 0; 96115aaa346SLen Brown 962144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) { 963c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C3_RESIDENCY, &p->pc3)) 964c98d5d94SLen Brown return -9; 965c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C6_RESIDENCY, &p->pc6)) 966c98d5d94SLen Brown return -10; 96715aaa346SLen Brown } 96815aaa346SLen Brown if (do_snb_cstates) { 969c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C2_RESIDENCY, &p->pc2)) 970c98d5d94SLen Brown return -11; 971c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C7_RESIDENCY, &p->pc7)) 972c98d5d94SLen Brown return -12; 97315aaa346SLen Brown } 974ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 975ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C8_RESIDENCY, &p->pc8)) 976ca58710fSKristen Carlson Accardi return -13; 977ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C9_RESIDENCY, &p->pc9)) 978ca58710fSKristen Carlson Accardi return -13; 979ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C10_RESIDENCY, &p->pc10)) 980ca58710fSKristen Carlson Accardi return -13; 981ca58710fSKristen Carlson Accardi } 982889facbeSLen Brown if (do_rapl & RAPL_PKG) { 983889facbeSLen Brown if (get_msr(cpu, MSR_PKG_ENERGY_STATUS, &msr)) 984889facbeSLen Brown return -13; 985889facbeSLen Brown p->energy_pkg = msr & 0xFFFFFFFF; 986889facbeSLen Brown } 987889facbeSLen Brown if (do_rapl & RAPL_CORES) { 988889facbeSLen Brown if (get_msr(cpu, MSR_PP0_ENERGY_STATUS, &msr)) 989889facbeSLen Brown return -14; 990889facbeSLen Brown p->energy_cores = msr & 0xFFFFFFFF; 991889facbeSLen Brown } 992889facbeSLen Brown if (do_rapl & RAPL_DRAM) { 993889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_ENERGY_STATUS, &msr)) 994889facbeSLen Brown return -15; 995889facbeSLen Brown p->energy_dram = msr & 0xFFFFFFFF; 
996889facbeSLen Brown } 997889facbeSLen Brown if (do_rapl & RAPL_GFX) { 998889facbeSLen Brown if (get_msr(cpu, MSR_PP1_ENERGY_STATUS, &msr)) 999889facbeSLen Brown return -16; 1000889facbeSLen Brown p->energy_gfx = msr & 0xFFFFFFFF; 1001889facbeSLen Brown } 1002889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) { 1003889facbeSLen Brown if (get_msr(cpu, MSR_PKG_PERF_STATUS, &msr)) 1004889facbeSLen Brown return -16; 1005889facbeSLen Brown p->rapl_pkg_perf_status = msr & 0xFFFFFFFF; 1006889facbeSLen Brown } 1007889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) { 1008889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_PERF_STATUS, &msr)) 1009889facbeSLen Brown return -16; 1010889facbeSLen Brown p->rapl_dram_perf_status = msr & 0xFFFFFFFF; 1011889facbeSLen Brown } 1012889facbeSLen Brown if (do_ptm) { 1013889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, &msr)) 1014889facbeSLen Brown return -17; 1015889facbeSLen Brown p->pkg_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F); 1016889facbeSLen Brown } 101715aaa346SLen Brown return 0; 1018103a8feaSLen Brown } 1019103a8feaSLen Brown 1020c98d5d94SLen Brown void print_verbose_header(void) 1021103a8feaSLen Brown { 1022103a8feaSLen Brown unsigned long long msr; 1023103a8feaSLen Brown unsigned int ratio; 1024103a8feaSLen Brown 1025103a8feaSLen Brown if (!do_nehalem_platform_info) 1026103a8feaSLen Brown return; 1027103a8feaSLen Brown 10289c63a650SLen Brown get_msr(0, MSR_NHM_PLATFORM_INFO, &msr); 1029103a8feaSLen Brown 1030889facbeSLen Brown fprintf(stderr, "cpu0: MSR_NHM_PLATFORM_INFO: 0x%08llx\n", msr); 10316574a5d5SLen Brown 1032103a8feaSLen Brown ratio = (msr >> 40) & 0xFF; 1033103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max efficiency\n", 1034103a8feaSLen Brown ratio, bclk, ratio * bclk); 1035103a8feaSLen Brown 1036103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 1037103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz TSC frequency\n", 1038103a8feaSLen Brown ratio, bclk, ratio * bclk); 
1039103a8feaSLen Brown 104067920418SLen Brown get_msr(0, MSR_IA32_POWER_CTL, &msr); 1041144b44b1SLen Brown fprintf(stderr, "cpu0: MSR_IA32_POWER_CTL: 0x%08llx (C1E auto-promotion: %sabled)\n", 104267920418SLen Brown msr, msr & 0x2 ? "EN" : "DIS"); 104367920418SLen Brown 10446574a5d5SLen Brown if (!do_ivt_turbo_ratio_limit) 10456574a5d5SLen Brown goto print_nhm_turbo_ratio_limits; 10466574a5d5SLen Brown 10476574a5d5SLen Brown get_msr(0, MSR_IVT_TURBO_RATIO_LIMIT, &msr); 10486574a5d5SLen Brown 1049889facbeSLen Brown fprintf(stderr, "cpu0: MSR_IVT_TURBO_RATIO_LIMIT: 0x%08llx\n", msr); 10506574a5d5SLen Brown 10516574a5d5SLen Brown ratio = (msr >> 56) & 0xFF; 10526574a5d5SLen Brown if (ratio) 10536574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 16 active cores\n", 10546574a5d5SLen Brown ratio, bclk, ratio * bclk); 10556574a5d5SLen Brown 10566574a5d5SLen Brown ratio = (msr >> 48) & 0xFF; 10576574a5d5SLen Brown if (ratio) 10586574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 15 active cores\n", 10596574a5d5SLen Brown ratio, bclk, ratio * bclk); 10606574a5d5SLen Brown 10616574a5d5SLen Brown ratio = (msr >> 40) & 0xFF; 10626574a5d5SLen Brown if (ratio) 10636574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 14 active cores\n", 10646574a5d5SLen Brown ratio, bclk, ratio * bclk); 10656574a5d5SLen Brown 10666574a5d5SLen Brown ratio = (msr >> 32) & 0xFF; 10676574a5d5SLen Brown if (ratio) 10686574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 13 active cores\n", 10696574a5d5SLen Brown ratio, bclk, ratio * bclk); 10706574a5d5SLen Brown 10716574a5d5SLen Brown ratio = (msr >> 24) & 0xFF; 10726574a5d5SLen Brown if (ratio) 10736574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 12 active cores\n", 10746574a5d5SLen Brown ratio, bclk, ratio * bclk); 10756574a5d5SLen Brown 10766574a5d5SLen Brown ratio = (msr >> 16) & 0xFF; 10776574a5d5SLen Brown if (ratio) 10786574a5d5SLen Brown fprintf(stderr, "%d * %.0f = 
%.0f MHz max turbo 11 active cores\n", 10796574a5d5SLen Brown ratio, bclk, ratio * bclk); 10806574a5d5SLen Brown 10816574a5d5SLen Brown ratio = (msr >> 8) & 0xFF; 10826574a5d5SLen Brown if (ratio) 10836574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 10 active cores\n", 10846574a5d5SLen Brown ratio, bclk, ratio * bclk); 10856574a5d5SLen Brown 10866574a5d5SLen Brown ratio = (msr >> 0) & 0xFF; 10876574a5d5SLen Brown if (ratio) 10886574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 9 active cores\n", 10896574a5d5SLen Brown ratio, bclk, ratio * bclk); 10906574a5d5SLen Brown 10916574a5d5SLen Brown print_nhm_turbo_ratio_limits: 1092889facbeSLen Brown get_msr(0, MSR_NHM_SNB_PKG_CST_CFG_CTL, &msr); 1093889facbeSLen Brown 1094889facbeSLen Brown #define SNB_C1_AUTO_UNDEMOTE (1UL << 27) 1095889facbeSLen Brown #define SNB_C3_AUTO_UNDEMOTE (1UL << 28) 1096889facbeSLen Brown 1097889facbeSLen Brown fprintf(stderr, "cpu0: MSR_NHM_SNB_PKG_CST_CFG_CTL: 0x%08llx", msr); 1098889facbeSLen Brown 1099889facbeSLen Brown fprintf(stderr, " (%s%s%s%s%slocked: pkg-cstate-limit=%d: ", 1100889facbeSLen Brown (msr & SNB_C3_AUTO_UNDEMOTE) ? "UNdemote-C3, " : "", 1101889facbeSLen Brown (msr & SNB_C1_AUTO_UNDEMOTE) ? "UNdemote-C1, " : "", 1102889facbeSLen Brown (msr & NHM_C3_AUTO_DEMOTE) ? "demote-C3, " : "", 1103889facbeSLen Brown (msr & NHM_C1_AUTO_DEMOTE) ? "demote-C1, " : "", 1104889facbeSLen Brown (msr & (1 << 15)) ? "" : "UN", 1105889facbeSLen Brown (unsigned int)msr & 7); 1106889facbeSLen Brown 1107889facbeSLen Brown 1108889facbeSLen Brown switch(msr & 0x7) { 1109889facbeSLen Brown case 0: 1110144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "no pkg states" : "pc0"); 1111889facbeSLen Brown break; 1112889facbeSLen Brown case 1: 1113144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "no pkg states" : do_snb_cstates ? "pc2" : "pc0"); 1114889facbeSLen Brown break; 1115889facbeSLen Brown case 2: 1116144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? 
"invalid" : do_snb_cstates ? "pc6-noret" : "pc3"); 1117889facbeSLen Brown break; 1118889facbeSLen Brown case 3: 1119144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "invalid" : "pc6"); 1120889facbeSLen Brown break; 1121889facbeSLen Brown case 4: 1122144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "pc4" : "pc7"); 1123889facbeSLen Brown break; 1124889facbeSLen Brown case 5: 1125144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "invalid" : do_snb_cstates ? "pc7s" : "invalid"); 1126144b44b1SLen Brown break; 1127144b44b1SLen Brown case 6: 1128144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "pc6" : "invalid"); 1129889facbeSLen Brown break; 1130889facbeSLen Brown case 7: 1131144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "pc7" : "unlimited"); 1132889facbeSLen Brown break; 1133889facbeSLen Brown default: 1134889facbeSLen Brown fprintf(stderr, "invalid"); 1135889facbeSLen Brown } 1136889facbeSLen Brown fprintf(stderr, ")\n"); 1137103a8feaSLen Brown 1138103a8feaSLen Brown if (!do_nehalem_turbo_ratio_limit) 1139103a8feaSLen Brown return; 1140103a8feaSLen Brown 11419c63a650SLen Brown get_msr(0, MSR_NHM_TURBO_RATIO_LIMIT, &msr); 1142103a8feaSLen Brown 1143889facbeSLen Brown fprintf(stderr, "cpu0: MSR_NHM_TURBO_RATIO_LIMIT: 0x%08llx\n", msr); 11446574a5d5SLen Brown 11456574a5d5SLen Brown ratio = (msr >> 56) & 0xFF; 11466574a5d5SLen Brown if (ratio) 11476574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 8 active cores\n", 11486574a5d5SLen Brown ratio, bclk, ratio * bclk); 11496574a5d5SLen Brown 11506574a5d5SLen Brown ratio = (msr >> 48) & 0xFF; 11516574a5d5SLen Brown if (ratio) 11526574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 7 active cores\n", 11536574a5d5SLen Brown ratio, bclk, ratio * bclk); 11546574a5d5SLen Brown 11556574a5d5SLen Brown ratio = (msr >> 40) & 0xFF; 11566574a5d5SLen Brown if (ratio) 11576574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 6 active cores\n", 11586574a5d5SLen Brown ratio, bclk, 
ratio * bclk); 11596574a5d5SLen Brown 11606574a5d5SLen Brown ratio = (msr >> 32) & 0xFF; 11616574a5d5SLen Brown if (ratio) 11626574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 5 active cores\n", 11636574a5d5SLen Brown ratio, bclk, ratio * bclk); 11646574a5d5SLen Brown 1165103a8feaSLen Brown ratio = (msr >> 24) & 0xFF; 1166103a8feaSLen Brown if (ratio) 1167103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 4 active cores\n", 1168103a8feaSLen Brown ratio, bclk, ratio * bclk); 1169103a8feaSLen Brown 1170103a8feaSLen Brown ratio = (msr >> 16) & 0xFF; 1171103a8feaSLen Brown if (ratio) 1172103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 3 active cores\n", 1173103a8feaSLen Brown ratio, bclk, ratio * bclk); 1174103a8feaSLen Brown 1175103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 1176103a8feaSLen Brown if (ratio) 1177103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 2 active cores\n", 1178103a8feaSLen Brown ratio, bclk, ratio * bclk); 1179103a8feaSLen Brown 1180103a8feaSLen Brown ratio = (msr >> 0) & 0xFF; 1181103a8feaSLen Brown if (ratio) 1182103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 1 active cores\n", 1183103a8feaSLen Brown ratio, bclk, ratio * bclk); 1184*3a9a941dSLen Brown 1185103a8feaSLen Brown } 1186103a8feaSLen Brown 1187c98d5d94SLen Brown void free_all_buffers(void) 1188103a8feaSLen Brown { 1189c98d5d94SLen Brown CPU_FREE(cpu_present_set); 1190c98d5d94SLen Brown cpu_present_set = NULL; 1191c98d5d94SLen Brown cpu_present_set = 0; 1192103a8feaSLen Brown 1193c98d5d94SLen Brown CPU_FREE(cpu_affinity_set); 1194c98d5d94SLen Brown cpu_affinity_set = NULL; 1195c98d5d94SLen Brown cpu_affinity_setsize = 0; 1196103a8feaSLen Brown 1197c98d5d94SLen Brown free(thread_even); 1198c98d5d94SLen Brown free(core_even); 1199c98d5d94SLen Brown free(package_even); 1200103a8feaSLen Brown 1201c98d5d94SLen Brown thread_even = NULL; 1202c98d5d94SLen Brown core_even = NULL; 1203c98d5d94SLen Brown 
package_even = NULL; 1204103a8feaSLen Brown 1205c98d5d94SLen Brown free(thread_odd); 1206c98d5d94SLen Brown free(core_odd); 1207c98d5d94SLen Brown free(package_odd); 1208103a8feaSLen Brown 1209c98d5d94SLen Brown thread_odd = NULL; 1210c98d5d94SLen Brown core_odd = NULL; 1211c98d5d94SLen Brown package_odd = NULL; 1212103a8feaSLen Brown 1213c98d5d94SLen Brown free(output_buffer); 1214c98d5d94SLen Brown output_buffer = NULL; 1215c98d5d94SLen Brown outp = NULL; 1216103a8feaSLen Brown } 1217103a8feaSLen Brown 1218103a8feaSLen Brown /* 121957a42a34SJosh Triplett * Open a file, and exit on failure 122057a42a34SJosh Triplett */ 122157a42a34SJosh Triplett FILE *fopen_or_die(const char *path, const char *mode) 122257a42a34SJosh Triplett { 122357a42a34SJosh Triplett FILE *filep = fopen(path, "r"); 1224b2c95d90SJosh Triplett if (!filep) 1225b2c95d90SJosh Triplett err(1, "%s: open failed", path); 122657a42a34SJosh Triplett return filep; 122757a42a34SJosh Triplett } 122857a42a34SJosh Triplett 122957a42a34SJosh Triplett /* 123095aebc44SJosh Triplett * Parse a file containing a single int. 123195aebc44SJosh Triplett */ 123295aebc44SJosh Triplett int parse_int_file(const char *fmt, ...) 
/*
 * cpu_is_first_sibling_in_core(cpu)
 * return 1 if given CPU is 1st HT sibling in the core,
 * i.e. if it equals the leading number of its thread_siblings_list
 */
int cpu_is_first_sibling_in_core(int cpu)
{
	int first_listed;

	first_listed = parse_int_file("/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu);

	return first_listed == cpu;
}

/*
 * cpu_is_first_core_in_package(cpu)
 * return 1 if given CPU is 1st core in package,
 * i.e. if it equals the leading number of its core_siblings_list
 */
int cpu_is_first_core_in_package(int cpu)
{
	int first_listed;

	first_listed = parse_int_file("/sys/devices/system/cpu/cpu%d/topology/core_siblings_list", cpu);

	return first_listed == cpu;
}

/*
 * get_physical_package_id(cpu)
 * return the number stored in the cpu's physical_package_id file
 */
int get_physical_package_id(int cpu)
{
	int package_id;

	package_id = parse_int_file("/sys/devices/system/cpu/cpu%d/topology/physical_package_id", cpu);

	return package_id;
}
/*
 * get_num_ht_siblings(cpu)
 * return 2 if the cpu's thread_siblings_list starts with two numbers
 * separated by a single character, otherwise return 1
 */
int get_num_ht_siblings(int cpu)
{
	char path[80];
	char separator;
	int first_sibling, second_sibling;
	int fields;
	FILE *filep;

	sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu);
	filep = fopen_or_die(path, "r");

	/*
	 * file format:
	 * a pair of numbers with a character between them means
	 * 2 siblings (eg. 1-2, or 1,4); otherwise 1 sibling (self).
	 */
	fields = fscanf(filep, "%d%c%d\n", &first_sibling, &separator, &second_sibling);

	fclose(filep);

	return (fields == 3) ? 2 : 1;
}
pkg_no < topo.num_packages; ++pkg_no) { 1317c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 1318c98d5d94SLen Brown for (thread_no = 0; thread_no < 1319c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 1320c98d5d94SLen Brown struct thread_data *t, *t2; 1321c98d5d94SLen Brown struct core_data *c, *c2; 1322c98d5d94SLen Brown struct pkg_data *p, *p2; 1323c98d5d94SLen Brown 1324c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 1325c98d5d94SLen Brown 1326c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 1327c98d5d94SLen Brown continue; 1328c98d5d94SLen Brown 1329c98d5d94SLen Brown t2 = GET_THREAD(thread_base2, thread_no, core_no, pkg_no); 1330c98d5d94SLen Brown 1331c98d5d94SLen Brown c = GET_CORE(core_base, core_no, pkg_no); 1332c98d5d94SLen Brown c2 = GET_CORE(core_base2, core_no, pkg_no); 1333c98d5d94SLen Brown 1334c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 1335c98d5d94SLen Brown p2 = GET_PKG(pkg_base2, pkg_no); 1336c98d5d94SLen Brown 1337c98d5d94SLen Brown retval = func(t, c, p, t2, c2, p2); 1338c98d5d94SLen Brown if (retval) 1339c98d5d94SLen Brown return retval; 1340c98d5d94SLen Brown } 1341c98d5d94SLen Brown } 1342c98d5d94SLen Brown } 1343c98d5d94SLen Brown return 0; 1344c98d5d94SLen Brown } 1345c98d5d94SLen Brown 1346c98d5d94SLen Brown /* 1347c98d5d94SLen Brown * run func(cpu) on every cpu in /proc/stat 1348c98d5d94SLen Brown * return max_cpu number 1349c98d5d94SLen Brown */ 1350c98d5d94SLen Brown int for_all_proc_cpus(int (func)(int)) 1351103a8feaSLen Brown { 1352103a8feaSLen Brown FILE *fp; 1353c98d5d94SLen Brown int cpu_num; 1354103a8feaSLen Brown int retval; 1355103a8feaSLen Brown 135657a42a34SJosh Triplett fp = fopen_or_die(proc_stat, "r"); 1357103a8feaSLen Brown 1358103a8feaSLen Brown retval = fscanf(fp, "cpu %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n"); 1359b2c95d90SJosh Triplett if (retval != 0) 1360b2c95d90SJosh Triplett err(1, "%s: failed to parse format", proc_stat); 
1361103a8feaSLen Brown 1362c98d5d94SLen Brown while (1) { 1363c98d5d94SLen Brown retval = fscanf(fp, "cpu%u %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n", &cpu_num); 1364103a8feaSLen Brown if (retval != 1) 1365103a8feaSLen Brown break; 1366103a8feaSLen Brown 1367c98d5d94SLen Brown retval = func(cpu_num); 1368c98d5d94SLen Brown if (retval) { 1369c98d5d94SLen Brown fclose(fp); 1370c98d5d94SLen Brown return(retval); 1371c98d5d94SLen Brown } 1372103a8feaSLen Brown } 1373103a8feaSLen Brown fclose(fp); 1374c98d5d94SLen Brown return 0; 1375103a8feaSLen Brown } 1376103a8feaSLen Brown 1377103a8feaSLen Brown void re_initialize(void) 1378103a8feaSLen Brown { 1379c98d5d94SLen Brown free_all_buffers(); 1380c98d5d94SLen Brown setup_all_buffers(); 1381c98d5d94SLen Brown printf("turbostat: re-initialized with num_cpus %d\n", topo.num_cpus); 1382103a8feaSLen Brown } 1383103a8feaSLen Brown 1384c98d5d94SLen Brown 1385103a8feaSLen Brown /* 1386c98d5d94SLen Brown * count_cpus() 1387c98d5d94SLen Brown * remember the last one seen, it will be the max 1388103a8feaSLen Brown */ 1389c98d5d94SLen Brown int count_cpus(int cpu) 1390103a8feaSLen Brown { 1391c98d5d94SLen Brown if (topo.max_cpu_num < cpu) 1392c98d5d94SLen Brown topo.max_cpu_num = cpu; 1393103a8feaSLen Brown 1394c98d5d94SLen Brown topo.num_cpus += 1; 1395c98d5d94SLen Brown return 0; 1396103a8feaSLen Brown } 1397c98d5d94SLen Brown int mark_cpu_present(int cpu) 1398c98d5d94SLen Brown { 1399c98d5d94SLen Brown CPU_SET_S(cpu, cpu_present_setsize, cpu_present_set); 140015aaa346SLen Brown return 0; 1401103a8feaSLen Brown } 1402103a8feaSLen Brown 1403103a8feaSLen Brown void turbostat_loop() 1404103a8feaSLen Brown { 1405c98d5d94SLen Brown int retval; 1406e52966c0SLen Brown int restarted = 0; 1407c98d5d94SLen Brown 1408103a8feaSLen Brown restart: 1409e52966c0SLen Brown restarted++; 1410e52966c0SLen Brown 1411c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 1412d91bb17cSLen Brown if (retval < -1) { 1413d91bb17cSLen Brown 
exit(retval); 1414d91bb17cSLen Brown } else if (retval == -1) { 1415e52966c0SLen Brown if (restarted > 1) { 1416e52966c0SLen Brown exit(retval); 1417e52966c0SLen Brown } 1418c98d5d94SLen Brown re_initialize(); 1419c98d5d94SLen Brown goto restart; 1420c98d5d94SLen Brown } 1421e52966c0SLen Brown restarted = 0; 1422103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 1423103a8feaSLen Brown 1424103a8feaSLen Brown while (1) { 1425c98d5d94SLen Brown if (for_all_proc_cpus(cpu_is_not_present)) { 1426103a8feaSLen Brown re_initialize(); 1427103a8feaSLen Brown goto restart; 1428103a8feaSLen Brown } 1429103a8feaSLen Brown sleep(interval_sec); 1430c98d5d94SLen Brown retval = for_all_cpus(get_counters, ODD_COUNTERS); 1431d91bb17cSLen Brown if (retval < -1) { 1432d91bb17cSLen Brown exit(retval); 1433d91bb17cSLen Brown } else if (retval == -1) { 143415aaa346SLen Brown re_initialize(); 143515aaa346SLen Brown goto restart; 143615aaa346SLen Brown } 1437103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 1438103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 1439c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 1440c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 1441c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 1442c98d5d94SLen Brown flush_stdout(); 144315aaa346SLen Brown sleep(interval_sec); 1444c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 1445d91bb17cSLen Brown if (retval < -1) { 1446d91bb17cSLen Brown exit(retval); 1447d91bb17cSLen Brown } else if (retval == -1) { 1448103a8feaSLen Brown re_initialize(); 1449103a8feaSLen Brown goto restart; 1450103a8feaSLen Brown } 1451103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 1452103a8feaSLen Brown timersub(&tv_even, &tv_odd, &tv_delta); 1453c98d5d94SLen Brown for_all_cpus_2(delta_cpu, EVEN_COUNTERS, ODD_COUNTERS); 1454c98d5d94SLen Brown compute_average(ODD_COUNTERS); 1455c98d5d94SLen Brown 
/*
 * check_dev_msr()
 *
 * Verify that /dev/cpu/0/msr can be stat()ed.  If it cannot, report the
 * failure through err() with exit status -5 and suggest loading the
 * msr module.
 */
void check_dev_msr()
{
	struct stat msr_stat;

	if (stat("/dev/cpu/0/msr", &msr_stat) == 0)
		return;

	err(-5, "no /dev/cpu/0/msr\nTry \"# modprobe msr\"");
}
if (do_exit) 1498b2c95d90SJosh Triplett if (getuid() != 0) 149998481e79SLen Brown warnx("Or simply run as root"); 150098481e79SLen Brown 150198481e79SLen Brown if (do_exit) 150298481e79SLen Brown exit(-6); 1503103a8feaSLen Brown } 1504103a8feaSLen Brown 1505103a8feaSLen Brown int has_nehalem_turbo_ratio_limit(unsigned int family, unsigned int model) 1506103a8feaSLen Brown { 1507103a8feaSLen Brown if (!genuine_intel) 1508103a8feaSLen Brown return 0; 1509103a8feaSLen Brown 1510103a8feaSLen Brown if (family != 6) 1511103a8feaSLen Brown return 0; 1512103a8feaSLen Brown 1513103a8feaSLen Brown switch (model) { 1514103a8feaSLen Brown case 0x1A: /* Core i7, Xeon 5500 series - Bloomfield, Gainstown NHM-EP */ 1515103a8feaSLen Brown case 0x1E: /* Core i7 and i5 Processor - Clarksfield, Lynnfield, Jasper Forest */ 1516103a8feaSLen Brown case 0x1F: /* Core i7 and i5 Processor - Nehalem */ 1517103a8feaSLen Brown case 0x25: /* Westmere Client - Clarkdale, Arrandale */ 1518103a8feaSLen Brown case 0x2C: /* Westmere EP - Gulftown */ 1519103a8feaSLen Brown case 0x2A: /* SNB */ 1520103a8feaSLen Brown case 0x2D: /* SNB Xeon */ 1521553575f1SLen Brown case 0x3A: /* IVB */ 15221300651bSLen Brown case 0x3E: /* IVB Xeon */ 152370b43400SLen Brown case 0x3C: /* HSW */ 1524e6f9bb3cSLen Brown case 0x3F: /* HSX */ 152570b43400SLen Brown case 0x45: /* HSW */ 1526149c2319SLen Brown case 0x46: /* HSW */ 1527144b44b1SLen Brown case 0x37: /* BYT */ 1528144b44b1SLen Brown case 0x4D: /* AVN */ 15294e8e863fSLen Brown case 0x3D: /* BDW */ 15304e8e863fSLen Brown case 0x4F: /* BDX */ 15314e8e863fSLen Brown case 0x56: /* BDX-DE */ 1532103a8feaSLen Brown return 1; 1533103a8feaSLen Brown case 0x2E: /* Nehalem-EX Xeon - Beckton */ 1534103a8feaSLen Brown case 0x2F: /* Westmere-EX Xeon - Eagleton */ 1535103a8feaSLen Brown default: 1536103a8feaSLen Brown return 0; 1537103a8feaSLen Brown } 1538103a8feaSLen Brown } 15396574a5d5SLen Brown int has_ivt_turbo_ratio_limit(unsigned int family, unsigned int model) 
15406574a5d5SLen Brown { 15416574a5d5SLen Brown if (!genuine_intel) 15426574a5d5SLen Brown return 0; 15436574a5d5SLen Brown 15446574a5d5SLen Brown if (family != 6) 15456574a5d5SLen Brown return 0; 15466574a5d5SLen Brown 15476574a5d5SLen Brown switch (model) { 15486574a5d5SLen Brown case 0x3E: /* IVB Xeon */ 15496574a5d5SLen Brown return 1; 15506574a5d5SLen Brown default: 15516574a5d5SLen Brown return 0; 15526574a5d5SLen Brown } 15536574a5d5SLen Brown } 15546574a5d5SLen Brown 1555889facbeSLen Brown /* 1556889facbeSLen Brown * print_epb() 1557889facbeSLen Brown * Decode the ENERGY_PERF_BIAS MSR 1558889facbeSLen Brown */ 1559889facbeSLen Brown int print_epb(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1560889facbeSLen Brown { 1561889facbeSLen Brown unsigned long long msr; 1562889facbeSLen Brown char *epb_string; 1563889facbeSLen Brown int cpu; 1564889facbeSLen Brown 1565889facbeSLen Brown if (!has_epb) 1566889facbeSLen Brown return 0; 1567889facbeSLen Brown 1568889facbeSLen Brown cpu = t->cpu_id; 1569889facbeSLen Brown 1570889facbeSLen Brown /* EPB is per-package */ 1571889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1572889facbeSLen Brown return 0; 1573889facbeSLen Brown 1574889facbeSLen Brown if (cpu_migrate(cpu)) { 1575889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1576889facbeSLen Brown return -1; 1577889facbeSLen Brown } 1578889facbeSLen Brown 1579889facbeSLen Brown if (get_msr(cpu, MSR_IA32_ENERGY_PERF_BIAS, &msr)) 1580889facbeSLen Brown return 0; 1581889facbeSLen Brown 1582889facbeSLen Brown switch (msr & 0x7) { 1583889facbeSLen Brown case ENERGY_PERF_BIAS_PERFORMANCE: 1584889facbeSLen Brown epb_string = "performance"; 1585889facbeSLen Brown break; 1586889facbeSLen Brown case ENERGY_PERF_BIAS_NORMAL: 1587889facbeSLen Brown epb_string = "balanced"; 1588889facbeSLen Brown break; 1589889facbeSLen Brown case ENERGY_PERF_BIAS_POWERSAVE: 1590889facbeSLen 
Brown epb_string = "powersave"; 1591889facbeSLen Brown break; 1592889facbeSLen Brown default: 1593889facbeSLen Brown epb_string = "custom"; 1594889facbeSLen Brown break; 1595889facbeSLen Brown } 1596889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_ENERGY_PERF_BIAS: 0x%08llx (%s)\n", cpu, msr, epb_string); 1597889facbeSLen Brown 1598889facbeSLen Brown return 0; 1599889facbeSLen Brown } 1600889facbeSLen Brown 1601*3a9a941dSLen Brown /* 1602*3a9a941dSLen Brown * print_perf_limit() 1603*3a9a941dSLen Brown */ 1604*3a9a941dSLen Brown int print_perf_limit(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1605*3a9a941dSLen Brown { 1606*3a9a941dSLen Brown unsigned long long msr; 1607*3a9a941dSLen Brown int cpu; 1608*3a9a941dSLen Brown 1609*3a9a941dSLen Brown cpu = t->cpu_id; 1610*3a9a941dSLen Brown 1611*3a9a941dSLen Brown /* per-package */ 1612*3a9a941dSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1613*3a9a941dSLen Brown return 0; 1614*3a9a941dSLen Brown 1615*3a9a941dSLen Brown if (cpu_migrate(cpu)) { 1616*3a9a941dSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1617*3a9a941dSLen Brown return -1; 1618*3a9a941dSLen Brown } 1619*3a9a941dSLen Brown 1620*3a9a941dSLen Brown if (do_core_perf_limit_reasons) { 1621*3a9a941dSLen Brown get_msr(cpu, MSR_CORE_PERF_LIMIT_REASONS, &msr); 1622*3a9a941dSLen Brown fprintf(stderr, "cpu%d: MSR_CORE_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr); 1623*3a9a941dSLen Brown fprintf(stderr, " (Active: %s%s%s%s%s%s%s%s%s%s%s%s%s%s)", 1624*3a9a941dSLen Brown (msr & 1 << 0) ? "PROCHOT, " : "", 1625*3a9a941dSLen Brown (msr & 1 << 1) ? "ThermStatus, " : "", 1626*3a9a941dSLen Brown (msr & 1 << 2) ? "bit2, " : "", 1627*3a9a941dSLen Brown (msr & 1 << 4) ? "Graphics, " : "", 1628*3a9a941dSLen Brown (msr & 1 << 5) ? "Auto-HWP, " : "", 1629*3a9a941dSLen Brown (msr & 1 << 6) ? "VR-Therm, " : "", 1630*3a9a941dSLen Brown (msr & 1 << 8) ? 
"Amps, " : "", 1631*3a9a941dSLen Brown (msr & 1 << 9) ? "CorePwr, " : "", 1632*3a9a941dSLen Brown (msr & 1 << 10) ? "PkgPwrL1, " : "", 1633*3a9a941dSLen Brown (msr & 1 << 11) ? "PkgPwrL2, " : "", 1634*3a9a941dSLen Brown (msr & 1 << 12) ? "MultiCoreTurbo, " : "", 1635*3a9a941dSLen Brown (msr & 1 << 13) ? "Transitions, " : "", 1636*3a9a941dSLen Brown (msr & 1 << 14) ? "bit14, " : "", 1637*3a9a941dSLen Brown (msr & 1 << 15) ? "bit15, " : ""); 1638*3a9a941dSLen Brown fprintf(stderr, " (Logged: %s%s%s%s%s%s%s%s%s%s%s%s%s%s)\n", 1639*3a9a941dSLen Brown (msr & 1 << 16) ? "PROCHOT, " : "", 1640*3a9a941dSLen Brown (msr & 1 << 17) ? "ThermStatus, " : "", 1641*3a9a941dSLen Brown (msr & 1 << 18) ? "bit18, " : "", 1642*3a9a941dSLen Brown (msr & 1 << 20) ? "Graphics, " : "", 1643*3a9a941dSLen Brown (msr & 1 << 21) ? "Auto-HWP, " : "", 1644*3a9a941dSLen Brown (msr & 1 << 22) ? "VR-Therm, " : "", 1645*3a9a941dSLen Brown (msr & 1 << 24) ? "Amps, " : "", 1646*3a9a941dSLen Brown (msr & 1 << 25) ? "CorePwr, " : "", 1647*3a9a941dSLen Brown (msr & 1 << 26) ? "PkgPwrL1, " : "", 1648*3a9a941dSLen Brown (msr & 1 << 27) ? "PkgPwrL2, " : "", 1649*3a9a941dSLen Brown (msr & 1 << 28) ? "MultiCoreTurbo, " : "", 1650*3a9a941dSLen Brown (msr & 1 << 29) ? "Transitions, " : "", 1651*3a9a941dSLen Brown (msr & 1 << 30) ? "bit30, " : "", 1652*3a9a941dSLen Brown (msr & 1 << 31) ? "bit31, " : ""); 1653*3a9a941dSLen Brown 1654*3a9a941dSLen Brown } 1655*3a9a941dSLen Brown if (do_gfx_perf_limit_reasons) { 1656*3a9a941dSLen Brown get_msr(cpu, MSR_GFX_PERF_LIMIT_REASONS, &msr); 1657*3a9a941dSLen Brown fprintf(stderr, "cpu%d: MSR_GFX_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr); 1658*3a9a941dSLen Brown fprintf(stderr, " (Active: %s%s%s%s%s%s%s%s)", 1659*3a9a941dSLen Brown (msr & 1 << 0) ? "PROCHOT, " : "", 1660*3a9a941dSLen Brown (msr & 1 << 1) ? "ThermStatus, " : "", 1661*3a9a941dSLen Brown (msr & 1 << 4) ? "Graphics, " : "", 1662*3a9a941dSLen Brown (msr & 1 << 6) ? 
"VR-Therm, " : "", 1663*3a9a941dSLen Brown (msr & 1 << 8) ? "Amps, " : "", 1664*3a9a941dSLen Brown (msr & 1 << 9) ? "GFXPwr, " : "", 1665*3a9a941dSLen Brown (msr & 1 << 10) ? "PkgPwrL1, " : "", 1666*3a9a941dSLen Brown (msr & 1 << 11) ? "PkgPwrL2, " : ""); 1667*3a9a941dSLen Brown fprintf(stderr, " (Logged: %s%s%s%s%s%s%s%s)\n", 1668*3a9a941dSLen Brown (msr & 1 << 16) ? "PROCHOT, " : "", 1669*3a9a941dSLen Brown (msr & 1 << 17) ? "ThermStatus, " : "", 1670*3a9a941dSLen Brown (msr & 1 << 20) ? "Graphics, " : "", 1671*3a9a941dSLen Brown (msr & 1 << 22) ? "VR-Therm, " : "", 1672*3a9a941dSLen Brown (msr & 1 << 24) ? "Amps, " : "", 1673*3a9a941dSLen Brown (msr & 1 << 25) ? "GFXPwr, " : "", 1674*3a9a941dSLen Brown (msr & 1 << 26) ? "PkgPwrL1, " : "", 1675*3a9a941dSLen Brown (msr & 1 << 27) ? "PkgPwrL2, " : ""); 1676*3a9a941dSLen Brown } 1677*3a9a941dSLen Brown if (do_ring_perf_limit_reasons) { 1678*3a9a941dSLen Brown get_msr(cpu, MSR_RING_PERF_LIMIT_REASONS, &msr); 1679*3a9a941dSLen Brown fprintf(stderr, "cpu%d: MSR_RING_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr); 1680*3a9a941dSLen Brown fprintf(stderr, " (Active: %s%s%s%s%s%s)", 1681*3a9a941dSLen Brown (msr & 1 << 0) ? "PROCHOT, " : "", 1682*3a9a941dSLen Brown (msr & 1 << 1) ? "ThermStatus, " : "", 1683*3a9a941dSLen Brown (msr & 1 << 6) ? "VR-Therm, " : "", 1684*3a9a941dSLen Brown (msr & 1 << 8) ? "Amps, " : "", 1685*3a9a941dSLen Brown (msr & 1 << 10) ? "PkgPwrL1, " : "", 1686*3a9a941dSLen Brown (msr & 1 << 11) ? "PkgPwrL2, " : ""); 1687*3a9a941dSLen Brown fprintf(stderr, " (Logged: %s%s%s%s%s%s)\n", 1688*3a9a941dSLen Brown (msr & 1 << 16) ? "PROCHOT, " : "", 1689*3a9a941dSLen Brown (msr & 1 << 17) ? "ThermStatus, " : "", 1690*3a9a941dSLen Brown (msr & 1 << 22) ? "VR-Therm, " : "", 1691*3a9a941dSLen Brown (msr & 1 << 24) ? "Amps, " : "", 1692*3a9a941dSLen Brown (msr & 1 << 26) ? "PkgPwrL1, " : "", 1693*3a9a941dSLen Brown (msr & 1 << 27) ? 
"PkgPwrL2, " : ""); 1694*3a9a941dSLen Brown } 1695*3a9a941dSLen Brown return 0; 1696*3a9a941dSLen Brown } 1697*3a9a941dSLen Brown 1698889facbeSLen Brown #define RAPL_POWER_GRANULARITY 0x7FFF /* 15 bit power granularity */ 1699889facbeSLen Brown #define RAPL_TIME_GRANULARITY 0x3F /* 6 bit time granularity */ 1700889facbeSLen Brown 1701144b44b1SLen Brown double get_tdp(model) 1702144b44b1SLen Brown { 1703144b44b1SLen Brown unsigned long long msr; 1704144b44b1SLen Brown 1705144b44b1SLen Brown if (do_rapl & RAPL_PKG_POWER_INFO) 1706144b44b1SLen Brown if (!get_msr(0, MSR_PKG_POWER_INFO, &msr)) 1707144b44b1SLen Brown return ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units; 1708144b44b1SLen Brown 1709144b44b1SLen Brown switch (model) { 1710144b44b1SLen Brown case 0x37: 1711144b44b1SLen Brown case 0x4D: 1712144b44b1SLen Brown return 30.0; 1713144b44b1SLen Brown default: 1714144b44b1SLen Brown return 135.0; 1715144b44b1SLen Brown } 1716144b44b1SLen Brown } 1717144b44b1SLen Brown 1718144b44b1SLen Brown 1719889facbeSLen Brown /* 1720889facbeSLen Brown * rapl_probe() 1721889facbeSLen Brown * 1722144b44b1SLen Brown * sets do_rapl, rapl_power_units, rapl_energy_units, rapl_time_units 1723889facbeSLen Brown */ 1724889facbeSLen Brown void rapl_probe(unsigned int family, unsigned int model) 1725889facbeSLen Brown { 1726889facbeSLen Brown unsigned long long msr; 1727144b44b1SLen Brown unsigned int time_unit; 1728889facbeSLen Brown double tdp; 1729889facbeSLen Brown 1730889facbeSLen Brown if (!genuine_intel) 1731889facbeSLen Brown return; 1732889facbeSLen Brown 1733889facbeSLen Brown if (family != 6) 1734889facbeSLen Brown return; 1735889facbeSLen Brown 1736889facbeSLen Brown switch (model) { 1737889facbeSLen Brown case 0x2A: 1738889facbeSLen Brown case 0x3A: 173970b43400SLen Brown case 0x3C: /* HSW */ 174070b43400SLen Brown case 0x45: /* HSW */ 1741149c2319SLen Brown case 0x46: /* HSW */ 17424e8e863fSLen Brown case 0x3D: /* BDW */ 1743144b44b1SLen Brown do_rapl = RAPL_PKG | 
RAPL_CORES | RAPL_CORE_POLICY | RAPL_GFX | RAPL_PKG_POWER_INFO; 1744889facbeSLen Brown break; 1745e6f9bb3cSLen Brown case 0x3F: /* HSX */ 17464e8e863fSLen Brown case 0x4F: /* BDX */ 17474e8e863fSLen Brown case 0x56: /* BDX-DE */ 1748e6f9bb3cSLen Brown do_rapl = RAPL_PKG | RAPL_DRAM | RAPL_DRAM_PERF_STATUS | RAPL_PKG_PERF_STATUS | RAPL_PKG_POWER_INFO; 1749e6f9bb3cSLen Brown break; 1750889facbeSLen Brown case 0x2D: 1751889facbeSLen Brown case 0x3E: 1752144b44b1SLen Brown do_rapl = RAPL_PKG | RAPL_CORES | RAPL_CORE_POLICY | RAPL_DRAM | RAPL_PKG_PERF_STATUS | RAPL_DRAM_PERF_STATUS | RAPL_PKG_POWER_INFO; 1753144b44b1SLen Brown break; 1754144b44b1SLen Brown case 0x37: /* BYT */ 1755144b44b1SLen Brown case 0x4D: /* AVN */ 1756144b44b1SLen Brown do_rapl = RAPL_PKG | RAPL_CORES ; 1757889facbeSLen Brown break; 1758889facbeSLen Brown default: 1759889facbeSLen Brown return; 1760889facbeSLen Brown } 1761889facbeSLen Brown 1762889facbeSLen Brown /* units on package 0, verify later other packages match */ 1763889facbeSLen Brown if (get_msr(0, MSR_RAPL_POWER_UNIT, &msr)) 1764889facbeSLen Brown return; 1765889facbeSLen Brown 1766889facbeSLen Brown rapl_power_units = 1.0 / (1 << (msr & 0xF)); 1767144b44b1SLen Brown if (model == 0x37) 1768144b44b1SLen Brown rapl_energy_units = 1.0 * (1 << (msr >> 8 & 0x1F)) / 1000000; 1769144b44b1SLen Brown else 1770889facbeSLen Brown rapl_energy_units = 1.0 / (1 << (msr >> 8 & 0x1F)); 1771889facbeSLen Brown 1772144b44b1SLen Brown time_unit = msr >> 16 & 0xF; 1773144b44b1SLen Brown if (time_unit == 0) 1774144b44b1SLen Brown time_unit = 0xA; 1775889facbeSLen Brown 1776144b44b1SLen Brown rapl_time_units = 1.0 / (1 << (time_unit)); 1777144b44b1SLen Brown 1778144b44b1SLen Brown tdp = get_tdp(model); 1779889facbeSLen Brown 1780889facbeSLen Brown rapl_joule_counter_range = 0xFFFFFFFF * rapl_energy_units / tdp; 1781889facbeSLen Brown if (verbose) 1782144b44b1SLen Brown fprintf(stderr, "RAPL: %.0f sec. 
Joule Counter Range, at %.0f Watts\n", rapl_joule_counter_range, tdp); 1783889facbeSLen Brown 1784889facbeSLen Brown return; 1785889facbeSLen Brown } 1786889facbeSLen Brown 1787*3a9a941dSLen Brown void perf_limit_reasons_probe(family, model) 1788*3a9a941dSLen Brown { 1789*3a9a941dSLen Brown if (!genuine_intel) 1790*3a9a941dSLen Brown return; 1791*3a9a941dSLen Brown 1792*3a9a941dSLen Brown if (family != 6) 1793*3a9a941dSLen Brown return; 1794*3a9a941dSLen Brown 1795*3a9a941dSLen Brown switch (model) { 1796*3a9a941dSLen Brown case 0x3C: /* HSW */ 1797*3a9a941dSLen Brown case 0x45: /* HSW */ 1798*3a9a941dSLen Brown case 0x46: /* HSW */ 1799*3a9a941dSLen Brown do_gfx_perf_limit_reasons = 1; 1800*3a9a941dSLen Brown case 0x3F: /* HSX */ 1801*3a9a941dSLen Brown do_core_perf_limit_reasons = 1; 1802*3a9a941dSLen Brown do_ring_perf_limit_reasons = 1; 1803*3a9a941dSLen Brown default: 1804*3a9a941dSLen Brown return; 1805*3a9a941dSLen Brown } 1806*3a9a941dSLen Brown } 1807*3a9a941dSLen Brown 1808889facbeSLen Brown int print_thermal(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1809889facbeSLen Brown { 1810889facbeSLen Brown unsigned long long msr; 1811889facbeSLen Brown unsigned int dts; 1812889facbeSLen Brown int cpu; 1813889facbeSLen Brown 1814889facbeSLen Brown if (!(do_dts || do_ptm)) 1815889facbeSLen Brown return 0; 1816889facbeSLen Brown 1817889facbeSLen Brown cpu = t->cpu_id; 1818889facbeSLen Brown 1819889facbeSLen Brown /* DTS is per-core, no need to print for each thread */ 1820889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 1821889facbeSLen Brown return 0; 1822889facbeSLen Brown 1823889facbeSLen Brown if (cpu_migrate(cpu)) { 1824889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1825889facbeSLen Brown return -1; 1826889facbeSLen Brown } 1827889facbeSLen Brown 1828889facbeSLen Brown if (do_ptm && (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) { 1829889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, 
&msr)) 1830889facbeSLen Brown return 0; 1831889facbeSLen Brown 1832889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1833889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_PACKAGE_THERM_STATUS: 0x%08llx (%d C)\n", 1834889facbeSLen Brown cpu, msr, tcc_activation_temp - dts); 1835889facbeSLen Brown 1836889facbeSLen Brown #ifdef THERM_DEBUG 1837889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_INTERRUPT, &msr)) 1838889facbeSLen Brown return 0; 1839889facbeSLen Brown 1840889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1841889facbeSLen Brown dts2 = (msr >> 8) & 0x7F; 1842889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_PACKAGE_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n", 1843889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2); 1844889facbeSLen Brown #endif 1845889facbeSLen Brown } 1846889facbeSLen Brown 1847889facbeSLen Brown 1848889facbeSLen Brown if (do_dts) { 1849889facbeSLen Brown unsigned int resolution; 1850889facbeSLen Brown 1851889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr)) 1852889facbeSLen Brown return 0; 1853889facbeSLen Brown 1854889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1855889facbeSLen Brown resolution = (msr >> 27) & 0xF; 1856889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_THERM_STATUS: 0x%08llx (%d C +/- %d)\n", 1857889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, resolution); 1858889facbeSLen Brown 1859889facbeSLen Brown #ifdef THERM_DEBUG 1860889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_INTERRUPT, &msr)) 1861889facbeSLen Brown return 0; 1862889facbeSLen Brown 1863889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1864889facbeSLen Brown dts2 = (msr >> 8) & 0x7F; 1865889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n", 1866889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2); 1867889facbeSLen Brown #endif 1868889facbeSLen Brown } 1869889facbeSLen Brown 1870889facbeSLen Brown return 0; 1871889facbeSLen Brown } 
1872889facbeSLen Brown 1873889facbeSLen Brown void print_power_limit_msr(int cpu, unsigned long long msr, char *label) 1874889facbeSLen Brown { 1875889facbeSLen Brown fprintf(stderr, "cpu%d: %s: %sabled (%f Watts, %f sec, clamp %sabled)\n", 1876889facbeSLen Brown cpu, label, 1877889facbeSLen Brown ((msr >> 15) & 1) ? "EN" : "DIS", 1878889facbeSLen Brown ((msr >> 0) & 0x7FFF) * rapl_power_units, 1879889facbeSLen Brown (1.0 + (((msr >> 22) & 0x3)/4.0)) * (1 << ((msr >> 17) & 0x1F)) * rapl_time_units, 1880889facbeSLen Brown (((msr >> 16) & 1) ? "EN" : "DIS")); 1881889facbeSLen Brown 1882889facbeSLen Brown return; 1883889facbeSLen Brown } 1884889facbeSLen Brown 1885889facbeSLen Brown int print_rapl(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1886889facbeSLen Brown { 1887889facbeSLen Brown unsigned long long msr; 1888889facbeSLen Brown int cpu; 1889889facbeSLen Brown 1890889facbeSLen Brown if (!do_rapl) 1891889facbeSLen Brown return 0; 1892889facbeSLen Brown 1893889facbeSLen Brown /* RAPL counters are per package, so print only for 1st thread/package */ 1894889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1895889facbeSLen Brown return 0; 1896889facbeSLen Brown 1897889facbeSLen Brown cpu = t->cpu_id; 1898889facbeSLen Brown if (cpu_migrate(cpu)) { 1899889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1900889facbeSLen Brown return -1; 1901889facbeSLen Brown } 1902889facbeSLen Brown 1903889facbeSLen Brown if (get_msr(cpu, MSR_RAPL_POWER_UNIT, &msr)) 1904889facbeSLen Brown return -1; 1905889facbeSLen Brown 1906889facbeSLen Brown if (verbose) { 1907889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_RAPL_POWER_UNIT: 0x%08llx " 1908889facbeSLen Brown "(%f Watts, %f Joules, %f sec.)\n", cpu, msr, 1909144b44b1SLen Brown rapl_power_units, rapl_energy_units, rapl_time_units); 1910889facbeSLen Brown } 1911144b44b1SLen Brown if (do_rapl & RAPL_PKG_POWER_INFO) { 1912144b44b1SLen 
Brown 1913889facbeSLen Brown if (get_msr(cpu, MSR_PKG_POWER_INFO, &msr)) 1914889facbeSLen Brown return -5; 1915889facbeSLen Brown 1916889facbeSLen Brown 1917889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PKG_POWER_INFO: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n", 1918889facbeSLen Brown cpu, msr, 1919889facbeSLen Brown ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1920889facbeSLen Brown ((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1921889facbeSLen Brown ((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1922889facbeSLen Brown ((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units); 1923889facbeSLen Brown 1924144b44b1SLen Brown } 1925144b44b1SLen Brown if (do_rapl & RAPL_PKG) { 1926144b44b1SLen Brown 1927889facbeSLen Brown if (get_msr(cpu, MSR_PKG_POWER_LIMIT, &msr)) 1928889facbeSLen Brown return -9; 1929889facbeSLen Brown 1930889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PKG_POWER_LIMIT: 0x%08llx (%slocked)\n", 1931889facbeSLen Brown cpu, msr, (msr >> 63) & 1 ? "": "UN"); 1932889facbeSLen Brown 1933889facbeSLen Brown print_power_limit_msr(cpu, msr, "PKG Limit #1"); 1934889facbeSLen Brown fprintf(stderr, "cpu%d: PKG Limit #2: %sabled (%f Watts, %f* sec, clamp %sabled)\n", 1935889facbeSLen Brown cpu, 1936889facbeSLen Brown ((msr >> 47) & 1) ? "EN" : "DIS", 1937889facbeSLen Brown ((msr >> 32) & 0x7FFF) * rapl_power_units, 1938889facbeSLen Brown (1.0 + (((msr >> 54) & 0x3)/4.0)) * (1 << ((msr >> 49) & 0x1F)) * rapl_time_units, 1939889facbeSLen Brown ((msr >> 48) & 1) ? 
"EN" : "DIS"); 1940889facbeSLen Brown } 1941889facbeSLen Brown 1942889facbeSLen Brown if (do_rapl & RAPL_DRAM) { 1943889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_POWER_INFO, &msr)) 1944889facbeSLen Brown return -6; 1945889facbeSLen Brown 1946889facbeSLen Brown 1947889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_DRAM_POWER_INFO,: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n", 1948889facbeSLen Brown cpu, msr, 1949889facbeSLen Brown ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1950889facbeSLen Brown ((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1951889facbeSLen Brown ((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1952889facbeSLen Brown ((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units); 1953889facbeSLen Brown 1954889facbeSLen Brown 1955889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_POWER_LIMIT, &msr)) 1956889facbeSLen Brown return -9; 1957889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_DRAM_POWER_LIMIT: 0x%08llx (%slocked)\n", 1958889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 1959889facbeSLen Brown 1960889facbeSLen Brown print_power_limit_msr(cpu, msr, "DRAM Limit"); 1961889facbeSLen Brown } 1962144b44b1SLen Brown if (do_rapl & RAPL_CORE_POLICY) { 1963889facbeSLen Brown if (verbose) { 1964889facbeSLen Brown if (get_msr(cpu, MSR_PP0_POLICY, &msr)) 1965889facbeSLen Brown return -7; 1966889facbeSLen Brown 1967889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP0_POLICY: %lld\n", cpu, msr & 0xF); 1968144b44b1SLen Brown } 1969144b44b1SLen Brown } 1970144b44b1SLen Brown if (do_rapl & RAPL_CORES) { 1971144b44b1SLen Brown if (verbose) { 1972889facbeSLen Brown 1973889facbeSLen Brown if (get_msr(cpu, MSR_PP0_POWER_LIMIT, &msr)) 1974889facbeSLen Brown return -9; 1975889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP0_POWER_LIMIT: 0x%08llx (%slocked)\n", 1976889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? 
"": "UN"); 1977889facbeSLen Brown print_power_limit_msr(cpu, msr, "Cores Limit"); 1978889facbeSLen Brown } 1979889facbeSLen Brown } 1980889facbeSLen Brown if (do_rapl & RAPL_GFX) { 1981889facbeSLen Brown if (verbose) { 1982889facbeSLen Brown if (get_msr(cpu, MSR_PP1_POLICY, &msr)) 1983889facbeSLen Brown return -8; 1984889facbeSLen Brown 1985889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP1_POLICY: %lld\n", cpu, msr & 0xF); 1986889facbeSLen Brown 1987889facbeSLen Brown if (get_msr(cpu, MSR_PP1_POWER_LIMIT, &msr)) 1988889facbeSLen Brown return -9; 1989889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP1_POWER_LIMIT: 0x%08llx (%slocked)\n", 1990889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 1991889facbeSLen Brown print_power_limit_msr(cpu, msr, "GFX Limit"); 1992889facbeSLen Brown } 1993889facbeSLen Brown } 1994889facbeSLen Brown return 0; 1995889facbeSLen Brown } 1996889facbeSLen Brown 1997103a8feaSLen Brown 1998103a8feaSLen Brown int is_snb(unsigned int family, unsigned int model) 1999103a8feaSLen Brown { 2000103a8feaSLen Brown if (!genuine_intel) 2001103a8feaSLen Brown return 0; 2002103a8feaSLen Brown 2003103a8feaSLen Brown switch (model) { 2004103a8feaSLen Brown case 0x2A: 2005103a8feaSLen Brown case 0x2D: 2006650a37f3SLen Brown case 0x3A: /* IVB */ 20071300651bSLen Brown case 0x3E: /* IVB Xeon */ 200870b43400SLen Brown case 0x3C: /* HSW */ 200970b43400SLen Brown case 0x3F: /* HSW */ 201070b43400SLen Brown case 0x45: /* HSW */ 2011149c2319SLen Brown case 0x46: /* HSW */ 20124e8e863fSLen Brown case 0x3D: /* BDW */ 20134e8e863fSLen Brown case 0x4F: /* BDX */ 20144e8e863fSLen Brown case 0x56: /* BDX-DE */ 2015103a8feaSLen Brown return 1; 2016103a8feaSLen Brown } 2017103a8feaSLen Brown return 0; 2018103a8feaSLen Brown } 2019103a8feaSLen Brown 2020ca58710fSKristen Carlson Accardi int has_c8_c9_c10(unsigned int family, unsigned int model) 2021ca58710fSKristen Carlson Accardi { 2022ca58710fSKristen Carlson Accardi if (!genuine_intel) 2023ca58710fSKristen 
Carlson Accardi return 0; 2024ca58710fSKristen Carlson Accardi 2025ca58710fSKristen Carlson Accardi switch (model) { 20264e8e863fSLen Brown case 0x45: /* HSW */ 20274e8e863fSLen Brown case 0x3D: /* BDW */ 2028ca58710fSKristen Carlson Accardi return 1; 2029ca58710fSKristen Carlson Accardi } 2030ca58710fSKristen Carlson Accardi return 0; 2031ca58710fSKristen Carlson Accardi } 2032ca58710fSKristen Carlson Accardi 2033ca58710fSKristen Carlson Accardi 2034144b44b1SLen Brown int is_slm(unsigned int family, unsigned int model) 2035144b44b1SLen Brown { 2036144b44b1SLen Brown if (!genuine_intel) 2037144b44b1SLen Brown return 0; 2038144b44b1SLen Brown switch (model) { 2039144b44b1SLen Brown case 0x37: /* BYT */ 2040144b44b1SLen Brown case 0x4D: /* AVN */ 2041144b44b1SLen Brown return 1; 2042144b44b1SLen Brown } 2043144b44b1SLen Brown return 0; 2044144b44b1SLen Brown } 2045144b44b1SLen Brown 2046144b44b1SLen Brown #define SLM_BCLK_FREQS 5 2047144b44b1SLen Brown double slm_freq_table[SLM_BCLK_FREQS] = { 83.3, 100.0, 133.3, 116.7, 80.0}; 2048144b44b1SLen Brown 2049144b44b1SLen Brown double slm_bclk(void) 2050144b44b1SLen Brown { 2051144b44b1SLen Brown unsigned long long msr = 3; 2052144b44b1SLen Brown unsigned int i; 2053144b44b1SLen Brown double freq; 2054144b44b1SLen Brown 2055144b44b1SLen Brown if (get_msr(0, MSR_FSB_FREQ, &msr)) 2056144b44b1SLen Brown fprintf(stderr, "SLM BCLK: unknown\n"); 2057144b44b1SLen Brown 2058144b44b1SLen Brown i = msr & 0xf; 2059144b44b1SLen Brown if (i >= SLM_BCLK_FREQS) { 2060144b44b1SLen Brown fprintf(stderr, "SLM BCLK[%d] invalid\n", i); 2061144b44b1SLen Brown msr = 3; 2062144b44b1SLen Brown } 2063144b44b1SLen Brown freq = slm_freq_table[i]; 2064144b44b1SLen Brown 2065144b44b1SLen Brown fprintf(stderr, "SLM BCLK: %.1f Mhz\n", freq); 2066144b44b1SLen Brown 2067144b44b1SLen Brown return freq; 2068144b44b1SLen Brown } 2069144b44b1SLen Brown 2070103a8feaSLen Brown double discover_bclk(unsigned int family, unsigned int model) 2071103a8feaSLen Brown 
{ 2072103a8feaSLen Brown if (is_snb(family, model)) 2073103a8feaSLen Brown return 100.00; 2074144b44b1SLen Brown else if (is_slm(family, model)) 2075144b44b1SLen Brown return slm_bclk(); 2076103a8feaSLen Brown else 2077103a8feaSLen Brown return 133.33; 2078103a8feaSLen Brown } 2079103a8feaSLen Brown 2080889facbeSLen Brown /* 2081889facbeSLen Brown * MSR_IA32_TEMPERATURE_TARGET indicates the temperature where 2082889facbeSLen Brown * the Thermal Control Circuit (TCC) activates. 2083889facbeSLen Brown * This is usually equal to tjMax. 2084889facbeSLen Brown * 2085889facbeSLen Brown * Older processors do not have this MSR, so there we guess, 2086889facbeSLen Brown * but also allow cmdline over-ride with -T. 2087889facbeSLen Brown * 2088889facbeSLen Brown * Several MSR temperature values are in units of degrees-C 2089889facbeSLen Brown * below this value, including the Digital Thermal Sensor (DTS), 2090889facbeSLen Brown * Package Thermal Management Sensor (PTM), and thermal event thresholds. 
2091889facbeSLen Brown */ 2092889facbeSLen Brown int set_temperature_target(struct thread_data *t, struct core_data *c, struct pkg_data *p) 2093889facbeSLen Brown { 2094889facbeSLen Brown unsigned long long msr; 2095889facbeSLen Brown unsigned int target_c_local; 2096889facbeSLen Brown int cpu; 2097889facbeSLen Brown 2098889facbeSLen Brown /* tcc_activation_temp is used only for dts or ptm */ 2099889facbeSLen Brown if (!(do_dts || do_ptm)) 2100889facbeSLen Brown return 0; 2101889facbeSLen Brown 2102889facbeSLen Brown /* this is a per-package concept */ 2103889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 2104889facbeSLen Brown return 0; 2105889facbeSLen Brown 2106889facbeSLen Brown cpu = t->cpu_id; 2107889facbeSLen Brown if (cpu_migrate(cpu)) { 2108889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 2109889facbeSLen Brown return -1; 2110889facbeSLen Brown } 2111889facbeSLen Brown 2112889facbeSLen Brown if (tcc_activation_temp_override != 0) { 2113889facbeSLen Brown tcc_activation_temp = tcc_activation_temp_override; 2114889facbeSLen Brown fprintf(stderr, "cpu%d: Using cmdline TCC Target (%d C)\n", 2115889facbeSLen Brown cpu, tcc_activation_temp); 2116889facbeSLen Brown return 0; 2117889facbeSLen Brown } 2118889facbeSLen Brown 2119889facbeSLen Brown /* Temperature Target MSR is Nehalem and newer only */ 2120889facbeSLen Brown if (!do_nehalem_platform_info) 2121889facbeSLen Brown goto guess; 2122889facbeSLen Brown 2123889facbeSLen Brown if (get_msr(0, MSR_IA32_TEMPERATURE_TARGET, &msr)) 2124889facbeSLen Brown goto guess; 2125889facbeSLen Brown 21263482124aSJean Delvare target_c_local = (msr >> 16) & 0xFF; 2127889facbeSLen Brown 2128889facbeSLen Brown if (verbose) 2129889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_TEMPERATURE_TARGET: 0x%08llx (%d C)\n", 2130889facbeSLen Brown cpu, msr, target_c_local); 2131889facbeSLen Brown 21323482124aSJean Delvare if (!target_c_local) 
2133889facbeSLen Brown goto guess; 2134889facbeSLen Brown 2135889facbeSLen Brown tcc_activation_temp = target_c_local; 2136889facbeSLen Brown 2137889facbeSLen Brown return 0; 2138889facbeSLen Brown 2139889facbeSLen Brown guess: 2140889facbeSLen Brown tcc_activation_temp = TJMAX_DEFAULT; 2141889facbeSLen Brown fprintf(stderr, "cpu%d: Guessing tjMax %d C, Please use -T to specify\n", 2142889facbeSLen Brown cpu, tcc_activation_temp); 2143889facbeSLen Brown 2144889facbeSLen Brown return 0; 2145889facbeSLen Brown } 2146103a8feaSLen Brown void check_cpuid() 2147103a8feaSLen Brown { 2148103a8feaSLen Brown unsigned int eax, ebx, ecx, edx, max_level; 2149103a8feaSLen Brown unsigned int fms, family, model, stepping; 2150103a8feaSLen Brown 2151103a8feaSLen Brown eax = ebx = ecx = edx = 0; 2152103a8feaSLen Brown 21532b92865eSJosh Triplett __get_cpuid(0, &max_level, &ebx, &ecx, &edx); 2154103a8feaSLen Brown 2155103a8feaSLen Brown if (ebx == 0x756e6547 && edx == 0x49656e69 && ecx == 0x6c65746e) 2156103a8feaSLen Brown genuine_intel = 1; 2157103a8feaSLen Brown 2158103a8feaSLen Brown if (verbose) 2159889facbeSLen Brown fprintf(stderr, "CPUID(0): %.4s%.4s%.4s ", 2160103a8feaSLen Brown (char *)&ebx, (char *)&edx, (char *)&ecx); 2161103a8feaSLen Brown 21622b92865eSJosh Triplett __get_cpuid(1, &fms, &ebx, &ecx, &edx); 2163103a8feaSLen Brown family = (fms >> 8) & 0xf; 2164103a8feaSLen Brown model = (fms >> 4) & 0xf; 2165103a8feaSLen Brown stepping = fms & 0xf; 2166103a8feaSLen Brown if (family == 6 || family == 0xf) 2167103a8feaSLen Brown model += ((fms >> 16) & 0xf) << 4; 2168103a8feaSLen Brown 2169103a8feaSLen Brown if (verbose) 2170103a8feaSLen Brown fprintf(stderr, "%d CPUID levels; family:model:stepping 0x%x:%x:%x (%d:%d:%d)\n", 2171103a8feaSLen Brown max_level, family, model, stepping, family, model, stepping); 2172103a8feaSLen Brown 2173b2c95d90SJosh Triplett if (!(edx & (1 << 5))) 2174b2c95d90SJosh Triplett errx(1, "CPUID: no MSR"); 2175103a8feaSLen Brown 2176103a8feaSLen Brown 
/* 2177103a8feaSLen Brown * check max extended function levels of CPUID. 2178103a8feaSLen Brown * This is needed to check for invariant TSC. 2179103a8feaSLen Brown * This check is valid for both Intel and AMD. 2180103a8feaSLen Brown */ 2181103a8feaSLen Brown ebx = ecx = edx = 0; 21822b92865eSJosh Triplett __get_cpuid(0x80000000, &max_level, &ebx, &ecx, &edx); 2183103a8feaSLen Brown 2184b2c95d90SJosh Triplett if (max_level < 0x80000007) 2185b2c95d90SJosh Triplett errx(1, "CPUID: no invariant TSC (max_level 0x%x)", max_level); 2186103a8feaSLen Brown 2187103a8feaSLen Brown /* 2188103a8feaSLen Brown * Non-Stop TSC is advertised by CPUID.EAX=0x80000007: EDX.bit8 2189103a8feaSLen Brown * this check is valid for both Intel and AMD 2190103a8feaSLen Brown */ 21912b92865eSJosh Triplett __get_cpuid(0x80000007, &eax, &ebx, &ecx, &edx); 21928209e054SThomas Renninger has_invariant_tsc = edx & (1 << 8); 2193103a8feaSLen Brown 2194b2c95d90SJosh Triplett if (!has_invariant_tsc) 2195b2c95d90SJosh Triplett errx(1, "No invariant TSC"); 2196103a8feaSLen Brown 2197103a8feaSLen Brown /* 2198103a8feaSLen Brown * APERF/MPERF is advertised by CPUID.EAX=0x6: ECX.bit0 2199103a8feaSLen Brown * this check is valid for both Intel and AMD 2200103a8feaSLen Brown */ 2201103a8feaSLen Brown 22022b92865eSJosh Triplett __get_cpuid(0x6, &eax, &ebx, &ecx, &edx); 22038209e054SThomas Renninger has_aperf = ecx & (1 << 0); 2204889facbeSLen Brown do_dts = eax & (1 << 0); 2205889facbeSLen Brown do_ptm = eax & (1 << 6); 2206889facbeSLen Brown has_epb = ecx & (1 << 3); 2207889facbeSLen Brown 2208889facbeSLen Brown if (verbose) 2209889facbeSLen Brown fprintf(stderr, "CPUID(6): %s%s%s%s\n", 2210889facbeSLen Brown has_aperf ? "APERF" : "No APERF!", 2211889facbeSLen Brown do_dts ? ", DTS" : "", 2212889facbeSLen Brown do_ptm ? ", PTM": "", 2213889facbeSLen Brown has_epb ? 
", EPB": ""); 2214889facbeSLen Brown 2215889facbeSLen Brown if (!has_aperf) 2216b2c95d90SJosh Triplett errx(-1, "No APERF"); 2217103a8feaSLen Brown 2218103a8feaSLen Brown do_nehalem_platform_info = genuine_intel && has_invariant_tsc; 2219103a8feaSLen Brown do_nhm_cstates = genuine_intel; /* all Intel w/ non-stop TSC have NHM counters */ 22201ed51011SLen Brown do_smi = do_nhm_cstates; 2221103a8feaSLen Brown do_snb_cstates = is_snb(family, model); 2222ca58710fSKristen Carlson Accardi do_c8_c9_c10 = has_c8_c9_c10(family, model); 2223144b44b1SLen Brown do_slm_cstates = is_slm(family, model); 2224103a8feaSLen Brown bclk = discover_bclk(family, model); 2225103a8feaSLen Brown 2226103a8feaSLen Brown do_nehalem_turbo_ratio_limit = has_nehalem_turbo_ratio_limit(family, model); 22276574a5d5SLen Brown do_ivt_turbo_ratio_limit = has_ivt_turbo_ratio_limit(family, model); 2228889facbeSLen Brown rapl_probe(family, model); 2229*3a9a941dSLen Brown perf_limit_reasons_probe(family, model); 2230889facbeSLen Brown 2231889facbeSLen Brown return; 2232103a8feaSLen Brown } 2233103a8feaSLen Brown 2234103a8feaSLen Brown 2235103a8feaSLen Brown void usage() 2236103a8feaSLen Brown { 2237f591c38bSAndy Shevchenko errx(1, "%s: [-v][-R][-T][-p|-P|-S][-c MSR#][-C MSR#][-m MSR#][-M MSR#][-i interval_sec | command ...]\n", 2238103a8feaSLen Brown progname); 2239103a8feaSLen Brown } 2240103a8feaSLen Brown 2241103a8feaSLen Brown 2242103a8feaSLen Brown /* 2243103a8feaSLen Brown * in /dev/cpu/ return success for names that are numbers 2244103a8feaSLen Brown * ie. filter out ".", "..", "microcode". 
2245103a8feaSLen Brown */ 2246103a8feaSLen Brown int dir_filter(const struct dirent *dirp) 2247103a8feaSLen Brown { 2248103a8feaSLen Brown if (isdigit(dirp->d_name[0])) 2249103a8feaSLen Brown return 1; 2250103a8feaSLen Brown else 2251103a8feaSLen Brown return 0; 2252103a8feaSLen Brown } 2253103a8feaSLen Brown 2254103a8feaSLen Brown int open_dev_cpu_msr(int dummy1) 2255103a8feaSLen Brown { 2256103a8feaSLen Brown return 0; 2257103a8feaSLen Brown } 2258103a8feaSLen Brown 2259c98d5d94SLen Brown void topology_probe() 2260c98d5d94SLen Brown { 2261c98d5d94SLen Brown int i; 2262c98d5d94SLen Brown int max_core_id = 0; 2263c98d5d94SLen Brown int max_package_id = 0; 2264c98d5d94SLen Brown int max_siblings = 0; 2265c98d5d94SLen Brown struct cpu_topology { 2266c98d5d94SLen Brown int core_id; 2267c98d5d94SLen Brown int physical_package_id; 2268c98d5d94SLen Brown } *cpus; 2269c98d5d94SLen Brown 2270c98d5d94SLen Brown /* Initialize num_cpus, max_cpu_num */ 2271c98d5d94SLen Brown topo.num_cpus = 0; 2272c98d5d94SLen Brown topo.max_cpu_num = 0; 2273c98d5d94SLen Brown for_all_proc_cpus(count_cpus); 2274c98d5d94SLen Brown if (!summary_only && topo.num_cpus > 1) 2275c98d5d94SLen Brown show_cpu = 1; 2276c98d5d94SLen Brown 2277c98d5d94SLen Brown if (verbose > 1) 2278c98d5d94SLen Brown fprintf(stderr, "num_cpus %d max_cpu_num %d\n", topo.num_cpus, topo.max_cpu_num); 2279c98d5d94SLen Brown 2280c98d5d94SLen Brown cpus = calloc(1, (topo.max_cpu_num + 1) * sizeof(struct cpu_topology)); 2281b2c95d90SJosh Triplett if (cpus == NULL) 2282b2c95d90SJosh Triplett err(1, "calloc cpus"); 2283c98d5d94SLen Brown 2284c98d5d94SLen Brown /* 2285c98d5d94SLen Brown * Allocate and initialize cpu_present_set 2286c98d5d94SLen Brown */ 2287c98d5d94SLen Brown cpu_present_set = CPU_ALLOC((topo.max_cpu_num + 1)); 2288b2c95d90SJosh Triplett if (cpu_present_set == NULL) 2289b2c95d90SJosh Triplett err(3, "CPU_ALLOC"); 2290c98d5d94SLen Brown cpu_present_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 2291c98d5d94SLen 
Brown CPU_ZERO_S(cpu_present_setsize, cpu_present_set); 2292c98d5d94SLen Brown for_all_proc_cpus(mark_cpu_present); 2293c98d5d94SLen Brown 2294c98d5d94SLen Brown /* 2295c98d5d94SLen Brown * Allocate and initialize cpu_affinity_set 2296c98d5d94SLen Brown */ 2297c98d5d94SLen Brown cpu_affinity_set = CPU_ALLOC((topo.max_cpu_num + 1)); 2298b2c95d90SJosh Triplett if (cpu_affinity_set == NULL) 2299b2c95d90SJosh Triplett err(3, "CPU_ALLOC"); 2300c98d5d94SLen Brown cpu_affinity_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 2301c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 2302c98d5d94SLen Brown 2303c98d5d94SLen Brown 2304c98d5d94SLen Brown /* 2305c98d5d94SLen Brown * For online cpus 2306c98d5d94SLen Brown * find max_core_id, max_package_id 2307c98d5d94SLen Brown */ 2308c98d5d94SLen Brown for (i = 0; i <= topo.max_cpu_num; ++i) { 2309c98d5d94SLen Brown int siblings; 2310c98d5d94SLen Brown 2311c98d5d94SLen Brown if (cpu_is_not_present(i)) { 2312c98d5d94SLen Brown if (verbose > 1) 2313c98d5d94SLen Brown fprintf(stderr, "cpu%d NOT PRESENT\n", i); 2314c98d5d94SLen Brown continue; 2315c98d5d94SLen Brown } 2316c98d5d94SLen Brown cpus[i].core_id = get_core_id(i); 2317c98d5d94SLen Brown if (cpus[i].core_id > max_core_id) 2318c98d5d94SLen Brown max_core_id = cpus[i].core_id; 2319c98d5d94SLen Brown 2320c98d5d94SLen Brown cpus[i].physical_package_id = get_physical_package_id(i); 2321c98d5d94SLen Brown if (cpus[i].physical_package_id > max_package_id) 2322c98d5d94SLen Brown max_package_id = cpus[i].physical_package_id; 2323c98d5d94SLen Brown 2324c98d5d94SLen Brown siblings = get_num_ht_siblings(i); 2325c98d5d94SLen Brown if (siblings > max_siblings) 2326c98d5d94SLen Brown max_siblings = siblings; 2327c98d5d94SLen Brown if (verbose > 1) 2328c98d5d94SLen Brown fprintf(stderr, "cpu %d pkg %d core %d\n", 2329c98d5d94SLen Brown i, cpus[i].physical_package_id, cpus[i].core_id); 2330c98d5d94SLen Brown } 2331c98d5d94SLen Brown topo.num_cores_per_pkg = max_core_id + 
1; 2332c98d5d94SLen Brown if (verbose > 1) 2333c98d5d94SLen Brown fprintf(stderr, "max_core_id %d, sizing for %d cores per package\n", 2334c98d5d94SLen Brown max_core_id, topo.num_cores_per_pkg); 2335c98d5d94SLen Brown if (!summary_only && topo.num_cores_per_pkg > 1) 2336c98d5d94SLen Brown show_core = 1; 2337c98d5d94SLen Brown 2338c98d5d94SLen Brown topo.num_packages = max_package_id + 1; 2339c98d5d94SLen Brown if (verbose > 1) 2340c98d5d94SLen Brown fprintf(stderr, "max_package_id %d, sizing for %d packages\n", 2341c98d5d94SLen Brown max_package_id, topo.num_packages); 2342c98d5d94SLen Brown if (!summary_only && topo.num_packages > 1) 2343c98d5d94SLen Brown show_pkg = 1; 2344c98d5d94SLen Brown 2345c98d5d94SLen Brown topo.num_threads_per_core = max_siblings; 2346c98d5d94SLen Brown if (verbose > 1) 2347c98d5d94SLen Brown fprintf(stderr, "max_siblings %d\n", max_siblings); 2348c98d5d94SLen Brown 2349c98d5d94SLen Brown free(cpus); 2350c98d5d94SLen Brown } 2351c98d5d94SLen Brown 2352c98d5d94SLen Brown void 2353c98d5d94SLen Brown allocate_counters(struct thread_data **t, struct core_data **c, struct pkg_data **p) 2354c98d5d94SLen Brown { 2355c98d5d94SLen Brown int i; 2356c98d5d94SLen Brown 2357c98d5d94SLen Brown *t = calloc(topo.num_threads_per_core * topo.num_cores_per_pkg * 2358c98d5d94SLen Brown topo.num_packages, sizeof(struct thread_data)); 2359c98d5d94SLen Brown if (*t == NULL) 2360c98d5d94SLen Brown goto error; 2361c98d5d94SLen Brown 2362c98d5d94SLen Brown for (i = 0; i < topo.num_threads_per_core * 2363c98d5d94SLen Brown topo.num_cores_per_pkg * topo.num_packages; i++) 2364c98d5d94SLen Brown (*t)[i].cpu_id = -1; 2365c98d5d94SLen Brown 2366c98d5d94SLen Brown *c = calloc(topo.num_cores_per_pkg * topo.num_packages, 2367c98d5d94SLen Brown sizeof(struct core_data)); 2368c98d5d94SLen Brown if (*c == NULL) 2369c98d5d94SLen Brown goto error; 2370c98d5d94SLen Brown 2371c98d5d94SLen Brown for (i = 0; i < topo.num_cores_per_pkg * topo.num_packages; i++) 2372c98d5d94SLen 
Brown (*c)[i].core_id = -1; 2373c98d5d94SLen Brown 2374c98d5d94SLen Brown *p = calloc(topo.num_packages, sizeof(struct pkg_data)); 2375c98d5d94SLen Brown if (*p == NULL) 2376c98d5d94SLen Brown goto error; 2377c98d5d94SLen Brown 2378c98d5d94SLen Brown for (i = 0; i < topo.num_packages; i++) 2379c98d5d94SLen Brown (*p)[i].package_id = i; 2380c98d5d94SLen Brown 2381c98d5d94SLen Brown return; 2382c98d5d94SLen Brown error: 2383b2c95d90SJosh Triplett err(1, "calloc counters"); 2384c98d5d94SLen Brown } 2385c98d5d94SLen Brown /* 2386c98d5d94SLen Brown * init_counter() 2387c98d5d94SLen Brown * 2388c98d5d94SLen Brown * set cpu_id, core_num, pkg_num 2389c98d5d94SLen Brown * set FIRST_THREAD_IN_CORE and FIRST_CORE_IN_PACKAGE 2390c98d5d94SLen Brown * 2391c98d5d94SLen Brown * increment topo.num_cores when 1st core in pkg seen 2392c98d5d94SLen Brown */ 2393c98d5d94SLen Brown void init_counter(struct thread_data *thread_base, struct core_data *core_base, 2394c98d5d94SLen Brown struct pkg_data *pkg_base, int thread_num, int core_num, 2395c98d5d94SLen Brown int pkg_num, int cpu_id) 2396c98d5d94SLen Brown { 2397c98d5d94SLen Brown struct thread_data *t; 2398c98d5d94SLen Brown struct core_data *c; 2399c98d5d94SLen Brown struct pkg_data *p; 2400c98d5d94SLen Brown 2401c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_num, core_num, pkg_num); 2402c98d5d94SLen Brown c = GET_CORE(core_base, core_num, pkg_num); 2403c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_num); 2404c98d5d94SLen Brown 2405c98d5d94SLen Brown t->cpu_id = cpu_id; 2406c98d5d94SLen Brown if (thread_num == 0) { 2407c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_THREAD_IN_CORE; 2408c98d5d94SLen Brown if (cpu_is_first_core_in_package(cpu_id)) 2409c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_CORE_IN_PACKAGE; 2410c98d5d94SLen Brown } 2411c98d5d94SLen Brown 2412c98d5d94SLen Brown c->core_id = core_num; 2413c98d5d94SLen Brown p->package_id = pkg_num; 2414c98d5d94SLen Brown } 2415c98d5d94SLen Brown 2416c98d5d94SLen Brown 
2417c98d5d94SLen Brown int initialize_counters(int cpu_id) 2418c98d5d94SLen Brown { 2419c98d5d94SLen Brown int my_thread_id, my_core_id, my_package_id; 2420c98d5d94SLen Brown 2421c98d5d94SLen Brown my_package_id = get_physical_package_id(cpu_id); 2422c98d5d94SLen Brown my_core_id = get_core_id(cpu_id); 2423c98d5d94SLen Brown 2424c98d5d94SLen Brown if (cpu_is_first_sibling_in_core(cpu_id)) { 2425c98d5d94SLen Brown my_thread_id = 0; 2426c98d5d94SLen Brown topo.num_cores++; 2427c98d5d94SLen Brown } else { 2428c98d5d94SLen Brown my_thread_id = 1; 2429c98d5d94SLen Brown } 2430c98d5d94SLen Brown 2431c98d5d94SLen Brown init_counter(EVEN_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 2432c98d5d94SLen Brown init_counter(ODD_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 2433c98d5d94SLen Brown return 0; 2434c98d5d94SLen Brown } 2435c98d5d94SLen Brown 2436c98d5d94SLen Brown void allocate_output_buffer() 2437c98d5d94SLen Brown { 24383b4d5c7fSAndy Shevchenko output_buffer = calloc(1, (1 + topo.num_cpus) * 1024); 2439c98d5d94SLen Brown outp = output_buffer; 2440b2c95d90SJosh Triplett if (outp == NULL) 2441b2c95d90SJosh Triplett err(-1, "calloc output buffer"); 2442c98d5d94SLen Brown } 2443c98d5d94SLen Brown 2444c98d5d94SLen Brown void setup_all_buffers(void) 2445c98d5d94SLen Brown { 2446c98d5d94SLen Brown topology_probe(); 2447c98d5d94SLen Brown allocate_counters(&thread_even, &core_even, &package_even); 2448c98d5d94SLen Brown allocate_counters(&thread_odd, &core_odd, &package_odd); 2449c98d5d94SLen Brown allocate_output_buffer(); 2450c98d5d94SLen Brown for_all_proc_cpus(initialize_counters); 2451c98d5d94SLen Brown } 24523b4d5c7fSAndy Shevchenko 2453103a8feaSLen Brown void turbostat_init() 2454103a8feaSLen Brown { 2455103a8feaSLen Brown check_dev_msr(); 245698481e79SLen Brown check_permissions(); 245798481e79SLen Brown check_cpuid(); 2458103a8feaSLen Brown 2459c98d5d94SLen Brown setup_all_buffers(); 2460103a8feaSLen Brown 2461103a8feaSLen Brown if 
(verbose) 2462c98d5d94SLen Brown print_verbose_header(); 2463889facbeSLen Brown 2464889facbeSLen Brown if (verbose) 2465889facbeSLen Brown for_all_cpus(print_epb, ODD_COUNTERS); 2466889facbeSLen Brown 2467889facbeSLen Brown if (verbose) 2468*3a9a941dSLen Brown for_all_cpus(print_perf_limit, ODD_COUNTERS); 2469*3a9a941dSLen Brown 2470*3a9a941dSLen Brown if (verbose) 2471889facbeSLen Brown for_all_cpus(print_rapl, ODD_COUNTERS); 2472889facbeSLen Brown 2473889facbeSLen Brown for_all_cpus(set_temperature_target, ODD_COUNTERS); 2474889facbeSLen Brown 2475889facbeSLen Brown if (verbose) 2476889facbeSLen Brown for_all_cpus(print_thermal, ODD_COUNTERS); 2477103a8feaSLen Brown } 2478103a8feaSLen Brown 2479103a8feaSLen Brown int fork_it(char **argv) 2480103a8feaSLen Brown { 2481103a8feaSLen Brown pid_t child_pid; 2482d91bb17cSLen Brown int status; 2483d15cf7c1SLen Brown 2484d91bb17cSLen Brown status = for_all_cpus(get_counters, EVEN_COUNTERS); 2485d91bb17cSLen Brown if (status) 2486d91bb17cSLen Brown exit(status); 2487d15cf7c1SLen Brown /* clear affinity side-effect of get_counters() */ 2488d15cf7c1SLen Brown sched_setaffinity(0, cpu_present_setsize, cpu_present_set); 2489103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 2490103a8feaSLen Brown 2491103a8feaSLen Brown child_pid = fork(); 2492103a8feaSLen Brown if (!child_pid) { 2493103a8feaSLen Brown /* child */ 2494103a8feaSLen Brown execvp(argv[0], argv); 2495103a8feaSLen Brown } else { 2496103a8feaSLen Brown 2497103a8feaSLen Brown /* parent */ 2498b2c95d90SJosh Triplett if (child_pid == -1) 2499b2c95d90SJosh Triplett err(1, "fork"); 2500103a8feaSLen Brown 2501103a8feaSLen Brown signal(SIGINT, SIG_IGN); 2502103a8feaSLen Brown signal(SIGQUIT, SIG_IGN); 2503b2c95d90SJosh Triplett if (waitpid(child_pid, &status, 0) == -1) 2504b2c95d90SJosh Triplett err(status, "waitpid"); 2505103a8feaSLen Brown } 2506c98d5d94SLen Brown /* 2507c98d5d94SLen Brown * n.b. 
fork_it() does not check for errors from for_all_cpus() 2508c98d5d94SLen Brown * because re-starting is problematic when forking 2509c98d5d94SLen Brown */ 2510c98d5d94SLen Brown for_all_cpus(get_counters, ODD_COUNTERS); 2511103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 2512103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 2513c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 2514c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 2515c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 2516c98d5d94SLen Brown flush_stderr(); 2517103a8feaSLen Brown 25186eab04a8SJustin P. Mattock fprintf(stderr, "%.6f sec\n", tv_delta.tv_sec + tv_delta.tv_usec/1000000.0); 2519103a8feaSLen Brown 2520d91bb17cSLen Brown return status; 2521103a8feaSLen Brown } 2522103a8feaSLen Brown 25233b4d5c7fSAndy Shevchenko int get_and_dump_counters(void) 25243b4d5c7fSAndy Shevchenko { 25253b4d5c7fSAndy Shevchenko int status; 25263b4d5c7fSAndy Shevchenko 25273b4d5c7fSAndy Shevchenko status = for_all_cpus(get_counters, ODD_COUNTERS); 25283b4d5c7fSAndy Shevchenko if (status) 25293b4d5c7fSAndy Shevchenko return status; 25303b4d5c7fSAndy Shevchenko 25313b4d5c7fSAndy Shevchenko status = for_all_cpus(dump_counters, ODD_COUNTERS); 25323b4d5c7fSAndy Shevchenko if (status) 25333b4d5c7fSAndy Shevchenko return status; 25343b4d5c7fSAndy Shevchenko 25353b4d5c7fSAndy Shevchenko flush_stdout(); 25363b4d5c7fSAndy Shevchenko 25373b4d5c7fSAndy Shevchenko return status; 25383b4d5c7fSAndy Shevchenko } 25393b4d5c7fSAndy Shevchenko 2540103a8feaSLen Brown void cmdline(int argc, char **argv) 2541103a8feaSLen Brown { 2542103a8feaSLen Brown int opt; 2543103a8feaSLen Brown 2544103a8feaSLen Brown progname = argv[0]; 2545103a8feaSLen Brown 25463b4d5c7fSAndy Shevchenko while ((opt = getopt(argc, argv, "+pPsSvi:c:C:m:M:RJT:")) != -1) { 2547103a8feaSLen Brown switch (opt) { 2548f9240813SLen Brown case 'p': 2549c98d5d94SLen Brown show_core_only++; 2550c98d5d94SLen Brown break; 
2551f9240813SLen Brown case 'P': 2552c98d5d94SLen Brown show_pkg_only++; 2553c98d5d94SLen Brown break; 25543b4d5c7fSAndy Shevchenko case 's': 25553b4d5c7fSAndy Shevchenko dump_only++; 25563b4d5c7fSAndy Shevchenko break; 2557f9240813SLen Brown case 'S': 2558e23da037SLen Brown summary_only++; 2559e23da037SLen Brown break; 2560103a8feaSLen Brown case 'v': 2561103a8feaSLen Brown verbose++; 2562103a8feaSLen Brown break; 2563103a8feaSLen Brown case 'i': 2564103a8feaSLen Brown interval_sec = atoi(optarg); 2565103a8feaSLen Brown break; 2566f9240813SLen Brown case 'c': 25678e180f3cSLen Brown sscanf(optarg, "%x", &extra_delta_offset32); 25688e180f3cSLen Brown break; 2569f9240813SLen Brown case 'C': 25708e180f3cSLen Brown sscanf(optarg, "%x", &extra_delta_offset64); 25718e180f3cSLen Brown break; 25722f32edf1SLen Brown case 'm': 25732f32edf1SLen Brown sscanf(optarg, "%x", &extra_msr_offset32); 25742f32edf1SLen Brown break; 25752f32edf1SLen Brown case 'M': 25762f32edf1SLen Brown sscanf(optarg, "%x", &extra_msr_offset64); 2577103a8feaSLen Brown break; 2578889facbeSLen Brown case 'R': 2579889facbeSLen Brown rapl_verbose++; 2580889facbeSLen Brown break; 2581889facbeSLen Brown case 'T': 2582889facbeSLen Brown tcc_activation_temp_override = atoi(optarg); 2583889facbeSLen Brown break; 25845c56be9aSDirk Brandewie case 'J': 25855c56be9aSDirk Brandewie rapl_joules++; 25865c56be9aSDirk Brandewie break; 25875c56be9aSDirk Brandewie 2588103a8feaSLen Brown default: 2589103a8feaSLen Brown usage(); 2590103a8feaSLen Brown } 2591103a8feaSLen Brown } 2592103a8feaSLen Brown } 2593103a8feaSLen Brown 2594103a8feaSLen Brown int main(int argc, char **argv) 2595103a8feaSLen Brown { 2596103a8feaSLen Brown cmdline(argc, argv); 2597103a8feaSLen Brown 2598889facbeSLen Brown if (verbose) 259998481e79SLen Brown fprintf(stderr, "turbostat v3.8 14-Aug 2014" 2600103a8feaSLen Brown " - Len Brown <lenb@kernel.org>\n"); 2601103a8feaSLen Brown 2602103a8feaSLen Brown turbostat_init(); 2603103a8feaSLen Brown 
26043b4d5c7fSAndy Shevchenko /* dump counters and exit */ 26053b4d5c7fSAndy Shevchenko if (dump_only) 26063b4d5c7fSAndy Shevchenko return get_and_dump_counters(); 26073b4d5c7fSAndy Shevchenko 2608103a8feaSLen Brown /* 2609103a8feaSLen Brown * if any params left, it must be a command to fork 2610103a8feaSLen Brown */ 2611103a8feaSLen Brown if (argc - optind) 2612103a8feaSLen Brown return fork_it(argv + optind); 2613103a8feaSLen Brown else 2614103a8feaSLen Brown turbostat_loop(); 2615103a8feaSLen Brown 2616103a8feaSLen Brown return 0; 2617103a8feaSLen Brown } 2618