1103a8feaSLen Brown /* 2103a8feaSLen Brown * turbostat -- show CPU frequency and C-state residency 3103a8feaSLen Brown * on modern Intel turbo-capable processors. 4103a8feaSLen Brown * 5144b44b1SLen Brown * Copyright (c) 2013 Intel Corporation. 6103a8feaSLen Brown * Len Brown <len.brown@intel.com> 7103a8feaSLen Brown * 8103a8feaSLen Brown * This program is free software; you can redistribute it and/or modify it 9103a8feaSLen Brown * under the terms and conditions of the GNU General Public License, 10103a8feaSLen Brown * version 2, as published by the Free Software Foundation. 11103a8feaSLen Brown * 12103a8feaSLen Brown * This program is distributed in the hope it will be useful, but WITHOUT 13103a8feaSLen Brown * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 14103a8feaSLen Brown * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 15103a8feaSLen Brown * more details. 16103a8feaSLen Brown * 17103a8feaSLen Brown * You should have received a copy of the GNU General Public License along with 18103a8feaSLen Brown * this program; if not, write to the Free Software Foundation, Inc., 19103a8feaSLen Brown * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA. 20103a8feaSLen Brown */ 21103a8feaSLen Brown 2288c3281fSLen Brown #define _GNU_SOURCE 23b731f311SJosh Triplett #include MSRHEADER 2495aebc44SJosh Triplett #include <stdarg.h> 25103a8feaSLen Brown #include <stdio.h> 26b2c95d90SJosh Triplett #include <err.h> 27103a8feaSLen Brown #include <unistd.h> 28103a8feaSLen Brown #include <sys/types.h> 29103a8feaSLen Brown #include <sys/wait.h> 30103a8feaSLen Brown #include <sys/stat.h> 31103a8feaSLen Brown #include <sys/resource.h> 32103a8feaSLen Brown #include <fcntl.h> 33103a8feaSLen Brown #include <signal.h> 34103a8feaSLen Brown #include <sys/time.h> 35103a8feaSLen Brown #include <stdlib.h> 36103a8feaSLen Brown #include <dirent.h> 37103a8feaSLen Brown #include <string.h> 38103a8feaSLen Brown #include <ctype.h> 3988c3281fSLen Brown #include <sched.h> 402b92865eSJosh Triplett #include <cpuid.h> 41103a8feaSLen Brown 42103a8feaSLen Brown char *proc_stat = "/proc/stat"; 43103a8feaSLen Brown unsigned int interval_sec = 5; /* set with -i interval_sec */ 44103a8feaSLen Brown unsigned int verbose; /* set with -v */ 45889facbeSLen Brown unsigned int rapl_verbose; /* set with -R */ 465c56be9aSDirk Brandewie unsigned int rapl_joules; /* set with -J */ 47889facbeSLen Brown unsigned int thermal_verbose; /* set with -T */ 48*f591c38bSAndy Shevchenko unsigned int summary_only; /* set with -S */ 49103a8feaSLen Brown unsigned int skip_c0; 50103a8feaSLen Brown unsigned int skip_c1; 51103a8feaSLen Brown unsigned int do_nhm_cstates; 52103a8feaSLen Brown unsigned int do_snb_cstates; 53ca58710fSKristen Carlson Accardi unsigned int do_c8_c9_c10; 54144b44b1SLen Brown unsigned int do_slm_cstates; 55144b44b1SLen Brown unsigned int use_c1_residency_msr; 56103a8feaSLen Brown unsigned int has_aperf; 57889facbeSLen Brown unsigned int has_epb; 58103a8feaSLen Brown unsigned int units = 1000000000; /* Ghz etc */ 59103a8feaSLen Brown unsigned int genuine_intel; 60103a8feaSLen Brown unsigned int has_invariant_tsc; 61103a8feaSLen Brown unsigned int do_nehalem_platform_info; 62103a8feaSLen Brown unsigned int do_nehalem_turbo_ratio_limit; 636574a5d5SLen Brown unsigned int do_ivt_turbo_ratio_limit; 642f32edf1SLen Brown unsigned int extra_msr_offset32; 652f32edf1SLen Brown unsigned int extra_msr_offset64; 668e180f3cSLen Brown unsigned int extra_delta_offset32; 678e180f3cSLen Brown unsigned int extra_delta_offset64; 681ed51011SLen Brown int do_smi; 69103a8feaSLen Brown double bclk; 70103a8feaSLen Brown unsigned int show_pkg; 71103a8feaSLen Brown unsigned int show_core; 72103a8feaSLen Brown unsigned int show_cpu; 73c98d5d94SLen Brown unsigned int show_pkg_only; 74c98d5d94SLen Brown unsigned int show_core_only; 75c98d5d94SLen Brown char *output_buffer, *outp; 76889facbeSLen Brown unsigned int do_rapl; 77889facbeSLen Brown unsigned int do_dts; 78889facbeSLen Brown unsigned int do_ptm; 79889facbeSLen Brown unsigned int tcc_activation_temp; 80889facbeSLen Brown unsigned int tcc_activation_temp_override; 81889facbeSLen Brown double rapl_power_units, rapl_energy_units, rapl_time_units; 82889facbeSLen Brown double rapl_joule_counter_range; 83889facbeSLen Brown 84889facbeSLen Brown #define RAPL_PKG (1 << 0) 85e6f9bb3cSLen Brown /* 0x610 MSR_PKG_POWER_LIMIT */ 86e6f9bb3cSLen Brown /* 0x611 MSR_PKG_ENERGY_STATUS */ 87e6f9bb3cSLen Brown #define RAPL_PKG_PERF_STATUS (1 << 1) 88e6f9bb3cSLen Brown /* 0x613 MSR_PKG_PERF_STATUS */ 89e6f9bb3cSLen Brown #define RAPL_PKG_POWER_INFO (1 << 2) 90e6f9bb3cSLen Brown /* 0x614 MSR_PKG_POWER_INFO */ 91e6f9bb3cSLen Brown 92889facbeSLen Brown #define RAPL_DRAM (1 << 3) 93e6f9bb3cSLen Brown /* 0x618 MSR_DRAM_POWER_LIMIT */ 94e6f9bb3cSLen Brown /* 0x619 MSR_DRAM_ENERGY_STATUS */ 95e6f9bb3cSLen Brown /* 0x61c MSR_DRAM_POWER_INFO */ 96e6f9bb3cSLen Brown #define RAPL_DRAM_PERF_STATUS (1 << 4) 97e6f9bb3cSLen Brown /* 0x61b MSR_DRAM_PERF_STATUS */ 98e6f9bb3cSLen Brown 99e6f9bb3cSLen Brown #define RAPL_CORES (1 << 5) 100e6f9bb3cSLen Brown /* 0x638 MSR_PP0_POWER_LIMIT */ 101e6f9bb3cSLen Brown /* 0x639 MSR_PP0_ENERGY_STATUS */ 102e6f9bb3cSLen Brown #define RAPL_CORE_POLICY (1 << 6) 103e6f9bb3cSLen Brown /* 0x63a MSR_PP0_POLICY */ 104e6f9bb3cSLen Brown 105e6f9bb3cSLen Brown 106e6f9bb3cSLen Brown #define RAPL_GFX (1 << 7) 107e6f9bb3cSLen Brown /* 0x640 MSR_PP1_POWER_LIMIT */ 108e6f9bb3cSLen Brown /* 0x641 MSR_PP1_ENERGY_STATUS */ 109e6f9bb3cSLen Brown /* 0x642 MSR_PP1_POLICY */ 110889facbeSLen Brown #define TJMAX_DEFAULT 100 111889facbeSLen Brown 112889facbeSLen Brown #define MAX(a, b) ((a) > (b) ? (a) : (b)) 113103a8feaSLen Brown 114103a8feaSLen Brown int aperf_mperf_unstable; 115103a8feaSLen Brown int backwards_count; 116103a8feaSLen Brown char *progname; 117103a8feaSLen Brown 118c98d5d94SLen Brown cpu_set_t *cpu_present_set, *cpu_affinity_set; 119c98d5d94SLen Brown size_t cpu_present_setsize, cpu_affinity_setsize; 120c98d5d94SLen Brown 121c98d5d94SLen Brown struct thread_data { 122c98d5d94SLen Brown unsigned long long tsc; 123c98d5d94SLen Brown unsigned long long aperf; 124c98d5d94SLen Brown unsigned long long mperf; 125144b44b1SLen Brown unsigned long long c1; 1262f32edf1SLen Brown unsigned long long extra_msr64; 1278e180f3cSLen Brown unsigned long long extra_delta64; 1288e180f3cSLen Brown unsigned long long extra_msr32; 1298e180f3cSLen Brown unsigned long long extra_delta32; 1301ed51011SLen Brown unsigned int smi_count; 131c98d5d94SLen Brown unsigned int cpu_id; 132c98d5d94SLen Brown unsigned int flags; 133c98d5d94SLen Brown #define CPU_IS_FIRST_THREAD_IN_CORE 0x2 134c98d5d94SLen Brown #define CPU_IS_FIRST_CORE_IN_PACKAGE 0x4 135c98d5d94SLen Brown } *thread_even, *thread_odd; 136c98d5d94SLen Brown 137c98d5d94SLen Brown struct core_data { 138c98d5d94SLen Brown unsigned long long c3; 139c98d5d94SLen Brown unsigned long long c6; 140c98d5d94SLen Brown unsigned long long c7; 141889facbeSLen Brown unsigned int core_temp_c; 142c98d5d94SLen Brown unsigned int core_id; 143c98d5d94SLen Brown } *core_even, *core_odd; 144c98d5d94SLen Brown 145c98d5d94SLen Brown struct pkg_data { 146c98d5d94SLen Brown unsigned long long pc2; 147c98d5d94SLen Brown unsigned long long pc3; 148c98d5d94SLen Brown unsigned long long pc6; 149c98d5d94SLen Brown unsigned long long pc7; 150ca58710fSKristen Carlson Accardi unsigned long long pc8; 151ca58710fSKristen Carlson Accardi unsigned long long pc9; 152ca58710fSKristen Carlson Accardi unsigned long long pc10; 153c98d5d94SLen Brown unsigned int package_id; 154889facbeSLen Brown unsigned int energy_pkg; /* MSR_PKG_ENERGY_STATUS */ 155889facbeSLen Brown unsigned int energy_dram; /* MSR_DRAM_ENERGY_STATUS */ 156889facbeSLen Brown unsigned int energy_cores; /* MSR_PP0_ENERGY_STATUS */ 157889facbeSLen Brown unsigned int energy_gfx; /* MSR_PP1_ENERGY_STATUS */ 158889facbeSLen Brown unsigned int rapl_pkg_perf_status; /* MSR_PKG_PERF_STATUS */ 159889facbeSLen Brown unsigned int rapl_dram_perf_status; /* MSR_DRAM_PERF_STATUS */ 160889facbeSLen Brown unsigned int pkg_temp_c; 161889facbeSLen Brown 162c98d5d94SLen Brown } *package_even, *package_odd; 163c98d5d94SLen Brown 164c98d5d94SLen Brown #define ODD_COUNTERS thread_odd, core_odd, package_odd 165c98d5d94SLen Brown #define EVEN_COUNTERS thread_even, core_even, package_even 166c98d5d94SLen Brown 167c98d5d94SLen Brown #define GET_THREAD(thread_base, thread_no, core_no, pkg_no) \ 168c98d5d94SLen Brown (thread_base + (pkg_no) * topo.num_cores_per_pkg * \ 169c98d5d94SLen Brown topo.num_threads_per_core + \ 170c98d5d94SLen Brown (core_no) * topo.num_threads_per_core + (thread_no)) 171c98d5d94SLen Brown #define GET_CORE(core_base, core_no, pkg_no) \ 172c98d5d94SLen Brown (core_base + (pkg_no) * topo.num_cores_per_pkg + (core_no)) 173c98d5d94SLen Brown #define GET_PKG(pkg_base, pkg_no) (pkg_base + pkg_no) 174c98d5d94SLen Brown 175c98d5d94SLen Brown struct system_summary { 176c98d5d94SLen Brown struct thread_data threads; 177c98d5d94SLen Brown struct core_data cores; 178c98d5d94SLen Brown struct pkg_data packages; 179c98d5d94SLen Brown } sum, average; 180c98d5d94SLen Brown 181c98d5d94SLen Brown 182c98d5d94SLen Brown struct topo_params { 183c98d5d94SLen Brown int num_packages; 184103a8feaSLen Brown int num_cpus; 185c98d5d94SLen Brown int num_cores; 186c98d5d94SLen Brown int max_cpu_num; 187c98d5d94SLen Brown int num_cores_per_pkg; 188c98d5d94SLen Brown int num_threads_per_core; 189c98d5d94SLen Brown } topo; 190103a8feaSLen Brown 191c98d5d94SLen Brown struct timeval tv_even, tv_odd, tv_delta; 192103a8feaSLen Brown 193c98d5d94SLen Brown void setup_all_buffers(void); 194103a8feaSLen Brown 195c98d5d94SLen Brown int cpu_is_not_present(int cpu) 196d15cf7c1SLen Brown { 197c98d5d94SLen Brown return !CPU_ISSET_S(cpu, cpu_present_setsize, cpu_present_set); 198c98d5d94SLen Brown } 199c98d5d94SLen Brown /* 200c98d5d94SLen Brown * run func(thread, core, package) in topology order 201c98d5d94SLen Brown * skip non-present cpus 202c98d5d94SLen Brown */ 203c98d5d94SLen Brown 204c98d5d94SLen Brown int for_all_cpus(int (func)(struct thread_data *, struct core_data *, struct pkg_data *), 205c98d5d94SLen Brown struct thread_data *thread_base, struct core_data *core_base, struct pkg_data *pkg_base) 206c98d5d94SLen Brown { 207c98d5d94SLen Brown int retval, pkg_no, core_no, thread_no; 208c98d5d94SLen Brown 209c98d5d94SLen Brown for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) { 210c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 211c98d5d94SLen Brown for (thread_no = 0; thread_no < 212c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 213c98d5d94SLen Brown struct thread_data *t; 214c98d5d94SLen Brown struct core_data *c; 215c98d5d94SLen Brown struct pkg_data *p; 216c98d5d94SLen Brown 217c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 218c98d5d94SLen Brown 219c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 220c98d5d94SLen Brown continue; 221c98d5d94SLen Brown 222c98d5d94SLen Brown c = GET_CORE(core_base, core_no, pkg_no); 223c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 224c98d5d94SLen Brown 225c98d5d94SLen Brown retval = func(t, c, p); 226c98d5d94SLen Brown if (retval) 227c98d5d94SLen Brown return retval; 228c98d5d94SLen Brown } 229c98d5d94SLen Brown } 230c98d5d94SLen Brown } 231d15cf7c1SLen Brown return 0; 232d15cf7c1SLen Brown } 233d15cf7c1SLen Brown 23488c3281fSLen Brown int cpu_migrate(int cpu) 23588c3281fSLen Brown { 236c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 237c98d5d94SLen Brown CPU_SET_S(cpu, cpu_affinity_setsize, cpu_affinity_set); 238c98d5d94SLen Brown if (sched_setaffinity(0, cpu_affinity_setsize, cpu_affinity_set) == -1) 23988c3281fSLen Brown return -1; 24088c3281fSLen Brown else 24188c3281fSLen Brown return 0; 24288c3281fSLen Brown } 24388c3281fSLen Brown 24415aaa346SLen Brown int get_msr(int cpu, off_t offset, unsigned long long *msr) 245103a8feaSLen Brown { 246103a8feaSLen Brown ssize_t retval; 247103a8feaSLen Brown char pathname[32]; 248103a8feaSLen Brown int fd; 249103a8feaSLen Brown 250103a8feaSLen Brown sprintf(pathname, "/dev/cpu/%d/msr", cpu); 251103a8feaSLen Brown fd = open(pathname, O_RDONLY); 25215aaa346SLen Brown if (fd < 0) 25315aaa346SLen Brown return -1; 254103a8feaSLen Brown 25515aaa346SLen Brown retval = pread(fd, msr, sizeof *msr, offset); 256103a8feaSLen Brown close(fd); 25715aaa346SLen Brown 258d91bb17cSLen Brown if (retval != sizeof *msr) { 2592e9c6bc7SJosh Triplett fprintf(stderr, "%s offset 0x%llx read failed\n", pathname, (unsigned long long)offset); 26015aaa346SLen Brown return -1; 261d91bb17cSLen Brown } 26215aaa346SLen Brown 26315aaa346SLen Brown return 0; 264103a8feaSLen Brown } 265103a8feaSLen Brown 266a829eb4dSLen Brown void print_header(void) 267103a8feaSLen Brown { 268103a8feaSLen Brown if (show_pkg) 269c98d5d94SLen Brown outp += sprintf(outp, "pk"); 270e23da037SLen Brown if (show_pkg) 271c98d5d94SLen Brown outp += sprintf(outp, " "); 272103a8feaSLen Brown if (show_core) 273c98d5d94SLen Brown outp += sprintf(outp, "cor"); 274103a8feaSLen Brown if (show_cpu) 275c98d5d94SLen Brown outp += sprintf(outp, " CPU"); 276e23da037SLen Brown if (show_pkg || show_core || show_cpu) 277c98d5d94SLen Brown outp += sprintf(outp, " "); 278103a8feaSLen Brown if (do_nhm_cstates) 279c98d5d94SLen Brown outp += sprintf(outp, " %%c0"); 280103a8feaSLen Brown if (has_aperf) 281c98d5d94SLen Brown outp += sprintf(outp, " GHz"); 282c98d5d94SLen Brown outp += sprintf(outp, " TSC"); 2831ed51011SLen Brown if (do_smi) 2841ed51011SLen Brown outp += sprintf(outp, " SMI"); 2858e180f3cSLen Brown if (extra_delta_offset32) 286f9240813SLen Brown outp += sprintf(outp, " count 0x%03X", extra_delta_offset32); 2878e180f3cSLen Brown if (extra_delta_offset64) 288f9240813SLen Brown outp += sprintf(outp, " COUNT 0x%03X", extra_delta_offset64); 2892f32edf1SLen Brown if (extra_msr_offset32) 2908e180f3cSLen Brown outp += sprintf(outp, " MSR 0x%03X", extra_msr_offset32); 2912f32edf1SLen Brown if (extra_msr_offset64) 2928e180f3cSLen Brown outp += sprintf(outp, " MSR 0x%03X", extra_msr_offset64); 293103a8feaSLen Brown if (do_nhm_cstates) 294c98d5d94SLen Brown outp += sprintf(outp, " %%c1"); 295144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 296c98d5d94SLen Brown outp += sprintf(outp, " %%c3"); 297103a8feaSLen Brown if (do_nhm_cstates) 298c98d5d94SLen Brown outp += sprintf(outp, " %%c6"); 299103a8feaSLen Brown if (do_snb_cstates) 300c98d5d94SLen Brown outp += sprintf(outp, " %%c7"); 301889facbeSLen Brown 302889facbeSLen Brown if (do_dts) 303889facbeSLen Brown outp += sprintf(outp, " CTMP"); 304889facbeSLen Brown if (do_ptm) 305889facbeSLen Brown outp += sprintf(outp, " PTMP"); 306889facbeSLen Brown 307103a8feaSLen Brown if (do_snb_cstates) 308c98d5d94SLen Brown outp += sprintf(outp, " %%pc2"); 309144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 310c98d5d94SLen Brown outp += sprintf(outp, " %%pc3"); 311144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 312c98d5d94SLen Brown outp += sprintf(outp, " %%pc6"); 313103a8feaSLen Brown if (do_snb_cstates) 314c98d5d94SLen Brown outp += sprintf(outp, " %%pc7"); 315ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 316ca58710fSKristen Carlson Accardi outp += sprintf(outp, " %%pc8"); 317ca58710fSKristen Carlson Accardi outp += sprintf(outp, " %%pc9"); 318ca58710fSKristen Carlson Accardi outp += sprintf(outp, " %%pc10"); 319ca58710fSKristen Carlson Accardi } 320103a8feaSLen Brown 3215c56be9aSDirk Brandewie if (do_rapl && !rapl_joules) { 322889facbeSLen Brown if (do_rapl & RAPL_PKG) 323889facbeSLen Brown outp += sprintf(outp, " Pkg_W"); 324889facbeSLen Brown if (do_rapl & RAPL_CORES) 325889facbeSLen Brown outp += sprintf(outp, " Cor_W"); 326889facbeSLen Brown if (do_rapl & RAPL_GFX) 327889facbeSLen Brown outp += sprintf(outp, " GFX_W"); 328889facbeSLen Brown if (do_rapl & RAPL_DRAM) 329889facbeSLen Brown outp += sprintf(outp, " RAM_W"); 330889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) 331889facbeSLen Brown outp += sprintf(outp, " PKG_%%"); 332889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) 333889facbeSLen Brown outp += sprintf(outp, " RAM_%%"); 3345c56be9aSDirk Brandewie } else { 3355c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG) 3365c56be9aSDirk Brandewie outp += sprintf(outp, " Pkg_J"); 3375c56be9aSDirk Brandewie if (do_rapl & RAPL_CORES) 3385c56be9aSDirk Brandewie outp += sprintf(outp, " Cor_J"); 3395c56be9aSDirk Brandewie if (do_rapl & RAPL_GFX) 3405c56be9aSDirk Brandewie outp += sprintf(outp, " GFX_J"); 3415c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM) 3425c56be9aSDirk Brandewie outp += sprintf(outp, " RAM_W"); 3435c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG_PERF_STATUS) 3445c56be9aSDirk Brandewie outp += sprintf(outp, " PKG_%%"); 3455c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM_PERF_STATUS) 3465c56be9aSDirk Brandewie outp += sprintf(outp, " RAM_%%"); 3475c56be9aSDirk Brandewie outp += sprintf(outp, " time"); 348889facbeSLen Brown 3495c56be9aSDirk Brandewie } 350c98d5d94SLen Brown outp += sprintf(outp, "\n"); 351103a8feaSLen Brown } 352103a8feaSLen Brown 353c98d5d94SLen Brown int dump_counters(struct thread_data *t, struct core_data *c, 354c98d5d94SLen Brown struct pkg_data *p) 355103a8feaSLen Brown { 356c98d5d94SLen Brown fprintf(stderr, "t %p, c %p, p %p\n", t, c, p); 357c98d5d94SLen Brown 358c98d5d94SLen Brown if (t) { 359c98d5d94SLen Brown fprintf(stderr, "CPU: %d flags 0x%x\n", t->cpu_id, t->flags); 360c98d5d94SLen Brown fprintf(stderr, "TSC: %016llX\n", t->tsc); 361c98d5d94SLen Brown fprintf(stderr, "aperf: %016llX\n", t->aperf); 362c98d5d94SLen Brown fprintf(stderr, "mperf: %016llX\n", t->mperf); 363c98d5d94SLen Brown fprintf(stderr, "c1: %016llX\n", t->c1); 3648e180f3cSLen Brown fprintf(stderr, "msr0x%x: %08llX\n", 3658e180f3cSLen Brown extra_delta_offset32, t->extra_delta32); 3668e180f3cSLen Brown fprintf(stderr, "msr0x%x: %016llX\n", 3678e180f3cSLen Brown extra_delta_offset64, t->extra_delta64); 3688e180f3cSLen Brown fprintf(stderr, "msr0x%x: %08llX\n", 3692f32edf1SLen Brown extra_msr_offset32, t->extra_msr32); 370c98d5d94SLen Brown fprintf(stderr, "msr0x%x: %016llX\n", 3712f32edf1SLen Brown extra_msr_offset64, t->extra_msr64); 3721ed51011SLen Brown if (do_smi) 3731ed51011SLen Brown fprintf(stderr, "SMI: %08X\n", t->smi_count); 374103a8feaSLen Brown } 375103a8feaSLen Brown 376c98d5d94SLen Brown if (c) { 377c98d5d94SLen Brown fprintf(stderr, "core: %d\n", c->core_id); 378c98d5d94SLen Brown fprintf(stderr, "c3: %016llX\n", c->c3); 379c98d5d94SLen Brown fprintf(stderr, "c6: %016llX\n", c->c6); 380c98d5d94SLen Brown fprintf(stderr, "c7: %016llX\n", c->c7); 381889facbeSLen Brown fprintf(stderr, "DTS: %dC\n", c->core_temp_c); 382c98d5d94SLen Brown } 383103a8feaSLen Brown 384c98d5d94SLen Brown if (p) { 385c98d5d94SLen Brown fprintf(stderr, "package: %d\n", p->package_id); 386c98d5d94SLen Brown fprintf(stderr, "pc2: %016llX\n", p->pc2); 387c98d5d94SLen Brown fprintf(stderr, "pc3: %016llX\n", p->pc3); 388c98d5d94SLen Brown fprintf(stderr, "pc6: %016llX\n", p->pc6); 389c98d5d94SLen Brown fprintf(stderr, "pc7: %016llX\n", p->pc7); 390ca58710fSKristen Carlson Accardi fprintf(stderr, "pc8: %016llX\n", p->pc8); 391ca58710fSKristen Carlson Accardi fprintf(stderr, "pc9: %016llX\n", p->pc9); 392ca58710fSKristen Carlson Accardi fprintf(stderr, "pc10: %016llX\n", p->pc10); 393889facbeSLen Brown fprintf(stderr, "Joules PKG: %0X\n", p->energy_pkg); 394889facbeSLen Brown fprintf(stderr, "Joules COR: %0X\n", p->energy_cores); 395889facbeSLen Brown fprintf(stderr, "Joules GFX: %0X\n", p->energy_gfx); 396889facbeSLen Brown fprintf(stderr, "Joules RAM: %0X\n", p->energy_dram); 397889facbeSLen Brown fprintf(stderr, "Throttle PKG: %0X\n", p->rapl_pkg_perf_status); 398889facbeSLen Brown fprintf(stderr, "Throttle RAM: %0X\n", p->rapl_dram_perf_status); 399889facbeSLen Brown fprintf(stderr, "PTM: %dC\n", p->pkg_temp_c); 400c98d5d94SLen Brown } 401c98d5d94SLen Brown return 0; 402103a8feaSLen Brown } 403103a8feaSLen Brown 404e23da037SLen Brown /* 405e23da037SLen Brown * column formatting convention & formats 406e23da037SLen Brown * package: "pk" 2 columns %2d 407e23da037SLen Brown * core: "cor" 3 columns %3d 408e23da037SLen Brown * CPU: "CPU" 3 columns %3d 409889facbeSLen Brown * Pkg_W: %6.2 410889facbeSLen Brown * Cor_W: %6.2 411889facbeSLen Brown * GFX_W: %5.2 412889facbeSLen Brown * RAM_W: %5.2 413e23da037SLen Brown * GHz: "GHz" 3 columns %3.2 414e23da037SLen Brown * TSC: "TSC" 3 columns %3.2 4151ed51011SLen Brown * SMI: "SMI" 4 columns %4d 416e23da037SLen Brown * percentage " %pc3" %6.2 417889facbeSLen Brown * Perf Status percentage: %5.2 418889facbeSLen Brown * "CTMP" 4 columns %4d 419e23da037SLen Brown */ 420c98d5d94SLen Brown int format_counters(struct thread_data *t, struct core_data *c, 421c98d5d94SLen Brown struct pkg_data *p) 422103a8feaSLen Brown { 423103a8feaSLen Brown double interval_float; 424889facbeSLen Brown char *fmt5, *fmt6; 425103a8feaSLen Brown 426c98d5d94SLen Brown /* if showing only 1st thread in core and this isn't one, bail out */ 427c98d5d94SLen Brown if (show_core_only && !(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 428c98d5d94SLen Brown return 0; 429c98d5d94SLen Brown 430c98d5d94SLen Brown /* if showing only 1st thread in pkg and this isn't one, bail out */ 431c98d5d94SLen Brown if (show_pkg_only && !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 432c98d5d94SLen Brown return 0; 433c98d5d94SLen Brown 434103a8feaSLen Brown interval_float = tv_delta.tv_sec + tv_delta.tv_usec/1000000.0; 435103a8feaSLen Brown 436c98d5d94SLen Brown /* topo columns, print blanks on 1st (average) line */ 437c98d5d94SLen Brown if (t == &average.threads) { 438103a8feaSLen Brown if (show_pkg) 439c98d5d94SLen Brown outp += sprintf(outp, " "); 440e23da037SLen Brown if (show_pkg && show_core) 441c98d5d94SLen Brown outp += sprintf(outp, " "); 442103a8feaSLen Brown if (show_core) 443c98d5d94SLen Brown outp += sprintf(outp, " "); 444103a8feaSLen Brown if (show_cpu) 445c98d5d94SLen Brown outp += sprintf(outp, " " " "); 446103a8feaSLen Brown } else { 447c98d5d94SLen Brown if (show_pkg) { 448c98d5d94SLen Brown if (p) 449c98d5d94SLen Brown outp += sprintf(outp, "%2d", p->package_id); 450c98d5d94SLen Brown else 451c98d5d94SLen Brown outp += sprintf(outp, " "); 452c98d5d94SLen Brown } 453e23da037SLen Brown if (show_pkg && show_core) 454c98d5d94SLen Brown outp += sprintf(outp, " "); 455c98d5d94SLen Brown if (show_core) { 456c98d5d94SLen Brown if (c) 457c98d5d94SLen Brown outp += sprintf(outp, "%3d", c->core_id); 458c98d5d94SLen Brown else 459c98d5d94SLen Brown outp += sprintf(outp, " "); 460c98d5d94SLen Brown } 461103a8feaSLen Brown if (show_cpu) 462c98d5d94SLen Brown outp += sprintf(outp, " %3d", t->cpu_id); 463103a8feaSLen Brown } 464103a8feaSLen Brown /* %c0 */ 465103a8feaSLen Brown if (do_nhm_cstates) { 466e23da037SLen Brown if (show_pkg || show_core || show_cpu) 467c98d5d94SLen Brown outp += sprintf(outp, " "); 468103a8feaSLen Brown if (!skip_c0) 469c98d5d94SLen Brown outp += sprintf(outp, "%6.2f", 100.0 * t->mperf/t->tsc); 470103a8feaSLen Brown else 471c98d5d94SLen Brown outp += sprintf(outp, " ****"); 472103a8feaSLen Brown } 473103a8feaSLen Brown 474103a8feaSLen Brown /* GHz */ 475103a8feaSLen Brown if (has_aperf) { 476103a8feaSLen Brown if (!aperf_mperf_unstable) { 477c98d5d94SLen Brown outp += sprintf(outp, " %3.2f", 478c98d5d94SLen Brown 1.0 * t->tsc / units * t->aperf / 479c98d5d94SLen Brown t->mperf / interval_float); 480103a8feaSLen Brown } else { 481c98d5d94SLen Brown if (t->aperf > t->tsc || t->mperf > t->tsc) { 482c98d5d94SLen Brown outp += sprintf(outp, " ***"); 483103a8feaSLen Brown } else { 484c98d5d94SLen Brown outp += sprintf(outp, "%3.1f*", 485c98d5d94SLen Brown 1.0 * t->tsc / 486c98d5d94SLen Brown units * t->aperf / 487c98d5d94SLen Brown t->mperf / interval_float); 488103a8feaSLen Brown } 489103a8feaSLen Brown } 490103a8feaSLen Brown } 491103a8feaSLen Brown 492103a8feaSLen Brown /* TSC */ 493c98d5d94SLen Brown outp += sprintf(outp, "%5.2f", 1.0 * t->tsc/units/interval_float); 494103a8feaSLen Brown 4951ed51011SLen Brown /* SMI */ 4961ed51011SLen Brown if (do_smi) 4971ed51011SLen Brown outp += sprintf(outp, "%4d", t->smi_count); 4981ed51011SLen Brown 4998e180f3cSLen Brown /* delta */ 5008e180f3cSLen Brown if (extra_delta_offset32) 5018e180f3cSLen Brown outp += sprintf(outp, " %11llu", t->extra_delta32); 5028e180f3cSLen Brown 5038e180f3cSLen Brown /* DELTA */ 5048e180f3cSLen Brown if (extra_delta_offset64) 5058e180f3cSLen Brown outp += sprintf(outp, " %11llu", t->extra_delta64); 5062f32edf1SLen Brown /* msr */ 5072f32edf1SLen Brown if (extra_msr_offset32) 5088e180f3cSLen Brown outp += sprintf(outp, " 0x%08llx", t->extra_msr32); 5092f32edf1SLen Brown 510130ff304SLen Brown /* MSR */ 5112f32edf1SLen Brown if (extra_msr_offset64) 5122f32edf1SLen Brown outp += sprintf(outp, " 0x%016llx", t->extra_msr64); 513130ff304SLen Brown 514103a8feaSLen Brown if (do_nhm_cstates) { 515103a8feaSLen Brown if (!skip_c1) 516c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * t->c1/t->tsc); 517103a8feaSLen Brown else 518c98d5d94SLen Brown outp += sprintf(outp, " ****"); 519103a8feaSLen Brown } 520c98d5d94SLen Brown 521c98d5d94SLen Brown /* print per-core data only for 1st thread in core */ 522c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 523c98d5d94SLen Brown goto done; 524c98d5d94SLen Brown 525144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 526c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * c->c3/t->tsc); 527103a8feaSLen Brown if (do_nhm_cstates) 528c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * c->c6/t->tsc); 529103a8feaSLen Brown if (do_snb_cstates) 530c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * c->c7/t->tsc); 531c98d5d94SLen Brown 532889facbeSLen Brown if (do_dts) 533889facbeSLen Brown outp += sprintf(outp, " %4d", c->core_temp_c); 534889facbeSLen Brown 535c98d5d94SLen Brown /* print per-package data only for 1st core in package */ 536c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 537c98d5d94SLen Brown goto done; 538c98d5d94SLen Brown 539889facbeSLen Brown if (do_ptm) 540889facbeSLen Brown outp += sprintf(outp, " %4d", p->pkg_temp_c); 541889facbeSLen Brown 542103a8feaSLen Brown if (do_snb_cstates) 543c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc2/t->tsc); 544144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 545c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc3/t->tsc); 546144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) 547c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc6/t->tsc); 548103a8feaSLen Brown if (do_snb_cstates) 549c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc7/t->tsc); 550ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 551ca58710fSKristen Carlson Accardi outp += sprintf(outp, " %6.2f", 100.0 * p->pc8/t->tsc); 552ca58710fSKristen Carlson Accardi outp += sprintf(outp, " %6.2f", 100.0 * p->pc9/t->tsc); 553ca58710fSKristen Carlson Accardi outp += sprintf(outp, " %6.2f", 100.0 * p->pc10/t->tsc); 554ca58710fSKristen Carlson Accardi } 555889facbeSLen Brown 556889facbeSLen Brown /* 557889facbeSLen Brown * If measurement interval exceeds minimum RAPL Joule Counter range, 558889facbeSLen Brown * indicate that results are suspect by printing "**" in fraction place. 559889facbeSLen Brown */ 560889facbeSLen Brown if (interval_float < rapl_joule_counter_range) { 561889facbeSLen Brown fmt5 = " %5.2f"; 562889facbeSLen Brown fmt6 = " %6.2f"; 563889facbeSLen Brown } else { 564889facbeSLen Brown fmt5 = " %3.0f**"; 565889facbeSLen Brown fmt6 = " %4.0f**"; 566889facbeSLen Brown } 567889facbeSLen Brown 5685c56be9aSDirk Brandewie if (do_rapl && !rapl_joules) { 569889facbeSLen Brown if (do_rapl & RAPL_PKG) 570889facbeSLen Brown outp += sprintf(outp, fmt6, p->energy_pkg * rapl_energy_units / interval_float); 571889facbeSLen Brown if (do_rapl & RAPL_CORES) 572889facbeSLen Brown outp += sprintf(outp, fmt6, p->energy_cores * rapl_energy_units / interval_float); 573889facbeSLen Brown if (do_rapl & RAPL_GFX) 574889facbeSLen Brown outp += sprintf(outp, fmt5, p->energy_gfx * rapl_energy_units / interval_float); 575889facbeSLen Brown if (do_rapl & RAPL_DRAM) 576889facbeSLen Brown outp += sprintf(outp, fmt5, p->energy_dram * rapl_energy_units / interval_float); 577889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) 578889facbeSLen Brown outp += sprintf(outp, fmt5, 100.0 * p->rapl_pkg_perf_status * rapl_time_units / interval_float); 579889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) 580889facbeSLen Brown outp += sprintf(outp, fmt5, 100.0 * p->rapl_dram_perf_status * rapl_time_units / interval_float); 5815c56be9aSDirk Brandewie } else { 5825c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG) 5835c56be9aSDirk Brandewie outp += sprintf(outp, fmt6, 5845c56be9aSDirk Brandewie p->energy_pkg * rapl_energy_units); 5855c56be9aSDirk Brandewie if (do_rapl & RAPL_CORES) 5865c56be9aSDirk Brandewie outp += sprintf(outp, fmt6, 5875c56be9aSDirk Brandewie p->energy_cores * rapl_energy_units); 5885c56be9aSDirk Brandewie if (do_rapl & RAPL_GFX) 5895c56be9aSDirk Brandewie outp += sprintf(outp, fmt5, 5905c56be9aSDirk Brandewie p->energy_gfx * rapl_energy_units); 5915c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM) 5925c56be9aSDirk Brandewie outp += sprintf(outp, fmt5, 5935c56be9aSDirk Brandewie p->energy_dram * rapl_energy_units); 5945c56be9aSDirk Brandewie if (do_rapl & RAPL_PKG_PERF_STATUS) 5955c56be9aSDirk Brandewie outp += sprintf(outp, fmt5, 100.0 * p->rapl_pkg_perf_status * rapl_time_units / interval_float); 5965c56be9aSDirk Brandewie if (do_rapl & RAPL_DRAM_PERF_STATUS) 5975c56be9aSDirk Brandewie outp += sprintf(outp, fmt5, 100.0 * p->rapl_dram_perf_status * rapl_time_units / interval_float); 5985c56be9aSDirk Brandewie outp += sprintf(outp, fmt5, interval_float); 599889facbeSLen Brown 6005c56be9aSDirk Brandewie } 601c98d5d94SLen Brown done: 602c98d5d94SLen Brown outp += sprintf(outp, "\n"); 603c98d5d94SLen Brown 604c98d5d94SLen Brown return 0; 605103a8feaSLen Brown } 606103a8feaSLen Brown 607c98d5d94SLen Brown void flush_stdout() 608103a8feaSLen Brown { 609c98d5d94SLen Brown fputs(output_buffer, stdout); 610ddac0d68SLen Brown fflush(stdout); 611c98d5d94SLen Brown outp = output_buffer; 612c98d5d94SLen Brown } 613c98d5d94SLen Brown void flush_stderr() 614c98d5d94SLen Brown { 615c98d5d94SLen Brown fputs(output_buffer, stderr); 616c98d5d94SLen Brown outp = output_buffer; 617c98d5d94SLen Brown } 618c98d5d94SLen Brown void format_all_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 619c98d5d94SLen Brown { 620e23da037SLen Brown static int printed; 621103a8feaSLen Brown 622e23da037SLen Brown if (!printed || !summary_only) 623103a8feaSLen Brown print_header(); 624103a8feaSLen Brown 625c98d5d94SLen Brown if (topo.num_cpus > 1) 626c98d5d94SLen Brown format_counters(&average.threads, &average.cores, 627c98d5d94SLen Brown &average.packages); 628103a8feaSLen Brown 629e23da037SLen Brown printed = 1; 630e23da037SLen Brown 631e23da037SLen Brown if (summary_only) 632e23da037SLen Brown return; 633e23da037SLen Brown 634c98d5d94SLen Brown for_all_cpus(format_counters, t, c, p); 635103a8feaSLen Brown } 636103a8feaSLen Brown 637889facbeSLen Brown #define DELTA_WRAP32(new, old) \ 638889facbeSLen Brown if (new > old) { \ 639889facbeSLen Brown old = new - old; \ 640889facbeSLen Brown } else { \ 641889facbeSLen Brown old = 0x100000000 + new - old; \ 642889facbeSLen Brown } 643889facbeSLen Brown 644c98d5d94SLen Brown void 645c98d5d94SLen Brown delta_package(struct pkg_data *new, struct pkg_data *old) 646103a8feaSLen Brown { 647c98d5d94SLen Brown old->pc2 = new->pc2 - old->pc2; 648c98d5d94SLen Brown old->pc3 = new->pc3 - old->pc3; 649c98d5d94SLen Brown old->pc6 = new->pc6 - old->pc6; 650c98d5d94SLen Brown old->pc7 = new->pc7 - old->pc7; 651ca58710fSKristen Carlson Accardi old->pc8 = new->pc8 - old->pc8; 652ca58710fSKristen Carlson Accardi old->pc9 = new->pc9 - old->pc9; 653ca58710fSKristen Carlson Accardi old->pc10 = new->pc10 - old->pc10; 654889facbeSLen Brown old->pkg_temp_c = new->pkg_temp_c; 655889facbeSLen Brown 656889facbeSLen Brown DELTA_WRAP32(new->energy_pkg, old->energy_pkg); 657889facbeSLen Brown DELTA_WRAP32(new->energy_cores, old->energy_cores); 658889facbeSLen Brown DELTA_WRAP32(new->energy_gfx, old->energy_gfx); 659889facbeSLen Brown DELTA_WRAP32(new->energy_dram, old->energy_dram); 660889facbeSLen Brown DELTA_WRAP32(new->rapl_pkg_perf_status, old->rapl_pkg_perf_status); 661889facbeSLen Brown DELTA_WRAP32(new->rapl_dram_perf_status, old->rapl_dram_perf_status); 662103a8feaSLen Brown } 663103a8feaSLen Brown 664c98d5d94SLen Brown void 665c98d5d94SLen Brown delta_core(struct core_data *new, struct core_data *old) 666c98d5d94SLen Brown { 667c98d5d94SLen Brown old->c3 = new->c3 - old->c3; 668c98d5d94SLen Brown old->c6 = new->c6 - old->c6; 669c98d5d94SLen Brown old->c7 = new->c7 - old->c7; 670889facbeSLen Brown old->core_temp_c = new->core_temp_c; 671103a8feaSLen Brown } 672c98d5d94SLen Brown 673c3ae331dSLen Brown /* 674c3ae331dSLen Brown * old = new - old 675c3ae331dSLen Brown */ 676c98d5d94SLen Brown void 677c98d5d94SLen Brown delta_thread(struct thread_data *new, struct thread_data *old, 678c98d5d94SLen Brown struct core_data *core_delta) 679c98d5d94SLen Brown { 680c98d5d94SLen Brown old->tsc = new->tsc - old->tsc; 681c98d5d94SLen Brown 682103a8feaSLen Brown /* check for TSC < 1 Mcycles over interval */ 683b2c95d90SJosh Triplett if (old->tsc < (1000 * 1000)) 684b2c95d90SJosh Triplett errx(-3, "Insanely slow TSC rate, TSC stops in idle?\n" 685b2c95d90SJosh Triplett "You can disable all c-states by booting with \"idle=poll\"\n" 686b2c95d90SJosh Triplett "or just the deep ones with \"processor.max_cstate=1\""); 687103a8feaSLen Brown 688c98d5d94SLen Brown old->c1 = new->c1 - old->c1; 689c98d5d94SLen Brown 690c98d5d94SLen Brown if ((new->aperf > old->aperf) && (new->mperf > old->mperf)) { 691c98d5d94SLen Brown old->aperf = new->aperf - old->aperf; 692c98d5d94SLen Brown old->mperf = new->mperf - old->mperf; 693c98d5d94SLen Brown } else { 694c98d5d94SLen Brown 695103a8feaSLen Brown if (!aperf_mperf_unstable) { 696103a8feaSLen Brown fprintf(stderr, "%s: APERF or MPERF went backwards *\n", progname); 697103a8feaSLen Brown fprintf(stderr, "* Frequency results do not cover entire interval *\n"); 698103a8feaSLen Brown fprintf(stderr, "* fix this by running Linux-2.6.30 or later *\n"); 699103a8feaSLen Brown 700103a8feaSLen Brown aperf_mperf_unstable = 1; 701103a8feaSLen Brown } 702103a8feaSLen Brown /* 703103a8feaSLen Brown * mperf delta is likely a huge "positive" number 704103a8feaSLen Brown * can not use it for calculating c0 time 705103a8feaSLen Brown */ 706103a8feaSLen Brown skip_c0 = 1; 707103a8feaSLen Brown skip_c1 = 1; 708103a8feaSLen Brown } 709103a8feaSLen Brown 710c98d5d94SLen Brown 711144b44b1SLen Brown if (use_c1_residency_msr) { 712144b44b1SLen Brown /* 713144b44b1SLen Brown * Some models have a dedicated C1 residency MSR, 714144b44b1SLen Brown * which should be more accurate than the derivation below. 715144b44b1SLen Brown */ 716144b44b1SLen Brown } else { 717103a8feaSLen Brown /* 718c3ae331dSLen Brown * As counter collection is not atomic, 719c3ae331dSLen Brown * it is possible for mperf's non-halted cycles + idle states 720103a8feaSLen Brown * to exceed TSC's all cycles: show c1 = 0% in that case. 721103a8feaSLen Brown */ 722c3ae331dSLen Brown if ((old->mperf + core_delta->c3 + core_delta->c6 + core_delta->c7) > old->tsc) 723c98d5d94SLen Brown old->c1 = 0; 724c98d5d94SLen Brown else { 725c98d5d94SLen Brown /* normal case, derive c1 */ 726c98d5d94SLen Brown old->c1 = old->tsc - old->mperf - core_delta->c3 727c98d5d94SLen Brown - core_delta->c6 - core_delta->c7; 728c98d5d94SLen Brown } 729144b44b1SLen Brown } 730c3ae331dSLen Brown 731c98d5d94SLen Brown if (old->mperf == 0) { 732c3ae331dSLen Brown if (verbose > 1) fprintf(stderr, "cpu%d MPERF 0!\n", old->cpu_id); 733c98d5d94SLen Brown old->mperf = 1; /* divide by 0 protection */ 734c98d5d94SLen Brown } 735103a8feaSLen Brown 7368e180f3cSLen Brown old->extra_delta32 = new->extra_delta32 - old->extra_delta32; 7378e180f3cSLen Brown old->extra_delta32 &= 0xFFFFFFFF; 7388e180f3cSLen Brown 7398e180f3cSLen Brown old->extra_delta64 = new->extra_delta64 - old->extra_delta64; 7408e180f3cSLen Brown 741103a8feaSLen Brown /* 7428e180f3cSLen Brown * Extra MSR is just a snapshot, simply copy latest w/o subtracting 743103a8feaSLen Brown */ 7442f32edf1SLen Brown old->extra_msr32 = new->extra_msr32; 7452f32edf1SLen Brown old->extra_msr64 = new->extra_msr64; 7461ed51011SLen Brown 7471ed51011SLen Brown if (do_smi) 7481ed51011SLen Brown old->smi_count = new->smi_count - old->smi_count; 749103a8feaSLen Brown } 750c98d5d94SLen Brown 751c98d5d94SLen Brown int delta_cpu(struct thread_data *t, struct core_data *c, 752c98d5d94SLen Brown struct pkg_data *p, struct thread_data *t2, 753c98d5d94SLen Brown struct core_data *c2, struct pkg_data *p2) 754c98d5d94SLen Brown { 755c98d5d94SLen Brown /* calculate core delta only for 1st thread in core */ 756c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_THREAD_IN_CORE) 757c98d5d94SLen Brown delta_core(c, c2); 758c98d5d94SLen Brown 759c98d5d94SLen Brown /* always calculate thread delta */ 760c98d5d94SLen Brown delta_thread(t, t2, c2); /* c2 is core delta */ 761c98d5d94SLen Brown 762c98d5d94SLen Brown /* calculate package delta only for 1st core in package */ 763c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE) 764c98d5d94SLen Brown delta_package(p, p2); 765c98d5d94SLen Brown 766103a8feaSLen Brown return 0; 767103a8feaSLen Brown } 768103a8feaSLen Brown 769c98d5d94SLen Brown void clear_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 770103a8feaSLen Brown { 771c98d5d94SLen Brown t->tsc = 0; 772c98d5d94SLen Brown t->aperf = 0; 773c98d5d94SLen Brown t->mperf = 0; 774c98d5d94SLen Brown t->c1 = 0; 775103a8feaSLen Brown 7761ed51011SLen Brown t->smi_count = 0; 7778e180f3cSLen Brown t->extra_delta32 = 0; 7788e180f3cSLen Brown t->extra_delta64 = 0; 7798e180f3cSLen Brown 780c98d5d94SLen Brown /* tells format_counters to dump all fields from this set */ 781c98d5d94SLen Brown t->flags = CPU_IS_FIRST_THREAD_IN_CORE | CPU_IS_FIRST_CORE_IN_PACKAGE; 782c98d5d94SLen Brown 783c98d5d94SLen Brown c->c3 = 0; 784c98d5d94SLen Brown c->c6 = 0; 785c98d5d94SLen Brown c->c7 = 0; 786889facbeSLen Brown c->core_temp_c = 0; 787c98d5d94SLen Brown 788c98d5d94SLen Brown p->pc2 = 0; 789c98d5d94SLen Brown p->pc3 = 0; 790c98d5d94SLen Brown p->pc6 = 0; 791c98d5d94SLen Brown p->pc7 = 0; 792ca58710fSKristen Carlson Accardi p->pc8 = 0; 793ca58710fSKristen Carlson Accardi p->pc9 = 0; 794ca58710fSKristen Carlson Accardi p->pc10 = 0; 795889facbeSLen Brown 796889facbeSLen Brown p->energy_pkg = 0; 797889facbeSLen Brown p->energy_dram = 0; 798889facbeSLen Brown p->energy_cores = 0; 799889facbeSLen Brown p->energy_gfx = 0; 800889facbeSLen Brown p->rapl_pkg_perf_status = 0; 801889facbeSLen Brown p->rapl_dram_perf_status = 0; 802889facbeSLen Brown p->pkg_temp_c = 0; 803103a8feaSLen Brown } 804c98d5d94SLen Brown int sum_counters(struct thread_data *t, struct core_data *c, 805c98d5d94SLen Brown struct pkg_data *p) 806103a8feaSLen Brown { 807c98d5d94SLen Brown average.threads.tsc += t->tsc; 808c98d5d94SLen Brown average.threads.aperf += t->aperf; 809c98d5d94SLen Brown average.threads.mperf += t->mperf; 810c98d5d94SLen Brown average.threads.c1 += t->c1; 81115aaa346SLen Brown 8128e180f3cSLen Brown average.threads.extra_delta32 += t->extra_delta32; 8138e180f3cSLen Brown average.threads.extra_delta64 += t->extra_delta64; 8148e180f3cSLen Brown 815c98d5d94SLen Brown /* sum per-core values only for 1st thread in core */ 816c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 817c98d5d94SLen Brown return 0; 818c98d5d94SLen Brown 819c98d5d94SLen Brown average.cores.c3 += c->c3; 820c98d5d94SLen Brown average.cores.c6 += c->c6; 821c98d5d94SLen Brown average.cores.c7 += c->c7; 822c98d5d94SLen Brown 823889facbeSLen Brown average.cores.core_temp_c = MAX(average.cores.core_temp_c, c->core_temp_c); 824889facbeSLen Brown 825c98d5d94SLen Brown /* sum per-pkg values only for 1st core in pkg */ 826c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 827c98d5d94SLen Brown return 0; 828c98d5d94SLen Brown 829c98d5d94SLen Brown average.packages.pc2 += p->pc2; 830c98d5d94SLen Brown average.packages.pc3 += p->pc3; 831c98d5d94SLen Brown average.packages.pc6 += p->pc6; 832c98d5d94SLen Brown average.packages.pc7 += p->pc7; 833ca58710fSKristen Carlson Accardi average.packages.pc8 += p->pc8; 834ca58710fSKristen Carlson Accardi average.packages.pc9 += p->pc9; 835ca58710fSKristen Carlson Accardi average.packages.pc10 += p->pc10; 836c98d5d94SLen Brown 837889facbeSLen Brown average.packages.energy_pkg += p->energy_pkg; 838889facbeSLen Brown average.packages.energy_dram += p->energy_dram; 839889facbeSLen Brown average.packages.energy_cores += p->energy_cores; 840889facbeSLen Brown average.packages.energy_gfx += p->energy_gfx; 841889facbeSLen Brown 842889facbeSLen Brown average.packages.pkg_temp_c = MAX(average.packages.pkg_temp_c, p->pkg_temp_c); 843889facbeSLen Brown 844889facbeSLen Brown average.packages.rapl_pkg_perf_status += p->rapl_pkg_perf_status; 845889facbeSLen Brown average.packages.rapl_dram_perf_status += p->rapl_dram_perf_status; 846c98d5d94SLen Brown return 0; 847c98d5d94SLen Brown } 848c98d5d94SLen Brown /* 849c98d5d94SLen Brown * sum the counters for all cpus in the system 850c98d5d94SLen Brown * compute the weighted average 851c98d5d94SLen Brown */ 852c98d5d94SLen Brown void compute_average(struct thread_data *t, struct core_data *c, 853c98d5d94SLen Brown struct pkg_data *p) 854c98d5d94SLen Brown { 855c98d5d94SLen Brown clear_counters(&average.threads, &average.cores, &average.packages); 856c98d5d94SLen Brown 857c98d5d94SLen Brown for_all_cpus(sum_counters, t, c, p); 858c98d5d94SLen Brown 859c98d5d94SLen Brown average.threads.tsc /= topo.num_cpus; 860c98d5d94SLen Brown average.threads.aperf /= topo.num_cpus; 861c98d5d94SLen Brown average.threads.mperf /= topo.num_cpus; 862c98d5d94SLen Brown average.threads.c1 /= topo.num_cpus; 863c98d5d94SLen Brown 8648e180f3cSLen Brown average.threads.extra_delta32 /= topo.num_cpus; 8658e180f3cSLen Brown average.threads.extra_delta32 &= 0xFFFFFFFF; 8668e180f3cSLen Brown 8678e180f3cSLen Brown average.threads.extra_delta64 /= topo.num_cpus; 8688e180f3cSLen Brown 869c98d5d94SLen Brown average.cores.c3 /= topo.num_cores; 870c98d5d94SLen Brown average.cores.c6 /= topo.num_cores; 871c98d5d94SLen Brown average.cores.c7 /= topo.num_cores; 872c98d5d94SLen Brown 873c98d5d94SLen Brown average.packages.pc2 /= topo.num_packages; 874c98d5d94SLen Brown average.packages.pc3 /= topo.num_packages; 875c98d5d94SLen Brown average.packages.pc6 /= topo.num_packages; 876c98d5d94SLen Brown average.packages.pc7 /= topo.num_packages; 877ca58710fSKristen Carlson Accardi 878ca58710fSKristen Carlson Accardi average.packages.pc8 /= topo.num_packages; 879ca58710fSKristen Carlson Accardi average.packages.pc9 /= topo.num_packages; 880ca58710fSKristen Carlson Accardi average.packages.pc10 /= topo.num_packages; 881c98d5d94SLen Brown } 882c98d5d94SLen Brown 883c98d5d94SLen Brown static unsigned long long rdtsc(void) 884c98d5d94SLen Brown { 885c98d5d94SLen Brown unsigned int low, high; 886c98d5d94SLen Brown 887c98d5d94SLen Brown asm volatile("rdtsc" : "=a" (low), "=d" (high)); 888c98d5d94SLen Brown 889c98d5d94SLen Brown return low | ((unsigned long long)high) << 32; 890c98d5d94SLen Brown } 891c98d5d94SLen Brown 892c98d5d94SLen Brown 893c98d5d94SLen Brown /* 894c98d5d94SLen Brown * get_counters(...) 895c98d5d94SLen Brown * migrate to cpu 896c98d5d94SLen Brown * acquire and record local counters for that cpu 897c98d5d94SLen Brown */ 898c98d5d94SLen Brown int get_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 899c98d5d94SLen Brown { 900c98d5d94SLen Brown int cpu = t->cpu_id; 901889facbeSLen Brown unsigned long long msr; 902c98d5d94SLen Brown 903e52966c0SLen Brown if (cpu_migrate(cpu)) { 904e52966c0SLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 90515aaa346SLen Brown return -1; 906e52966c0SLen Brown } 90715aaa346SLen Brown 908c98d5d94SLen Brown t->tsc = rdtsc(); /* we are running on local CPU of interest */ 90915aaa346SLen Brown 91015aaa346SLen Brown if (has_aperf) { 9119c63a650SLen Brown if (get_msr(cpu, MSR_IA32_APERF, &t->aperf)) 912c98d5d94SLen Brown return -3; 9139c63a650SLen Brown if (get_msr(cpu, MSR_IA32_MPERF, &t->mperf)) 914c98d5d94SLen Brown return -4; 91588c3281fSLen Brown } 91688c3281fSLen Brown 9171ed51011SLen Brown if (do_smi) { 9181ed51011SLen Brown if (get_msr(cpu, MSR_SMI_COUNT, &msr)) 9191ed51011SLen Brown return -5; 9201ed51011SLen Brown t->smi_count = msr & 0xFFFFFFFF; 9211ed51011SLen Brown } 9228e180f3cSLen Brown if (extra_delta_offset32) { 923889facbeSLen Brown if (get_msr(cpu, extra_delta_offset32, &msr)) 9242f32edf1SLen Brown return -5; 925889facbeSLen Brown t->extra_delta32 = msr & 0xFFFFFFFF; 9268e180f3cSLen Brown } 9278e180f3cSLen Brown 9288e180f3cSLen Brown if (extra_delta_offset64) 9298e180f3cSLen Brown if (get_msr(cpu, extra_delta_offset64, &t->extra_delta64)) 9308e180f3cSLen Brown return -5; 9318e180f3cSLen Brown 9328e180f3cSLen Brown if (extra_msr_offset32) { 933889facbeSLen Brown if (get_msr(cpu, extra_msr_offset32, &msr)) 9348e180f3cSLen Brown return -5; 935889facbeSLen Brown t->extra_msr32 = msr & 0xFFFFFFFF; 9368e180f3cSLen Brown } 9372f32edf1SLen Brown 9382f32edf1SLen Brown if (extra_msr_offset64) 9392f32edf1SLen Brown if (get_msr(cpu, extra_msr_offset64, &t->extra_msr64)) 940c98d5d94SLen Brown return -5; 941c98d5d94SLen Brown 942144b44b1SLen Brown if (use_c1_residency_msr) { 943144b44b1SLen Brown if (get_msr(cpu, MSR_CORE_C1_RES, &t->c1)) 944144b44b1SLen Brown return -6; 945144b44b1SLen Brown } 946144b44b1SLen Brown 947c98d5d94SLen Brown /* collect core counters only for 1st thread in core */ 948c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 949c98d5d94SLen Brown return 0; 950c98d5d94SLen Brown 951144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) { 952c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C3_RESIDENCY, &c->c3)) 953c98d5d94SLen Brown return -6; 954144b44b1SLen Brown } 955144b44b1SLen Brown 956144b44b1SLen Brown if (do_nhm_cstates) { 957c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C6_RESIDENCY, &c->c6)) 958c98d5d94SLen Brown return -7; 959103a8feaSLen Brown } 96015aaa346SLen Brown 96115aaa346SLen Brown if (do_snb_cstates) 962c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C7_RESIDENCY, &c->c7)) 963c98d5d94SLen Brown return -8; 964c98d5d94SLen Brown 965889facbeSLen Brown if (do_dts) { 966889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr)) 967889facbeSLen Brown return -9; 968889facbeSLen Brown c->core_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F); 969889facbeSLen Brown } 970889facbeSLen Brown 971889facbeSLen Brown 972c98d5d94SLen Brown /* collect package counters only for 1st core in package */ 973c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 974c98d5d94SLen Brown return 0; 97515aaa346SLen Brown 976144b44b1SLen Brown if (do_nhm_cstates && !do_slm_cstates) { 977c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C3_RESIDENCY, &p->pc3)) 978c98d5d94SLen Brown return -9; 979c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C6_RESIDENCY, &p->pc6)) 980c98d5d94SLen Brown return -10; 98115aaa346SLen Brown } 98215aaa346SLen Brown if (do_snb_cstates) { 983c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C2_RESIDENCY, &p->pc2)) 984c98d5d94SLen Brown return -11; 985c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C7_RESIDENCY, &p->pc7)) 986c98d5d94SLen Brown return -12; 98715aaa346SLen Brown } 988ca58710fSKristen Carlson Accardi if (do_c8_c9_c10) { 989ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C8_RESIDENCY, &p->pc8)) 990ca58710fSKristen Carlson Accardi return -13; 991ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C9_RESIDENCY, &p->pc9)) 992ca58710fSKristen Carlson Accardi return -13; 993ca58710fSKristen Carlson Accardi if (get_msr(cpu, MSR_PKG_C10_RESIDENCY, &p->pc10)) 994ca58710fSKristen Carlson Accardi return -13; 995ca58710fSKristen Carlson Accardi } 996889facbeSLen Brown if (do_rapl & RAPL_PKG) { 997889facbeSLen Brown if (get_msr(cpu, MSR_PKG_ENERGY_STATUS, &msr)) 998889facbeSLen Brown return -13; 999889facbeSLen Brown p->energy_pkg = msr & 0xFFFFFFFF; 1000889facbeSLen Brown } 1001889facbeSLen Brown if (do_rapl & RAPL_CORES) { 1002889facbeSLen Brown if (get_msr(cpu, MSR_PP0_ENERGY_STATUS, &msr)) 1003889facbeSLen Brown return -14; 1004889facbeSLen Brown p->energy_cores = msr & 0xFFFFFFFF; 1005889facbeSLen Brown } 1006889facbeSLen Brown if (do_rapl & RAPL_DRAM) { 1007889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_ENERGY_STATUS, &msr)) 1008889facbeSLen Brown return -15; 1009889facbeSLen Brown p->energy_dram = msr & 0xFFFFFFFF; 1010889facbeSLen Brown } 1011889facbeSLen Brown if (do_rapl & RAPL_GFX) { 1012889facbeSLen Brown if (get_msr(cpu, MSR_PP1_ENERGY_STATUS, &msr)) 1013889facbeSLen Brown return -16; 1014889facbeSLen Brown p->energy_gfx = msr & 0xFFFFFFFF; 1015889facbeSLen Brown } 1016889facbeSLen Brown if (do_rapl & RAPL_PKG_PERF_STATUS) { 1017889facbeSLen Brown if (get_msr(cpu, MSR_PKG_PERF_STATUS, &msr)) 1018889facbeSLen Brown return -16; 1019889facbeSLen Brown p->rapl_pkg_perf_status = msr & 0xFFFFFFFF; 1020889facbeSLen Brown } 1021889facbeSLen Brown if (do_rapl & RAPL_DRAM_PERF_STATUS) { 1022889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_PERF_STATUS, &msr)) 1023889facbeSLen Brown return -16; 1024889facbeSLen Brown p->rapl_dram_perf_status = msr & 0xFFFFFFFF; 1025889facbeSLen Brown } 1026889facbeSLen Brown if (do_ptm) { 1027889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, &msr)) 1028889facbeSLen Brown return -17; 1029889facbeSLen Brown p->pkg_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F); 1030889facbeSLen Brown } 103115aaa346SLen Brown return 0; 1032103a8feaSLen Brown } 1033103a8feaSLen Brown 1034c98d5d94SLen Brown void print_verbose_header(void) 1035103a8feaSLen Brown { 1036103a8feaSLen Brown unsigned long long msr; 1037103a8feaSLen Brown unsigned int ratio; 1038103a8feaSLen Brown 1039103a8feaSLen Brown if (!do_nehalem_platform_info) 1040103a8feaSLen Brown return; 1041103a8feaSLen Brown 10429c63a650SLen Brown get_msr(0, MSR_NHM_PLATFORM_INFO, &msr); 1043103a8feaSLen Brown 1044889facbeSLen Brown fprintf(stderr, "cpu0: MSR_NHM_PLATFORM_INFO: 0x%08llx\n", msr); 10456574a5d5SLen Brown 1046103a8feaSLen Brown ratio = (msr >> 40) & 0xFF; 1047103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max efficiency\n", 1048103a8feaSLen Brown ratio, bclk, ratio * bclk); 1049103a8feaSLen Brown 1050103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 1051103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz TSC frequency\n", 1052103a8feaSLen Brown ratio, bclk, ratio * bclk); 1053103a8feaSLen Brown 105467920418SLen Brown get_msr(0, MSR_IA32_POWER_CTL, &msr); 1055144b44b1SLen Brown fprintf(stderr, "cpu0: MSR_IA32_POWER_CTL: 0x%08llx (C1E auto-promotion: %sabled)\n", 105667920418SLen Brown msr, msr & 0x2 ? "EN" : "DIS"); 105767920418SLen Brown 10586574a5d5SLen Brown if (!do_ivt_turbo_ratio_limit) 10596574a5d5SLen Brown goto print_nhm_turbo_ratio_limits; 10606574a5d5SLen Brown 10616574a5d5SLen Brown get_msr(0, MSR_IVT_TURBO_RATIO_LIMIT, &msr); 10626574a5d5SLen Brown 1063889facbeSLen Brown fprintf(stderr, "cpu0: MSR_IVT_TURBO_RATIO_LIMIT: 0x%08llx\n", msr); 10646574a5d5SLen Brown 10656574a5d5SLen Brown ratio = (msr >> 56) & 0xFF; 10666574a5d5SLen Brown if (ratio) 10676574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 16 active cores\n", 10686574a5d5SLen Brown ratio, bclk, ratio * bclk); 10696574a5d5SLen Brown 10706574a5d5SLen Brown ratio = (msr >> 48) & 0xFF; 10716574a5d5SLen Brown if (ratio) 10726574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 15 active cores\n", 10736574a5d5SLen Brown ratio, bclk, ratio * bclk); 10746574a5d5SLen Brown 10756574a5d5SLen Brown ratio = (msr >> 40) & 0xFF; 10766574a5d5SLen Brown if (ratio) 10776574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 14 active cores\n", 10786574a5d5SLen Brown ratio, bclk, ratio * bclk); 10796574a5d5SLen Brown 10806574a5d5SLen Brown ratio = (msr >> 32) & 0xFF; 10816574a5d5SLen Brown if (ratio) 10826574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 13 active cores\n", 10836574a5d5SLen Brown ratio, bclk, ratio * bclk); 10846574a5d5SLen Brown 10856574a5d5SLen Brown ratio = (msr >> 24) & 0xFF; 10866574a5d5SLen Brown if (ratio) 10876574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 12 active cores\n", 10886574a5d5SLen Brown ratio, bclk, ratio * bclk); 10896574a5d5SLen Brown 10906574a5d5SLen Brown ratio = (msr >> 16) & 0xFF; 10916574a5d5SLen Brown if (ratio) 10926574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 11 active cores\n", 10936574a5d5SLen Brown ratio, bclk, ratio * bclk); 10946574a5d5SLen Brown 10956574a5d5SLen Brown ratio = (msr >> 8) & 0xFF; 10966574a5d5SLen Brown if (ratio) 10976574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 10 active cores\n", 10986574a5d5SLen Brown ratio, bclk, ratio * bclk); 10996574a5d5SLen Brown 11006574a5d5SLen Brown ratio = (msr >> 0) & 0xFF; 11016574a5d5SLen Brown if (ratio) 11026574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 9 active cores\n", 11036574a5d5SLen Brown ratio, bclk, ratio * bclk); 11046574a5d5SLen Brown 11056574a5d5SLen Brown print_nhm_turbo_ratio_limits: 1106889facbeSLen Brown get_msr(0, MSR_NHM_SNB_PKG_CST_CFG_CTL, &msr); 1107889facbeSLen Brown 1108889facbeSLen Brown #define SNB_C1_AUTO_UNDEMOTE (1UL << 27) 1109889facbeSLen Brown #define SNB_C3_AUTO_UNDEMOTE (1UL << 28) 1110889facbeSLen Brown 1111889facbeSLen Brown fprintf(stderr, "cpu0: MSR_NHM_SNB_PKG_CST_CFG_CTL: 0x%08llx", msr); 1112889facbeSLen Brown 1113889facbeSLen Brown fprintf(stderr, " (%s%s%s%s%slocked: pkg-cstate-limit=%d: ", 1114889facbeSLen Brown (msr & SNB_C3_AUTO_UNDEMOTE) ? "UNdemote-C3, " : "", 1115889facbeSLen Brown (msr & SNB_C1_AUTO_UNDEMOTE) ? "UNdemote-C1, " : "", 1116889facbeSLen Brown (msr & NHM_C3_AUTO_DEMOTE) ? "demote-C3, " : "", 1117889facbeSLen Brown (msr & NHM_C1_AUTO_DEMOTE) ? "demote-C1, " : "", 1118889facbeSLen Brown (msr & (1 << 15)) ? "" : "UN", 1119889facbeSLen Brown (unsigned int)msr & 7); 1120889facbeSLen Brown 1121889facbeSLen Brown 1122889facbeSLen Brown switch(msr & 0x7) { 1123889facbeSLen Brown case 0: 1124144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "no pkg states" : "pc0"); 1125889facbeSLen Brown break; 1126889facbeSLen Brown case 1: 1127144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "no pkg states" : do_snb_cstates ? "pc2" : "pc0"); 1128889facbeSLen Brown break; 1129889facbeSLen Brown case 2: 1130144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "invalid" : do_snb_cstates ? "pc6-noret" : "pc3"); 1131889facbeSLen Brown break; 1132889facbeSLen Brown case 3: 1133144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "invalid" : "pc6"); 1134889facbeSLen Brown break; 1135889facbeSLen Brown case 4: 1136144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "pc4" : "pc7"); 1137889facbeSLen Brown break; 1138889facbeSLen Brown case 5: 1139144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "invalid" : do_snb_cstates ? "pc7s" : "invalid"); 1140144b44b1SLen Brown break; 1141144b44b1SLen Brown case 6: 1142144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "pc6" : "invalid"); 1143889facbeSLen Brown break; 1144889facbeSLen Brown case 7: 1145144b44b1SLen Brown fprintf(stderr, do_slm_cstates ? "pc7" : "unlimited"); 1146889facbeSLen Brown break; 1147889facbeSLen Brown default: 1148889facbeSLen Brown fprintf(stderr, "invalid"); 1149889facbeSLen Brown } 1150889facbeSLen Brown fprintf(stderr, ")\n"); 1151103a8feaSLen Brown 1152103a8feaSLen Brown if (!do_nehalem_turbo_ratio_limit) 1153103a8feaSLen Brown return; 1154103a8feaSLen Brown 11559c63a650SLen Brown get_msr(0, MSR_NHM_TURBO_RATIO_LIMIT, &msr); 1156103a8feaSLen Brown 1157889facbeSLen Brown fprintf(stderr, "cpu0: MSR_NHM_TURBO_RATIO_LIMIT: 0x%08llx\n", msr); 11586574a5d5SLen Brown 11596574a5d5SLen Brown ratio = (msr >> 56) & 0xFF; 11606574a5d5SLen Brown if (ratio) 11616574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 8 active cores\n", 11626574a5d5SLen Brown ratio, bclk, ratio * bclk); 11636574a5d5SLen Brown 11646574a5d5SLen Brown ratio = (msr >> 48) & 0xFF; 11656574a5d5SLen Brown if (ratio) 11666574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 7 active cores\n", 11676574a5d5SLen Brown ratio, bclk, ratio * bclk); 11686574a5d5SLen Brown 11696574a5d5SLen Brown ratio = (msr >> 40) & 0xFF; 11706574a5d5SLen Brown if (ratio) 11716574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 6 active cores\n", 11726574a5d5SLen Brown ratio, bclk, ratio * bclk); 11736574a5d5SLen Brown 11746574a5d5SLen Brown ratio = (msr >> 32) & 0xFF; 11756574a5d5SLen Brown if (ratio) 11766574a5d5SLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 5 active cores\n", 11776574a5d5SLen Brown ratio, bclk, ratio * bclk); 11786574a5d5SLen Brown 1179103a8feaSLen Brown ratio = (msr >> 24) & 0xFF; 1180103a8feaSLen Brown if (ratio) 1181103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 4 active cores\n", 1182103a8feaSLen Brown ratio, bclk, ratio * bclk); 1183103a8feaSLen Brown 1184103a8feaSLen Brown ratio = (msr >> 16) & 0xFF; 1185103a8feaSLen Brown if (ratio) 1186103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 3 active cores\n", 1187103a8feaSLen Brown ratio, bclk, ratio * bclk); 1188103a8feaSLen Brown 1189103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 1190103a8feaSLen Brown if (ratio) 1191103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 2 active cores\n", 1192103a8feaSLen Brown ratio, bclk, ratio * bclk); 1193103a8feaSLen Brown 1194103a8feaSLen Brown ratio = (msr >> 0) & 0xFF; 1195103a8feaSLen Brown if (ratio) 1196103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 1 active cores\n", 1197103a8feaSLen Brown ratio, bclk, ratio * bclk); 1198103a8feaSLen Brown } 1199103a8feaSLen Brown 1200c98d5d94SLen Brown void free_all_buffers(void) 1201103a8feaSLen Brown { 1202c98d5d94SLen Brown CPU_FREE(cpu_present_set); 1203c98d5d94SLen Brown cpu_present_set = NULL; 1204c98d5d94SLen Brown cpu_present_set = 0; 1205103a8feaSLen Brown 1206c98d5d94SLen Brown CPU_FREE(cpu_affinity_set); 1207c98d5d94SLen Brown cpu_affinity_set = NULL; 1208c98d5d94SLen Brown cpu_affinity_setsize = 0; 1209103a8feaSLen Brown 1210c98d5d94SLen Brown free(thread_even); 1211c98d5d94SLen Brown free(core_even); 1212c98d5d94SLen Brown free(package_even); 1213103a8feaSLen Brown 1214c98d5d94SLen Brown thread_even = NULL; 1215c98d5d94SLen Brown core_even = NULL; 1216c98d5d94SLen Brown package_even = NULL; 1217103a8feaSLen Brown 1218c98d5d94SLen Brown free(thread_odd); 1219c98d5d94SLen Brown free(core_odd); 1220c98d5d94SLen Brown free(package_odd); 1221103a8feaSLen Brown 1222c98d5d94SLen Brown thread_odd = NULL; 1223c98d5d94SLen Brown core_odd = NULL; 1224c98d5d94SLen Brown package_odd = NULL; 1225103a8feaSLen Brown 1226c98d5d94SLen Brown free(output_buffer); 1227c98d5d94SLen Brown output_buffer = NULL; 1228c98d5d94SLen Brown outp = NULL; 1229103a8feaSLen Brown } 1230103a8feaSLen Brown 1231103a8feaSLen Brown /* 123257a42a34SJosh Triplett * Open a file, and exit on failure 123357a42a34SJosh Triplett */ 123457a42a34SJosh Triplett FILE *fopen_or_die(const char *path, const char *mode) 123557a42a34SJosh Triplett { 123657a42a34SJosh Triplett FILE *filep = fopen(path, "r"); 1237b2c95d90SJosh Triplett if (!filep) 1238b2c95d90SJosh Triplett err(1, "%s: open failed", path); 123957a42a34SJosh Triplett return filep; 124057a42a34SJosh Triplett } 124157a42a34SJosh Triplett 124257a42a34SJosh Triplett /* 124395aebc44SJosh Triplett * Parse a file containing a single int. 124495aebc44SJosh Triplett */ 124595aebc44SJosh Triplett int parse_int_file(const char *fmt, ...) 124695aebc44SJosh Triplett { 124795aebc44SJosh Triplett va_list args; 124895aebc44SJosh Triplett char path[PATH_MAX]; 124995aebc44SJosh Triplett FILE *filep; 125095aebc44SJosh Triplett int value; 125195aebc44SJosh Triplett 125295aebc44SJosh Triplett va_start(args, fmt); 125395aebc44SJosh Triplett vsnprintf(path, sizeof(path), fmt, args); 125495aebc44SJosh Triplett va_end(args); 125557a42a34SJosh Triplett filep = fopen_or_die(path, "r"); 1256b2c95d90SJosh Triplett if (fscanf(filep, "%d", &value) != 1) 1257b2c95d90SJosh Triplett err(1, "%s: failed to parse number from file", path); 125895aebc44SJosh Triplett fclose(filep); 125995aebc44SJosh Triplett return value; 126095aebc44SJosh Triplett } 126195aebc44SJosh Triplett 126295aebc44SJosh Triplett /* 1263c98d5d94SLen Brown * cpu_is_first_sibling_in_core(cpu) 1264c98d5d94SLen Brown * return 1 if given CPU is 1st HT sibling in the core 1265103a8feaSLen Brown */ 1266c98d5d94SLen Brown int cpu_is_first_sibling_in_core(int cpu) 1267103a8feaSLen Brown { 126895aebc44SJosh Triplett return cpu == parse_int_file("/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu); 1269c98d5d94SLen Brown } 1270103a8feaSLen Brown 1271c98d5d94SLen Brown /* 1272c98d5d94SLen Brown * cpu_is_first_core_in_package(cpu) 1273c98d5d94SLen Brown * return 1 if given CPU is 1st core in package 1274c98d5d94SLen Brown */ 1275c98d5d94SLen Brown int cpu_is_first_core_in_package(int cpu) 1276c98d5d94SLen Brown { 127795aebc44SJosh Triplett return cpu == parse_int_file("/sys/devices/system/cpu/cpu%d/topology/core_siblings_list", cpu); 1278103a8feaSLen Brown } 1279103a8feaSLen Brown 1280103a8feaSLen Brown int get_physical_package_id(int cpu) 1281103a8feaSLen Brown { 128295aebc44SJosh Triplett return parse_int_file("/sys/devices/system/cpu/cpu%d/topology/physical_package_id", cpu); 1283103a8feaSLen Brown } 1284103a8feaSLen Brown 1285103a8feaSLen Brown int get_core_id(int cpu) 1286103a8feaSLen Brown { 128795aebc44SJosh Triplett return parse_int_file("/sys/devices/system/cpu/cpu%d/topology/core_id", cpu); 1288103a8feaSLen Brown } 1289103a8feaSLen Brown 1290c98d5d94SLen Brown int get_num_ht_siblings(int cpu) 1291c98d5d94SLen Brown { 1292c98d5d94SLen Brown char path[80]; 1293c98d5d94SLen Brown FILE *filep; 1294c98d5d94SLen Brown int sib1, sib2; 1295c98d5d94SLen Brown int matches; 1296c98d5d94SLen Brown char character; 1297c98d5d94SLen Brown 1298c98d5d94SLen Brown sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu); 129957a42a34SJosh Triplett filep = fopen_or_die(path, "r"); 1300103a8feaSLen Brown /* 1301c98d5d94SLen Brown * file format: 1302c98d5d94SLen Brown * if a pair of number with a character between: 2 siblings (eg. 1-2, or 1,4) 1303c98d5d94SLen Brown * otherwinse 1 sibling (self). 1304c98d5d94SLen Brown */ 1305c98d5d94SLen Brown matches = fscanf(filep, "%d%c%d\n", &sib1, &character, &sib2); 1306c98d5d94SLen Brown 1307c98d5d94SLen Brown fclose(filep); 1308c98d5d94SLen Brown 1309c98d5d94SLen Brown if (matches == 3) 1310c98d5d94SLen Brown return 2; 1311c98d5d94SLen Brown else 1312c98d5d94SLen Brown return 1; 1313c98d5d94SLen Brown } 1314c98d5d94SLen Brown 1315c98d5d94SLen Brown /* 1316c98d5d94SLen Brown * run func(thread, core, package) in topology order 1317c98d5d94SLen Brown * skip non-present cpus 1318103a8feaSLen Brown */ 1319103a8feaSLen Brown 1320c98d5d94SLen Brown int for_all_cpus_2(int (func)(struct thread_data *, struct core_data *, 1321c98d5d94SLen Brown struct pkg_data *, struct thread_data *, struct core_data *, 1322c98d5d94SLen Brown struct pkg_data *), struct thread_data *thread_base, 1323c98d5d94SLen Brown struct core_data *core_base, struct pkg_data *pkg_base, 1324c98d5d94SLen Brown struct thread_data *thread_base2, struct core_data *core_base2, 1325c98d5d94SLen Brown struct pkg_data *pkg_base2) 1326c98d5d94SLen Brown { 1327c98d5d94SLen Brown int retval, pkg_no, core_no, thread_no; 1328c98d5d94SLen Brown 1329c98d5d94SLen Brown for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) { 1330c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 1331c98d5d94SLen Brown for (thread_no = 0; thread_no < 1332c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 1333c98d5d94SLen Brown struct thread_data *t, *t2; 1334c98d5d94SLen Brown struct core_data *c, *c2; 1335c98d5d94SLen Brown struct pkg_data *p, *p2; 1336c98d5d94SLen Brown 1337c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 1338c98d5d94SLen Brown 1339c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 1340c98d5d94SLen Brown continue; 1341c98d5d94SLen Brown 1342c98d5d94SLen Brown t2 = GET_THREAD(thread_base2, thread_no, core_no, pkg_no); 1343c98d5d94SLen Brown 1344c98d5d94SLen Brown c = GET_CORE(core_base, core_no, pkg_no); 1345c98d5d94SLen Brown c2 = GET_CORE(core_base2, core_no, pkg_no); 1346c98d5d94SLen Brown 1347c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 1348c98d5d94SLen Brown p2 = GET_PKG(pkg_base2, pkg_no); 1349c98d5d94SLen Brown 1350c98d5d94SLen Brown retval = func(t, c, p, t2, c2, p2); 1351c98d5d94SLen Brown if (retval) 1352c98d5d94SLen Brown return retval; 1353c98d5d94SLen Brown } 1354c98d5d94SLen Brown } 1355c98d5d94SLen Brown } 1356c98d5d94SLen Brown return 0; 1357c98d5d94SLen Brown } 1358c98d5d94SLen Brown 1359c98d5d94SLen Brown /* 1360c98d5d94SLen Brown * run func(cpu) on every cpu in /proc/stat 1361c98d5d94SLen Brown * return max_cpu number 1362c98d5d94SLen Brown */ 1363c98d5d94SLen Brown int for_all_proc_cpus(int (func)(int)) 1364103a8feaSLen Brown { 1365103a8feaSLen Brown FILE *fp; 1366c98d5d94SLen Brown int cpu_num; 1367103a8feaSLen Brown int retval; 1368103a8feaSLen Brown 136957a42a34SJosh Triplett fp = fopen_or_die(proc_stat, "r"); 1370103a8feaSLen Brown 1371103a8feaSLen Brown retval = fscanf(fp, "cpu %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n"); 1372b2c95d90SJosh Triplett if (retval != 0) 1373b2c95d90SJosh Triplett err(1, "%s: failed to parse format", proc_stat); 1374103a8feaSLen Brown 1375c98d5d94SLen Brown while (1) { 1376c98d5d94SLen Brown retval = fscanf(fp, "cpu%u %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n", &cpu_num); 1377103a8feaSLen Brown if (retval != 1) 1378103a8feaSLen Brown break; 1379103a8feaSLen Brown 1380c98d5d94SLen Brown retval = func(cpu_num); 1381c98d5d94SLen Brown if (retval) { 1382c98d5d94SLen Brown fclose(fp); 1383c98d5d94SLen Brown return(retval); 1384c98d5d94SLen Brown } 1385103a8feaSLen Brown } 1386103a8feaSLen Brown fclose(fp); 1387c98d5d94SLen Brown return 0; 1388103a8feaSLen Brown } 1389103a8feaSLen Brown 1390103a8feaSLen Brown void re_initialize(void) 1391103a8feaSLen Brown { 1392c98d5d94SLen Brown free_all_buffers(); 1393c98d5d94SLen Brown setup_all_buffers(); 1394c98d5d94SLen Brown printf("turbostat: re-initialized with num_cpus %d\n", topo.num_cpus); 1395103a8feaSLen Brown } 1396103a8feaSLen Brown 1397c98d5d94SLen Brown 1398103a8feaSLen Brown /* 1399c98d5d94SLen Brown * count_cpus() 1400c98d5d94SLen Brown * remember the last one seen, it will be the max 1401103a8feaSLen Brown */ 1402c98d5d94SLen Brown int count_cpus(int cpu) 1403103a8feaSLen Brown { 1404c98d5d94SLen Brown if (topo.max_cpu_num < cpu) 1405c98d5d94SLen Brown topo.max_cpu_num = cpu; 1406103a8feaSLen Brown 1407c98d5d94SLen Brown topo.num_cpus += 1; 1408c98d5d94SLen Brown return 0; 1409103a8feaSLen Brown } 1410c98d5d94SLen Brown int mark_cpu_present(int cpu) 1411c98d5d94SLen Brown { 1412c98d5d94SLen Brown CPU_SET_S(cpu, cpu_present_setsize, cpu_present_set); 141315aaa346SLen Brown return 0; 1414103a8feaSLen Brown } 1415103a8feaSLen Brown 1416103a8feaSLen Brown void turbostat_loop() 1417103a8feaSLen Brown { 1418c98d5d94SLen Brown int retval; 1419e52966c0SLen Brown int restarted = 0; 1420c98d5d94SLen Brown 1421103a8feaSLen Brown restart: 1422e52966c0SLen Brown restarted++; 1423e52966c0SLen Brown 1424c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 1425d91bb17cSLen Brown if (retval < -1) { 1426d91bb17cSLen Brown exit(retval); 1427d91bb17cSLen Brown } else if (retval == -1) { 1428e52966c0SLen Brown if (restarted > 1) { 1429e52966c0SLen Brown exit(retval); 1430e52966c0SLen Brown } 1431c98d5d94SLen Brown re_initialize(); 1432c98d5d94SLen Brown goto restart; 1433c98d5d94SLen Brown } 1434e52966c0SLen Brown restarted = 0; 1435103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 1436103a8feaSLen Brown 1437103a8feaSLen Brown while (1) { 1438c98d5d94SLen Brown if (for_all_proc_cpus(cpu_is_not_present)) { 1439103a8feaSLen Brown re_initialize(); 1440103a8feaSLen Brown goto restart; 1441103a8feaSLen Brown } 1442103a8feaSLen Brown sleep(interval_sec); 1443c98d5d94SLen Brown retval = for_all_cpus(get_counters, ODD_COUNTERS); 1444d91bb17cSLen Brown if (retval < -1) { 1445d91bb17cSLen Brown exit(retval); 1446d91bb17cSLen Brown } else if (retval == -1) { 144715aaa346SLen Brown re_initialize(); 144815aaa346SLen Brown goto restart; 144915aaa346SLen Brown } 1450103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 1451103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 1452c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 1453c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 1454c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 1455c98d5d94SLen Brown flush_stdout(); 145615aaa346SLen Brown sleep(interval_sec); 1457c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 1458d91bb17cSLen Brown if (retval < -1) { 1459d91bb17cSLen Brown exit(retval); 1460d91bb17cSLen Brown } else if (retval == -1) { 1461103a8feaSLen Brown re_initialize(); 1462103a8feaSLen Brown goto restart; 1463103a8feaSLen Brown } 1464103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 1465103a8feaSLen Brown timersub(&tv_even, &tv_odd, &tv_delta); 1466c98d5d94SLen Brown for_all_cpus_2(delta_cpu, EVEN_COUNTERS, ODD_COUNTERS); 1467c98d5d94SLen Brown compute_average(ODD_COUNTERS); 1468c98d5d94SLen Brown format_all_counters(ODD_COUNTERS); 1469c98d5d94SLen Brown flush_stdout(); 1470103a8feaSLen Brown } 1471103a8feaSLen Brown } 1472103a8feaSLen Brown 1473103a8feaSLen Brown void check_dev_msr() 1474103a8feaSLen Brown { 1475103a8feaSLen Brown struct stat sb; 1476103a8feaSLen Brown 1477b2c95d90SJosh Triplett if (stat("/dev/cpu/0/msr", &sb)) 1478b2c95d90SJosh Triplett err(-5, "no /dev/cpu/0/msr\n" 1479b2c95d90SJosh Triplett "Try \"# modprobe msr\""); 1480103a8feaSLen Brown } 1481103a8feaSLen Brown 1482103a8feaSLen Brown void check_super_user() 1483103a8feaSLen Brown { 1484b2c95d90SJosh Triplett if (getuid() != 0) 1485b2c95d90SJosh Triplett errx(-6, "must be root"); 1486103a8feaSLen Brown } 1487103a8feaSLen Brown 1488103a8feaSLen Brown int has_nehalem_turbo_ratio_limit(unsigned int family, unsigned int model) 1489103a8feaSLen Brown { 1490103a8feaSLen Brown if (!genuine_intel) 1491103a8feaSLen Brown return 0; 1492103a8feaSLen Brown 1493103a8feaSLen Brown if (family != 6) 1494103a8feaSLen Brown return 0; 1495103a8feaSLen Brown 1496103a8feaSLen Brown switch (model) { 1497103a8feaSLen Brown case 0x1A: /* Core i7, Xeon 5500 series - Bloomfield, Gainstown NHM-EP */ 1498103a8feaSLen Brown case 0x1E: /* Core i7 and i5 Processor - Clarksfield, Lynnfield, Jasper Forest */ 1499103a8feaSLen Brown case 0x1F: /* Core i7 and i5 Processor - Nehalem */ 1500103a8feaSLen Brown case 0x25: /* Westmere Client - Clarkdale, Arrandale */ 1501103a8feaSLen Brown case 0x2C: /* Westmere EP - Gulftown */ 1502103a8feaSLen Brown case 0x2A: /* SNB */ 1503103a8feaSLen Brown case 0x2D: /* SNB Xeon */ 1504553575f1SLen Brown case 0x3A: /* IVB */ 15051300651bSLen Brown case 0x3E: /* IVB Xeon */ 150670b43400SLen Brown case 0x3C: /* HSW */ 1507e6f9bb3cSLen Brown case 0x3F: /* HSX */ 150870b43400SLen Brown case 0x45: /* HSW */ 1509149c2319SLen Brown case 0x46: /* HSW */ 1510144b44b1SLen Brown case 0x37: /* BYT */ 1511144b44b1SLen Brown case 0x4D: /* AVN */ 1512103a8feaSLen Brown return 1; 1513103a8feaSLen Brown case 0x2E: /* Nehalem-EX Xeon - Beckton */ 1514103a8feaSLen Brown case 0x2F: /* Westmere-EX Xeon - Eagleton */ 1515103a8feaSLen Brown default: 1516103a8feaSLen Brown return 0; 1517103a8feaSLen Brown } 1518103a8feaSLen Brown } 15196574a5d5SLen Brown int has_ivt_turbo_ratio_limit(unsigned int family, unsigned int model) 15206574a5d5SLen Brown { 15216574a5d5SLen Brown if (!genuine_intel) 15226574a5d5SLen Brown return 0; 15236574a5d5SLen Brown 15246574a5d5SLen Brown if (family != 6) 15256574a5d5SLen Brown return 0; 15266574a5d5SLen Brown 15276574a5d5SLen Brown switch (model) { 15286574a5d5SLen Brown case 0x3E: /* IVB Xeon */ 15296574a5d5SLen Brown return 1; 15306574a5d5SLen Brown default: 15316574a5d5SLen Brown return 0; 15326574a5d5SLen Brown } 15336574a5d5SLen Brown } 15346574a5d5SLen Brown 1535889facbeSLen Brown /* 1536889facbeSLen Brown * print_epb() 1537889facbeSLen Brown * Decode the ENERGY_PERF_BIAS MSR 1538889facbeSLen Brown */ 1539889facbeSLen Brown int print_epb(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1540889facbeSLen Brown { 1541889facbeSLen Brown unsigned long long msr; 1542889facbeSLen Brown char *epb_string; 1543889facbeSLen Brown int cpu; 1544889facbeSLen Brown 1545889facbeSLen Brown if (!has_epb) 1546889facbeSLen Brown return 0; 1547889facbeSLen Brown 1548889facbeSLen Brown cpu = t->cpu_id; 1549889facbeSLen Brown 1550889facbeSLen Brown /* EPB is per-package */ 1551889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1552889facbeSLen Brown return 0; 1553889facbeSLen Brown 1554889facbeSLen Brown if (cpu_migrate(cpu)) { 1555889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1556889facbeSLen Brown return -1; 1557889facbeSLen Brown } 1558889facbeSLen Brown 1559889facbeSLen Brown if (get_msr(cpu, MSR_IA32_ENERGY_PERF_BIAS, &msr)) 1560889facbeSLen Brown return 0; 1561889facbeSLen Brown 1562889facbeSLen Brown switch (msr & 0x7) { 1563889facbeSLen Brown case ENERGY_PERF_BIAS_PERFORMANCE: 1564889facbeSLen Brown epb_string = "performance"; 1565889facbeSLen Brown break; 1566889facbeSLen Brown case ENERGY_PERF_BIAS_NORMAL: 1567889facbeSLen Brown epb_string = "balanced"; 1568889facbeSLen Brown break; 1569889facbeSLen Brown case ENERGY_PERF_BIAS_POWERSAVE: 1570889facbeSLen Brown epb_string = "powersave"; 1571889facbeSLen Brown break; 1572889facbeSLen Brown default: 1573889facbeSLen Brown epb_string = "custom"; 1574889facbeSLen Brown break; 1575889facbeSLen Brown } 1576889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_ENERGY_PERF_BIAS: 0x%08llx (%s)\n", cpu, msr, epb_string); 1577889facbeSLen Brown 1578889facbeSLen Brown return 0; 1579889facbeSLen Brown } 1580889facbeSLen Brown 1581889facbeSLen Brown #define RAPL_POWER_GRANULARITY 0x7FFF /* 15 bit power granularity */ 1582889facbeSLen Brown #define RAPL_TIME_GRANULARITY 0x3F /* 6 bit time granularity */ 1583889facbeSLen Brown 1584144b44b1SLen Brown double get_tdp(model) 1585144b44b1SLen Brown { 1586144b44b1SLen Brown unsigned long long msr; 1587144b44b1SLen Brown 1588144b44b1SLen Brown if (do_rapl & RAPL_PKG_POWER_INFO) 1589144b44b1SLen Brown if (!get_msr(0, MSR_PKG_POWER_INFO, &msr)) 1590144b44b1SLen Brown return ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units; 1591144b44b1SLen Brown 1592144b44b1SLen Brown switch (model) { 1593144b44b1SLen Brown case 0x37: 1594144b44b1SLen Brown case 0x4D: 1595144b44b1SLen Brown return 30.0; 1596144b44b1SLen Brown default: 1597144b44b1SLen Brown return 135.0; 1598144b44b1SLen Brown } 1599144b44b1SLen Brown } 1600144b44b1SLen Brown 1601144b44b1SLen Brown 1602889facbeSLen Brown /* 1603889facbeSLen Brown * rapl_probe() 1604889facbeSLen Brown * 1605144b44b1SLen Brown * sets do_rapl, rapl_power_units, rapl_energy_units, rapl_time_units 1606889facbeSLen Brown */ 1607889facbeSLen Brown void rapl_probe(unsigned int family, unsigned int model) 1608889facbeSLen Brown { 1609889facbeSLen Brown unsigned long long msr; 1610144b44b1SLen Brown unsigned int time_unit; 1611889facbeSLen Brown double tdp; 1612889facbeSLen Brown 1613889facbeSLen Brown if (!genuine_intel) 1614889facbeSLen Brown return; 1615889facbeSLen Brown 1616889facbeSLen Brown if (family != 6) 1617889facbeSLen Brown return; 1618889facbeSLen Brown 1619889facbeSLen Brown switch (model) { 1620889facbeSLen Brown case 0x2A: 1621889facbeSLen Brown case 0x3A: 162270b43400SLen Brown case 0x3C: /* HSW */ 162370b43400SLen Brown case 0x45: /* HSW */ 1624149c2319SLen Brown case 0x46: /* HSW */ 1625144b44b1SLen Brown do_rapl = RAPL_PKG | RAPL_CORES | RAPL_CORE_POLICY | RAPL_GFX | RAPL_PKG_POWER_INFO; 1626889facbeSLen Brown break; 1627e6f9bb3cSLen Brown case 0x3F: /* HSX */ 1628e6f9bb3cSLen Brown do_rapl = RAPL_PKG | RAPL_DRAM | RAPL_DRAM_PERF_STATUS | RAPL_PKG_PERF_STATUS | RAPL_PKG_POWER_INFO; 1629e6f9bb3cSLen Brown break; 1630889facbeSLen Brown case 0x2D: 1631889facbeSLen Brown case 0x3E: 1632144b44b1SLen Brown do_rapl = RAPL_PKG | RAPL_CORES | RAPL_CORE_POLICY | RAPL_DRAM | RAPL_PKG_PERF_STATUS | RAPL_DRAM_PERF_STATUS | RAPL_PKG_POWER_INFO; 1633144b44b1SLen Brown break; 1634144b44b1SLen Brown case 0x37: /* BYT */ 1635144b44b1SLen Brown case 0x4D: /* AVN */ 1636144b44b1SLen Brown do_rapl = RAPL_PKG | RAPL_CORES ; 1637889facbeSLen Brown break; 1638889facbeSLen Brown default: 1639889facbeSLen Brown return; 1640889facbeSLen Brown } 1641889facbeSLen Brown 1642889facbeSLen Brown /* units on package 0, verify later other packages match */ 1643889facbeSLen Brown if (get_msr(0, MSR_RAPL_POWER_UNIT, &msr)) 1644889facbeSLen Brown return; 1645889facbeSLen Brown 1646889facbeSLen Brown rapl_power_units = 1.0 / (1 << (msr & 0xF)); 1647144b44b1SLen Brown if (model == 0x37) 1648144b44b1SLen Brown rapl_energy_units = 1.0 * (1 << (msr >> 8 & 0x1F)) / 1000000; 1649144b44b1SLen Brown else 1650889facbeSLen Brown rapl_energy_units = 1.0 / (1 << (msr >> 8 & 0x1F)); 1651889facbeSLen Brown 1652144b44b1SLen Brown time_unit = msr >> 16 & 0xF; 1653144b44b1SLen Brown if (time_unit == 0) 1654144b44b1SLen Brown time_unit = 0xA; 1655889facbeSLen Brown 1656144b44b1SLen Brown rapl_time_units = 1.0 / (1 << (time_unit)); 1657144b44b1SLen Brown 1658144b44b1SLen Brown tdp = get_tdp(model); 1659889facbeSLen Brown 1660889facbeSLen Brown rapl_joule_counter_range = 0xFFFFFFFF * rapl_energy_units / tdp; 1661889facbeSLen Brown if (verbose) 1662144b44b1SLen Brown fprintf(stderr, "RAPL: %.0f sec. Joule Counter Range, at %.0f Watts\n", rapl_joule_counter_range, tdp); 1663889facbeSLen Brown 1664889facbeSLen Brown return; 1665889facbeSLen Brown } 1666889facbeSLen Brown 1667889facbeSLen Brown int print_thermal(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1668889facbeSLen Brown { 1669889facbeSLen Brown unsigned long long msr; 1670889facbeSLen Brown unsigned int dts; 1671889facbeSLen Brown int cpu; 1672889facbeSLen Brown 1673889facbeSLen Brown if (!(do_dts || do_ptm)) 1674889facbeSLen Brown return 0; 1675889facbeSLen Brown 1676889facbeSLen Brown cpu = t->cpu_id; 1677889facbeSLen Brown 1678889facbeSLen Brown /* DTS is per-core, no need to print for each thread */ 1679889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 1680889facbeSLen Brown return 0; 1681889facbeSLen Brown 1682889facbeSLen Brown if (cpu_migrate(cpu)) { 1683889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1684889facbeSLen Brown return -1; 1685889facbeSLen Brown } 1686889facbeSLen Brown 1687889facbeSLen Brown if (do_ptm && (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) { 1688889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, &msr)) 1689889facbeSLen Brown return 0; 1690889facbeSLen Brown 1691889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1692889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_PACKAGE_THERM_STATUS: 0x%08llx (%d C)\n", 1693889facbeSLen Brown cpu, msr, tcc_activation_temp - dts); 1694889facbeSLen Brown 1695889facbeSLen Brown #ifdef THERM_DEBUG 1696889facbeSLen Brown if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_INTERRUPT, &msr)) 1697889facbeSLen Brown return 0; 1698889facbeSLen Brown 1699889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1700889facbeSLen Brown dts2 = (msr >> 8) & 0x7F; 1701889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_PACKAGE_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n", 1702889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2); 1703889facbeSLen Brown #endif 1704889facbeSLen Brown } 1705889facbeSLen Brown 1706889facbeSLen Brown 1707889facbeSLen Brown if (do_dts) { 1708889facbeSLen Brown unsigned int resolution; 1709889facbeSLen Brown 1710889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr)) 1711889facbeSLen Brown return 0; 1712889facbeSLen Brown 1713889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1714889facbeSLen Brown resolution = (msr >> 27) & 0xF; 1715889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_THERM_STATUS: 0x%08llx (%d C +/- %d)\n", 1716889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, resolution); 1717889facbeSLen Brown 1718889facbeSLen Brown #ifdef THERM_DEBUG 1719889facbeSLen Brown if (get_msr(cpu, MSR_IA32_THERM_INTERRUPT, &msr)) 1720889facbeSLen Brown return 0; 1721889facbeSLen Brown 1722889facbeSLen Brown dts = (msr >> 16) & 0x7F; 1723889facbeSLen Brown dts2 = (msr >> 8) & 0x7F; 1724889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n", 1725889facbeSLen Brown cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2); 1726889facbeSLen Brown #endif 1727889facbeSLen Brown } 1728889facbeSLen Brown 1729889facbeSLen Brown return 0; 1730889facbeSLen Brown } 1731889facbeSLen Brown 1732889facbeSLen Brown void print_power_limit_msr(int cpu, unsigned long long msr, char *label) 1733889facbeSLen Brown { 1734889facbeSLen Brown fprintf(stderr, "cpu%d: %s: %sabled (%f Watts, %f sec, clamp %sabled)\n", 1735889facbeSLen Brown cpu, label, 1736889facbeSLen Brown ((msr >> 15) & 1) ? "EN" : "DIS", 1737889facbeSLen Brown ((msr >> 0) & 0x7FFF) * rapl_power_units, 1738889facbeSLen Brown (1.0 + (((msr >> 22) & 0x3)/4.0)) * (1 << ((msr >> 17) & 0x1F)) * rapl_time_units, 1739889facbeSLen Brown (((msr >> 16) & 1) ? "EN" : "DIS")); 1740889facbeSLen Brown 1741889facbeSLen Brown return; 1742889facbeSLen Brown } 1743889facbeSLen Brown 1744889facbeSLen Brown int print_rapl(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1745889facbeSLen Brown { 1746889facbeSLen Brown unsigned long long msr; 1747889facbeSLen Brown int cpu; 1748889facbeSLen Brown 1749889facbeSLen Brown if (!do_rapl) 1750889facbeSLen Brown return 0; 1751889facbeSLen Brown 1752889facbeSLen Brown /* RAPL counters are per package, so print only for 1st thread/package */ 1753889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1754889facbeSLen Brown return 0; 1755889facbeSLen Brown 1756889facbeSLen Brown cpu = t->cpu_id; 1757889facbeSLen Brown if (cpu_migrate(cpu)) { 1758889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1759889facbeSLen Brown return -1; 1760889facbeSLen Brown } 1761889facbeSLen Brown 1762889facbeSLen Brown if (get_msr(cpu, MSR_RAPL_POWER_UNIT, &msr)) 1763889facbeSLen Brown return -1; 1764889facbeSLen Brown 1765889facbeSLen Brown if (verbose) { 1766889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_RAPL_POWER_UNIT: 0x%08llx " 1767889facbeSLen Brown "(%f Watts, %f Joules, %f sec.)\n", cpu, msr, 1768144b44b1SLen Brown rapl_power_units, rapl_energy_units, rapl_time_units); 1769889facbeSLen Brown } 1770144b44b1SLen Brown if (do_rapl & RAPL_PKG_POWER_INFO) { 1771144b44b1SLen Brown 1772889facbeSLen Brown if (get_msr(cpu, MSR_PKG_POWER_INFO, &msr)) 1773889facbeSLen Brown return -5; 1774889facbeSLen Brown 1775889facbeSLen Brown 1776889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PKG_POWER_INFO: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n", 1777889facbeSLen Brown cpu, msr, 1778889facbeSLen Brown ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1779889facbeSLen Brown ((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1780889facbeSLen Brown ((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1781889facbeSLen Brown ((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units); 1782889facbeSLen Brown 1783144b44b1SLen Brown } 1784144b44b1SLen Brown if (do_rapl & RAPL_PKG) { 1785144b44b1SLen Brown 1786889facbeSLen Brown if (get_msr(cpu, MSR_PKG_POWER_LIMIT, &msr)) 1787889facbeSLen Brown return -9; 1788889facbeSLen Brown 1789889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PKG_POWER_LIMIT: 0x%08llx (%slocked)\n", 1790889facbeSLen Brown cpu, msr, (msr >> 63) & 1 ? "": "UN"); 1791889facbeSLen Brown 1792889facbeSLen Brown print_power_limit_msr(cpu, msr, "PKG Limit #1"); 1793889facbeSLen Brown fprintf(stderr, "cpu%d: PKG Limit #2: %sabled (%f Watts, %f* sec, clamp %sabled)\n", 1794889facbeSLen Brown cpu, 1795889facbeSLen Brown ((msr >> 47) & 1) ? "EN" : "DIS", 1796889facbeSLen Brown ((msr >> 32) & 0x7FFF) * rapl_power_units, 1797889facbeSLen Brown (1.0 + (((msr >> 54) & 0x3)/4.0)) * (1 << ((msr >> 49) & 0x1F)) * rapl_time_units, 1798889facbeSLen Brown ((msr >> 48) & 1) ? "EN" : "DIS"); 1799889facbeSLen Brown } 1800889facbeSLen Brown 1801889facbeSLen Brown if (do_rapl & RAPL_DRAM) { 1802889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_POWER_INFO, &msr)) 1803889facbeSLen Brown return -6; 1804889facbeSLen Brown 1805889facbeSLen Brown 1806889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_DRAM_POWER_INFO,: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n", 1807889facbeSLen Brown cpu, msr, 1808889facbeSLen Brown ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1809889facbeSLen Brown ((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1810889facbeSLen Brown ((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units, 1811889facbeSLen Brown ((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units); 1812889facbeSLen Brown 1813889facbeSLen Brown 1814889facbeSLen Brown if (get_msr(cpu, MSR_DRAM_POWER_LIMIT, &msr)) 1815889facbeSLen Brown return -9; 1816889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_DRAM_POWER_LIMIT: 0x%08llx (%slocked)\n", 1817889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 1818889facbeSLen Brown 1819889facbeSLen Brown print_power_limit_msr(cpu, msr, "DRAM Limit"); 1820889facbeSLen Brown } 1821144b44b1SLen Brown if (do_rapl & RAPL_CORE_POLICY) { 1822889facbeSLen Brown if (verbose) { 1823889facbeSLen Brown if (get_msr(cpu, MSR_PP0_POLICY, &msr)) 1824889facbeSLen Brown return -7; 1825889facbeSLen Brown 1826889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP0_POLICY: %lld\n", cpu, msr & 0xF); 1827144b44b1SLen Brown } 1828144b44b1SLen Brown } 1829144b44b1SLen Brown if (do_rapl & RAPL_CORES) { 1830144b44b1SLen Brown if (verbose) { 1831889facbeSLen Brown 1832889facbeSLen Brown if (get_msr(cpu, MSR_PP0_POWER_LIMIT, &msr)) 1833889facbeSLen Brown return -9; 1834889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP0_POWER_LIMIT: 0x%08llx (%slocked)\n", 1835889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 1836889facbeSLen Brown print_power_limit_msr(cpu, msr, "Cores Limit"); 1837889facbeSLen Brown } 1838889facbeSLen Brown } 1839889facbeSLen Brown if (do_rapl & RAPL_GFX) { 1840889facbeSLen Brown if (verbose) { 1841889facbeSLen Brown if (get_msr(cpu, MSR_PP1_POLICY, &msr)) 1842889facbeSLen Brown return -8; 1843889facbeSLen Brown 1844889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP1_POLICY: %lld\n", cpu, msr & 0xF); 1845889facbeSLen Brown 1846889facbeSLen Brown if (get_msr(cpu, MSR_PP1_POWER_LIMIT, &msr)) 1847889facbeSLen Brown return -9; 1848889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_PP1_POWER_LIMIT: 0x%08llx (%slocked)\n", 1849889facbeSLen Brown cpu, msr, (msr >> 31) & 1 ? "": "UN"); 1850889facbeSLen Brown print_power_limit_msr(cpu, msr, "GFX Limit"); 1851889facbeSLen Brown } 1852889facbeSLen Brown } 1853889facbeSLen Brown return 0; 1854889facbeSLen Brown } 1855889facbeSLen Brown 1856103a8feaSLen Brown 1857103a8feaSLen Brown int is_snb(unsigned int family, unsigned int model) 1858103a8feaSLen Brown { 1859103a8feaSLen Brown if (!genuine_intel) 1860103a8feaSLen Brown return 0; 1861103a8feaSLen Brown 1862103a8feaSLen Brown switch (model) { 1863103a8feaSLen Brown case 0x2A: 1864103a8feaSLen Brown case 0x2D: 1865650a37f3SLen Brown case 0x3A: /* IVB */ 18661300651bSLen Brown case 0x3E: /* IVB Xeon */ 186770b43400SLen Brown case 0x3C: /* HSW */ 186870b43400SLen Brown case 0x3F: /* HSW */ 186970b43400SLen Brown case 0x45: /* HSW */ 1870149c2319SLen Brown case 0x46: /* HSW */ 1871103a8feaSLen Brown return 1; 1872103a8feaSLen Brown } 1873103a8feaSLen Brown return 0; 1874103a8feaSLen Brown } 1875103a8feaSLen Brown 1876ca58710fSKristen Carlson Accardi int has_c8_c9_c10(unsigned int family, unsigned int model) 1877ca58710fSKristen Carlson Accardi { 1878ca58710fSKristen Carlson Accardi if (!genuine_intel) 1879ca58710fSKristen Carlson Accardi return 0; 1880ca58710fSKristen Carlson Accardi 1881ca58710fSKristen Carlson Accardi switch (model) { 1882ca58710fSKristen Carlson Accardi case 0x45: 1883ca58710fSKristen Carlson Accardi return 1; 1884ca58710fSKristen Carlson Accardi } 1885ca58710fSKristen Carlson Accardi return 0; 1886ca58710fSKristen Carlson Accardi } 1887ca58710fSKristen Carlson Accardi 1888ca58710fSKristen Carlson Accardi 1889144b44b1SLen Brown int is_slm(unsigned int family, unsigned int model) 1890144b44b1SLen Brown { 1891144b44b1SLen Brown if (!genuine_intel) 1892144b44b1SLen Brown return 0; 1893144b44b1SLen Brown switch (model) { 1894144b44b1SLen Brown case 0x37: /* BYT */ 1895144b44b1SLen Brown case 0x4D: /* AVN */ 1896144b44b1SLen Brown return 1; 1897144b44b1SLen Brown } 1898144b44b1SLen Brown return 0; 1899144b44b1SLen Brown } 1900144b44b1SLen Brown 1901144b44b1SLen Brown #define SLM_BCLK_FREQS 5 1902144b44b1SLen Brown double slm_freq_table[SLM_BCLK_FREQS] = { 83.3, 100.0, 133.3, 116.7, 80.0}; 1903144b44b1SLen Brown 1904144b44b1SLen Brown double slm_bclk(void) 1905144b44b1SLen Brown { 1906144b44b1SLen Brown unsigned long long msr = 3; 1907144b44b1SLen Brown unsigned int i; 1908144b44b1SLen Brown double freq; 1909144b44b1SLen Brown 1910144b44b1SLen Brown if (get_msr(0, MSR_FSB_FREQ, &msr)) 1911144b44b1SLen Brown fprintf(stderr, "SLM BCLK: unknown\n"); 1912144b44b1SLen Brown 1913144b44b1SLen Brown i = msr & 0xf; 1914144b44b1SLen Brown if (i >= SLM_BCLK_FREQS) { 1915144b44b1SLen Brown fprintf(stderr, "SLM BCLK[%d] invalid\n", i); 1916144b44b1SLen Brown msr = 3; 1917144b44b1SLen Brown } 1918144b44b1SLen Brown freq = slm_freq_table[i]; 1919144b44b1SLen Brown 1920144b44b1SLen Brown fprintf(stderr, "SLM BCLK: %.1f Mhz\n", freq); 1921144b44b1SLen Brown 1922144b44b1SLen Brown return freq; 1923144b44b1SLen Brown } 1924144b44b1SLen Brown 1925103a8feaSLen Brown double discover_bclk(unsigned int family, unsigned int model) 1926103a8feaSLen Brown { 1927103a8feaSLen Brown if (is_snb(family, model)) 1928103a8feaSLen Brown return 100.00; 1929144b44b1SLen Brown else if (is_slm(family, model)) 1930144b44b1SLen Brown return slm_bclk(); 1931103a8feaSLen Brown else 1932103a8feaSLen Brown return 133.33; 1933103a8feaSLen Brown } 1934103a8feaSLen Brown 1935889facbeSLen Brown /* 1936889facbeSLen Brown * MSR_IA32_TEMPERATURE_TARGET indicates the temperature where 1937889facbeSLen Brown * the Thermal Control Circuit (TCC) activates. 1938889facbeSLen Brown * This is usually equal to tjMax. 1939889facbeSLen Brown * 1940889facbeSLen Brown * Older processors do not have this MSR, so there we guess, 1941889facbeSLen Brown * but also allow cmdline over-ride with -T. 1942889facbeSLen Brown * 1943889facbeSLen Brown * Several MSR temperature values are in units of degrees-C 1944889facbeSLen Brown * below this value, including the Digital Thermal Sensor (DTS), 1945889facbeSLen Brown * Package Thermal Management Sensor (PTM), and thermal event thresholds. 1946889facbeSLen Brown */ 1947889facbeSLen Brown int set_temperature_target(struct thread_data *t, struct core_data *c, struct pkg_data *p) 1948889facbeSLen Brown { 1949889facbeSLen Brown unsigned long long msr; 1950889facbeSLen Brown unsigned int target_c_local; 1951889facbeSLen Brown int cpu; 1952889facbeSLen Brown 1953889facbeSLen Brown /* tcc_activation_temp is used only for dts or ptm */ 1954889facbeSLen Brown if (!(do_dts || do_ptm)) 1955889facbeSLen Brown return 0; 1956889facbeSLen Brown 1957889facbeSLen Brown /* this is a per-package concept */ 1958889facbeSLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 1959889facbeSLen Brown return 0; 1960889facbeSLen Brown 1961889facbeSLen Brown cpu = t->cpu_id; 1962889facbeSLen Brown if (cpu_migrate(cpu)) { 1963889facbeSLen Brown fprintf(stderr, "Could not migrate to CPU %d\n", cpu); 1964889facbeSLen Brown return -1; 1965889facbeSLen Brown } 1966889facbeSLen Brown 1967889facbeSLen Brown if (tcc_activation_temp_override != 0) { 1968889facbeSLen Brown tcc_activation_temp = tcc_activation_temp_override; 1969889facbeSLen Brown fprintf(stderr, "cpu%d: Using cmdline TCC Target (%d C)\n", 1970889facbeSLen Brown cpu, tcc_activation_temp); 1971889facbeSLen Brown return 0; 1972889facbeSLen Brown } 1973889facbeSLen Brown 1974889facbeSLen Brown /* Temperature Target MSR is Nehalem and newer only */ 1975889facbeSLen Brown if (!do_nehalem_platform_info) 1976889facbeSLen Brown goto guess; 1977889facbeSLen Brown 1978889facbeSLen Brown if (get_msr(0, MSR_IA32_TEMPERATURE_TARGET, &msr)) 1979889facbeSLen Brown goto guess; 1980889facbeSLen Brown 1981889facbeSLen Brown target_c_local = (msr >> 16) & 0x7F; 1982889facbeSLen Brown 1983889facbeSLen Brown if (verbose) 1984889facbeSLen Brown fprintf(stderr, "cpu%d: MSR_IA32_TEMPERATURE_TARGET: 0x%08llx (%d C)\n", 1985889facbeSLen Brown cpu, msr, target_c_local); 1986889facbeSLen Brown 1987144b44b1SLen Brown if (target_c_local < 85 || target_c_local > 127) 1988889facbeSLen Brown goto guess; 1989889facbeSLen Brown 1990889facbeSLen Brown tcc_activation_temp = target_c_local; 1991889facbeSLen Brown 1992889facbeSLen Brown return 0; 1993889facbeSLen Brown 1994889facbeSLen Brown guess: 1995889facbeSLen Brown tcc_activation_temp = TJMAX_DEFAULT; 1996889facbeSLen Brown fprintf(stderr, "cpu%d: Guessing tjMax %d C, Please use -T to specify\n", 1997889facbeSLen Brown cpu, tcc_activation_temp); 1998889facbeSLen Brown 1999889facbeSLen Brown return 0; 2000889facbeSLen Brown } 2001103a8feaSLen Brown void check_cpuid() 2002103a8feaSLen Brown { 2003103a8feaSLen Brown unsigned int eax, ebx, ecx, edx, max_level; 2004103a8feaSLen Brown unsigned int fms, family, model, stepping; 2005103a8feaSLen Brown 2006103a8feaSLen Brown eax = ebx = ecx = edx = 0; 2007103a8feaSLen Brown 20082b92865eSJosh Triplett __get_cpuid(0, &max_level, &ebx, &ecx, &edx); 2009103a8feaSLen Brown 2010103a8feaSLen Brown if (ebx == 0x756e6547 && edx == 0x49656e69 && ecx == 0x6c65746e) 2011103a8feaSLen Brown genuine_intel = 1; 2012103a8feaSLen Brown 2013103a8feaSLen Brown if (verbose) 2014889facbeSLen Brown fprintf(stderr, "CPUID(0): %.4s%.4s%.4s ", 2015103a8feaSLen Brown (char *)&ebx, (char *)&edx, (char *)&ecx); 2016103a8feaSLen Brown 20172b92865eSJosh Triplett __get_cpuid(1, &fms, &ebx, &ecx, &edx); 2018103a8feaSLen Brown family = (fms >> 8) & 0xf; 2019103a8feaSLen Brown model = (fms >> 4) & 0xf; 2020103a8feaSLen Brown stepping = fms & 0xf; 2021103a8feaSLen Brown if (family == 6 || family == 0xf) 2022103a8feaSLen Brown model += ((fms >> 16) & 0xf) << 4; 2023103a8feaSLen Brown 2024103a8feaSLen Brown if (verbose) 2025103a8feaSLen Brown fprintf(stderr, "%d CPUID levels; family:model:stepping 0x%x:%x:%x (%d:%d:%d)\n", 2026103a8feaSLen Brown max_level, family, model, stepping, family, model, stepping); 2027103a8feaSLen Brown 2028b2c95d90SJosh Triplett if (!(edx & (1 << 5))) 2029b2c95d90SJosh Triplett errx(1, "CPUID: no MSR"); 2030103a8feaSLen Brown 2031103a8feaSLen Brown /* 2032103a8feaSLen Brown * check max extended function levels of CPUID. 2033103a8feaSLen Brown * This is needed to check for invariant TSC. 2034103a8feaSLen Brown * This check is valid for both Intel and AMD. 2035103a8feaSLen Brown */ 2036103a8feaSLen Brown ebx = ecx = edx = 0; 20372b92865eSJosh Triplett __get_cpuid(0x80000000, &max_level, &ebx, &ecx, &edx); 2038103a8feaSLen Brown 2039b2c95d90SJosh Triplett if (max_level < 0x80000007) 2040b2c95d90SJosh Triplett errx(1, "CPUID: no invariant TSC (max_level 0x%x)", max_level); 2041103a8feaSLen Brown 2042103a8feaSLen Brown /* 2043103a8feaSLen Brown * Non-Stop TSC is advertised by CPUID.EAX=0x80000007: EDX.bit8 2044103a8feaSLen Brown * this check is valid for both Intel and AMD 2045103a8feaSLen Brown */ 20462b92865eSJosh Triplett __get_cpuid(0x80000007, &eax, &ebx, &ecx, &edx); 20478209e054SThomas Renninger has_invariant_tsc = edx & (1 << 8); 2048103a8feaSLen Brown 2049b2c95d90SJosh Triplett if (!has_invariant_tsc) 2050b2c95d90SJosh Triplett errx(1, "No invariant TSC"); 2051103a8feaSLen Brown 2052103a8feaSLen Brown /* 2053103a8feaSLen Brown * APERF/MPERF is advertised by CPUID.EAX=0x6: ECX.bit0 2054103a8feaSLen Brown * this check is valid for both Intel and AMD 2055103a8feaSLen Brown */ 2056103a8feaSLen Brown 20572b92865eSJosh Triplett __get_cpuid(0x6, &eax, &ebx, &ecx, &edx); 20588209e054SThomas Renninger has_aperf = ecx & (1 << 0); 2059889facbeSLen Brown do_dts = eax & (1 << 0); 2060889facbeSLen Brown do_ptm = eax & (1 << 6); 2061889facbeSLen Brown has_epb = ecx & (1 << 3); 2062889facbeSLen Brown 2063889facbeSLen Brown if (verbose) 2064889facbeSLen Brown fprintf(stderr, "CPUID(6): %s%s%s%s\n", 2065889facbeSLen Brown has_aperf ? "APERF" : "No APERF!", 2066889facbeSLen Brown do_dts ? ", DTS" : "", 2067889facbeSLen Brown do_ptm ? ", PTM": "", 2068889facbeSLen Brown has_epb ? ", EPB": ""); 2069889facbeSLen Brown 2070889facbeSLen Brown if (!has_aperf) 2071b2c95d90SJosh Triplett errx(-1, "No APERF"); 2072103a8feaSLen Brown 2073103a8feaSLen Brown do_nehalem_platform_info = genuine_intel && has_invariant_tsc; 2074103a8feaSLen Brown do_nhm_cstates = genuine_intel; /* all Intel w/ non-stop TSC have NHM counters */ 20751ed51011SLen Brown do_smi = do_nhm_cstates; 2076103a8feaSLen Brown do_snb_cstates = is_snb(family, model); 2077ca58710fSKristen Carlson Accardi do_c8_c9_c10 = has_c8_c9_c10(family, model); 2078144b44b1SLen Brown do_slm_cstates = is_slm(family, model); 2079103a8feaSLen Brown bclk = discover_bclk(family, model); 2080103a8feaSLen Brown 2081103a8feaSLen Brown do_nehalem_turbo_ratio_limit = has_nehalem_turbo_ratio_limit(family, model); 20826574a5d5SLen Brown do_ivt_turbo_ratio_limit = has_ivt_turbo_ratio_limit(family, model); 2083889facbeSLen Brown rapl_probe(family, model); 2084889facbeSLen Brown 2085889facbeSLen Brown return; 2086103a8feaSLen Brown } 2087103a8feaSLen Brown 2088103a8feaSLen Brown 2089103a8feaSLen Brown void usage() 2090103a8feaSLen Brown { 2091*f591c38bSAndy Shevchenko errx(1, "%s: [-v][-R][-T][-p|-P|-S][-c MSR#][-C MSR#][-m MSR#][-M MSR#][-i interval_sec | command ...]\n", 2092103a8feaSLen Brown progname); 2093103a8feaSLen Brown } 2094103a8feaSLen Brown 2095103a8feaSLen Brown 2096103a8feaSLen Brown /* 2097103a8feaSLen Brown * in /dev/cpu/ return success for names that are numbers 2098103a8feaSLen Brown * ie. filter out ".", "..", "microcode". 2099103a8feaSLen Brown */ 2100103a8feaSLen Brown int dir_filter(const struct dirent *dirp) 2101103a8feaSLen Brown { 2102103a8feaSLen Brown if (isdigit(dirp->d_name[0])) 2103103a8feaSLen Brown return 1; 2104103a8feaSLen Brown else 2105103a8feaSLen Brown return 0; 2106103a8feaSLen Brown } 2107103a8feaSLen Brown 2108103a8feaSLen Brown int open_dev_cpu_msr(int dummy1) 2109103a8feaSLen Brown { 2110103a8feaSLen Brown return 0; 2111103a8feaSLen Brown } 2112103a8feaSLen Brown 2113c98d5d94SLen Brown void topology_probe() 2114c98d5d94SLen Brown { 2115c98d5d94SLen Brown int i; 2116c98d5d94SLen Brown int max_core_id = 0; 2117c98d5d94SLen Brown int max_package_id = 0; 2118c98d5d94SLen Brown int max_siblings = 0; 2119c98d5d94SLen Brown struct cpu_topology { 2120c98d5d94SLen Brown int core_id; 2121c98d5d94SLen Brown int physical_package_id; 2122c98d5d94SLen Brown } *cpus; 2123c98d5d94SLen Brown 2124c98d5d94SLen Brown /* Initialize num_cpus, max_cpu_num */ 2125c98d5d94SLen Brown topo.num_cpus = 0; 2126c98d5d94SLen Brown topo.max_cpu_num = 0; 2127c98d5d94SLen Brown for_all_proc_cpus(count_cpus); 2128c98d5d94SLen Brown if (!summary_only && topo.num_cpus > 1) 2129c98d5d94SLen Brown show_cpu = 1; 2130c98d5d94SLen Brown 2131c98d5d94SLen Brown if (verbose > 1) 2132c98d5d94SLen Brown fprintf(stderr, "num_cpus %d max_cpu_num %d\n", topo.num_cpus, topo.max_cpu_num); 2133c98d5d94SLen Brown 2134c98d5d94SLen Brown cpus = calloc(1, (topo.max_cpu_num + 1) * sizeof(struct cpu_topology)); 2135b2c95d90SJosh Triplett if (cpus == NULL) 2136b2c95d90SJosh Triplett err(1, "calloc cpus"); 2137c98d5d94SLen Brown 2138c98d5d94SLen Brown /* 2139c98d5d94SLen Brown * Allocate and initialize cpu_present_set 2140c98d5d94SLen Brown */ 2141c98d5d94SLen Brown cpu_present_set = CPU_ALLOC((topo.max_cpu_num + 1)); 2142b2c95d90SJosh Triplett if (cpu_present_set == NULL) 2143b2c95d90SJosh Triplett err(3, "CPU_ALLOC"); 2144c98d5d94SLen Brown cpu_present_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 2145c98d5d94SLen Brown CPU_ZERO_S(cpu_present_setsize, cpu_present_set); 2146c98d5d94SLen Brown for_all_proc_cpus(mark_cpu_present); 2147c98d5d94SLen Brown 2148c98d5d94SLen Brown /* 2149c98d5d94SLen Brown * Allocate and initialize cpu_affinity_set 2150c98d5d94SLen Brown */ 2151c98d5d94SLen Brown cpu_affinity_set = CPU_ALLOC((topo.max_cpu_num + 1)); 2152b2c95d90SJosh Triplett if (cpu_affinity_set == NULL) 2153b2c95d90SJosh Triplett err(3, "CPU_ALLOC"); 2154c98d5d94SLen Brown cpu_affinity_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 2155c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 2156c98d5d94SLen Brown 2157c98d5d94SLen Brown 2158c98d5d94SLen Brown /* 2159c98d5d94SLen Brown * For online cpus 2160c98d5d94SLen Brown * find max_core_id, max_package_id 2161c98d5d94SLen Brown */ 2162c98d5d94SLen Brown for (i = 0; i <= topo.max_cpu_num; ++i) { 2163c98d5d94SLen Brown int siblings; 2164c98d5d94SLen Brown 2165c98d5d94SLen Brown if (cpu_is_not_present(i)) { 2166c98d5d94SLen Brown if (verbose > 1) 2167c98d5d94SLen Brown fprintf(stderr, "cpu%d NOT PRESENT\n", i); 2168c98d5d94SLen Brown continue; 2169c98d5d94SLen Brown } 2170c98d5d94SLen Brown cpus[i].core_id = get_core_id(i); 2171c98d5d94SLen Brown if (cpus[i].core_id > max_core_id) 2172c98d5d94SLen Brown max_core_id = cpus[i].core_id; 2173c98d5d94SLen Brown 2174c98d5d94SLen Brown cpus[i].physical_package_id = get_physical_package_id(i); 2175c98d5d94SLen Brown if (cpus[i].physical_package_id > max_package_id) 2176c98d5d94SLen Brown max_package_id = cpus[i].physical_package_id; 2177c98d5d94SLen Brown 2178c98d5d94SLen Brown siblings = get_num_ht_siblings(i); 2179c98d5d94SLen Brown if (siblings > max_siblings) 2180c98d5d94SLen Brown max_siblings = siblings; 2181c98d5d94SLen Brown if (verbose > 1) 2182c98d5d94SLen Brown fprintf(stderr, "cpu %d pkg %d core %d\n", 2183c98d5d94SLen Brown i, cpus[i].physical_package_id, cpus[i].core_id); 2184c98d5d94SLen Brown } 2185c98d5d94SLen Brown topo.num_cores_per_pkg = max_core_id + 1; 2186c98d5d94SLen Brown if (verbose > 1) 2187c98d5d94SLen Brown fprintf(stderr, "max_core_id %d, sizing for %d cores per package\n", 2188c98d5d94SLen Brown max_core_id, topo.num_cores_per_pkg); 2189c98d5d94SLen Brown if (!summary_only && topo.num_cores_per_pkg > 1) 2190c98d5d94SLen Brown show_core = 1; 2191c98d5d94SLen Brown 2192c98d5d94SLen Brown topo.num_packages = max_package_id + 1; 2193c98d5d94SLen Brown if (verbose > 1) 2194c98d5d94SLen Brown fprintf(stderr, "max_package_id %d, sizing for %d packages\n", 2195c98d5d94SLen Brown max_package_id, topo.num_packages); 2196c98d5d94SLen Brown if (!summary_only && topo.num_packages > 1) 2197c98d5d94SLen Brown show_pkg = 1; 2198c98d5d94SLen Brown 2199c98d5d94SLen Brown topo.num_threads_per_core = max_siblings; 2200c98d5d94SLen Brown if (verbose > 1) 2201c98d5d94SLen Brown fprintf(stderr, "max_siblings %d\n", max_siblings); 2202c98d5d94SLen Brown 2203c98d5d94SLen Brown free(cpus); 2204c98d5d94SLen Brown } 2205c98d5d94SLen Brown 2206c98d5d94SLen Brown void 2207c98d5d94SLen Brown allocate_counters(struct thread_data **t, struct core_data **c, struct pkg_data **p) 2208c98d5d94SLen Brown { 2209c98d5d94SLen Brown int i; 2210c98d5d94SLen Brown 2211c98d5d94SLen Brown *t = calloc(topo.num_threads_per_core * topo.num_cores_per_pkg * 2212c98d5d94SLen Brown topo.num_packages, sizeof(struct thread_data)); 2213c98d5d94SLen Brown if (*t == NULL) 2214c98d5d94SLen Brown goto error; 2215c98d5d94SLen Brown 2216c98d5d94SLen Brown for (i = 0; i < topo.num_threads_per_core * 2217c98d5d94SLen Brown topo.num_cores_per_pkg * topo.num_packages; i++) 2218c98d5d94SLen Brown (*t)[i].cpu_id = -1; 2219c98d5d94SLen Brown 2220c98d5d94SLen Brown *c = calloc(topo.num_cores_per_pkg * topo.num_packages, 2221c98d5d94SLen Brown sizeof(struct core_data)); 2222c98d5d94SLen Brown if (*c == NULL) 2223c98d5d94SLen Brown goto error; 2224c98d5d94SLen Brown 2225c98d5d94SLen Brown for (i = 0; i < topo.num_cores_per_pkg * topo.num_packages; i++) 2226c98d5d94SLen Brown (*c)[i].core_id = -1; 2227c98d5d94SLen Brown 2228c98d5d94SLen Brown *p = calloc(topo.num_packages, sizeof(struct pkg_data)); 2229c98d5d94SLen Brown if (*p == NULL) 2230c98d5d94SLen Brown goto error; 2231c98d5d94SLen Brown 2232c98d5d94SLen Brown for (i = 0; i < topo.num_packages; i++) 2233c98d5d94SLen Brown (*p)[i].package_id = i; 2234c98d5d94SLen Brown 2235c98d5d94SLen Brown return; 2236c98d5d94SLen Brown error: 2237b2c95d90SJosh Triplett err(1, "calloc counters"); 2238c98d5d94SLen Brown } 2239c98d5d94SLen Brown /* 2240c98d5d94SLen Brown * init_counter() 2241c98d5d94SLen Brown * 2242c98d5d94SLen Brown * set cpu_id, core_num, pkg_num 2243c98d5d94SLen Brown * set FIRST_THREAD_IN_CORE and FIRST_CORE_IN_PACKAGE 2244c98d5d94SLen Brown * 2245c98d5d94SLen Brown * increment topo.num_cores when 1st core in pkg seen 2246c98d5d94SLen Brown */ 2247c98d5d94SLen Brown void init_counter(struct thread_data *thread_base, struct core_data *core_base, 2248c98d5d94SLen Brown struct pkg_data *pkg_base, int thread_num, int core_num, 2249c98d5d94SLen Brown int pkg_num, int cpu_id) 2250c98d5d94SLen Brown { 2251c98d5d94SLen Brown struct thread_data *t; 2252c98d5d94SLen Brown struct core_data *c; 2253c98d5d94SLen Brown struct pkg_data *p; 2254c98d5d94SLen Brown 2255c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_num, core_num, pkg_num); 2256c98d5d94SLen Brown c = GET_CORE(core_base, core_num, pkg_num); 2257c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_num); 2258c98d5d94SLen Brown 2259c98d5d94SLen Brown t->cpu_id = cpu_id; 2260c98d5d94SLen Brown if (thread_num == 0) { 2261c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_THREAD_IN_CORE; 2262c98d5d94SLen Brown if (cpu_is_first_core_in_package(cpu_id)) 2263c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_CORE_IN_PACKAGE; 2264c98d5d94SLen Brown } 2265c98d5d94SLen Brown 2266c98d5d94SLen Brown c->core_id = core_num; 2267c98d5d94SLen Brown p->package_id = pkg_num; 2268c98d5d94SLen Brown } 2269c98d5d94SLen Brown 2270c98d5d94SLen Brown 2271c98d5d94SLen Brown int initialize_counters(int cpu_id) 2272c98d5d94SLen Brown { 2273c98d5d94SLen Brown int my_thread_id, my_core_id, my_package_id; 2274c98d5d94SLen Brown 2275c98d5d94SLen Brown my_package_id = get_physical_package_id(cpu_id); 2276c98d5d94SLen Brown my_core_id = get_core_id(cpu_id); 2277c98d5d94SLen Brown 2278c98d5d94SLen Brown if (cpu_is_first_sibling_in_core(cpu_id)) { 2279c98d5d94SLen Brown my_thread_id = 0; 2280c98d5d94SLen Brown topo.num_cores++; 2281c98d5d94SLen Brown } else { 2282c98d5d94SLen Brown my_thread_id = 1; 2283c98d5d94SLen Brown } 2284c98d5d94SLen Brown 2285c98d5d94SLen Brown init_counter(EVEN_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 2286c98d5d94SLen Brown init_counter(ODD_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 2287c98d5d94SLen Brown return 0; 2288c98d5d94SLen Brown } 2289c98d5d94SLen Brown 2290c98d5d94SLen Brown void allocate_output_buffer() 2291c98d5d94SLen Brown { 2292b844db31SJosh Triplett output_buffer = calloc(1, (1 + topo.num_cpus) * 256); 2293c98d5d94SLen Brown outp = output_buffer; 2294b2c95d90SJosh Triplett if (outp == NULL) 2295b2c95d90SJosh Triplett err(-1, "calloc output buffer"); 2296c98d5d94SLen Brown } 2297c98d5d94SLen Brown 2298c98d5d94SLen Brown void setup_all_buffers(void) 2299c98d5d94SLen Brown { 2300c98d5d94SLen Brown topology_probe(); 2301c98d5d94SLen Brown allocate_counters(&thread_even, &core_even, &package_even); 2302c98d5d94SLen Brown allocate_counters(&thread_odd, &core_odd, &package_odd); 2303c98d5d94SLen Brown allocate_output_buffer(); 2304c98d5d94SLen Brown for_all_proc_cpus(initialize_counters); 2305c98d5d94SLen Brown } 2306103a8feaSLen Brown void turbostat_init() 2307103a8feaSLen Brown { 2308103a8feaSLen Brown check_cpuid(); 2309103a8feaSLen Brown 2310103a8feaSLen Brown check_dev_msr(); 2311103a8feaSLen Brown check_super_user(); 2312103a8feaSLen Brown 2313c98d5d94SLen Brown setup_all_buffers(); 2314103a8feaSLen Brown 2315103a8feaSLen Brown if (verbose) 2316c98d5d94SLen Brown print_verbose_header(); 2317889facbeSLen Brown 2318889facbeSLen Brown if (verbose) 2319889facbeSLen Brown for_all_cpus(print_epb, ODD_COUNTERS); 2320889facbeSLen Brown 2321889facbeSLen Brown if (verbose) 2322889facbeSLen Brown for_all_cpus(print_rapl, ODD_COUNTERS); 2323889facbeSLen Brown 2324889facbeSLen Brown for_all_cpus(set_temperature_target, ODD_COUNTERS); 2325889facbeSLen Brown 2326889facbeSLen Brown if (verbose) 2327889facbeSLen Brown for_all_cpus(print_thermal, ODD_COUNTERS); 2328103a8feaSLen Brown } 2329103a8feaSLen Brown 2330103a8feaSLen Brown int fork_it(char **argv) 2331103a8feaSLen Brown { 2332103a8feaSLen Brown pid_t child_pid; 2333d91bb17cSLen Brown int status; 2334d15cf7c1SLen Brown 2335d91bb17cSLen Brown status = for_all_cpus(get_counters, EVEN_COUNTERS); 2336d91bb17cSLen Brown if (status) 2337d91bb17cSLen Brown exit(status); 2338d15cf7c1SLen Brown /* clear affinity side-effect of get_counters() */ 2339d15cf7c1SLen Brown sched_setaffinity(0, cpu_present_setsize, cpu_present_set); 2340103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 2341103a8feaSLen Brown 2342103a8feaSLen Brown child_pid = fork(); 2343103a8feaSLen Brown if (!child_pid) { 2344103a8feaSLen Brown /* child */ 2345103a8feaSLen Brown execvp(argv[0], argv); 2346103a8feaSLen Brown } else { 2347103a8feaSLen Brown 2348103a8feaSLen Brown /* parent */ 2349b2c95d90SJosh Triplett if (child_pid == -1) 2350b2c95d90SJosh Triplett err(1, "fork"); 2351103a8feaSLen Brown 2352103a8feaSLen Brown signal(SIGINT, SIG_IGN); 2353103a8feaSLen Brown signal(SIGQUIT, SIG_IGN); 2354b2c95d90SJosh Triplett if (waitpid(child_pid, &status, 0) == -1) 2355b2c95d90SJosh Triplett err(status, "waitpid"); 2356103a8feaSLen Brown } 2357c98d5d94SLen Brown /* 2358c98d5d94SLen Brown * n.b. fork_it() does not check for errors from for_all_cpus() 2359c98d5d94SLen Brown * because re-starting is problematic when forking 2360c98d5d94SLen Brown */ 2361c98d5d94SLen Brown for_all_cpus(get_counters, ODD_COUNTERS); 2362103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 2363103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 2364c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 2365c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 2366c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 2367c98d5d94SLen Brown flush_stderr(); 2368103a8feaSLen Brown 23696eab04a8SJustin P. Mattock fprintf(stderr, "%.6f sec\n", tv_delta.tv_sec + tv_delta.tv_usec/1000000.0); 2370103a8feaSLen Brown 2371d91bb17cSLen Brown return status; 2372103a8feaSLen Brown } 2373103a8feaSLen Brown 2374103a8feaSLen Brown void cmdline(int argc, char **argv) 2375103a8feaSLen Brown { 2376103a8feaSLen Brown int opt; 2377103a8feaSLen Brown 2378103a8feaSLen Brown progname = argv[0]; 2379103a8feaSLen Brown 2380*f591c38bSAndy Shevchenko while ((opt = getopt(argc, argv, "+pPSvi:c:C:m:M:RJT:")) != -1) { 2381103a8feaSLen Brown switch (opt) { 2382f9240813SLen Brown case 'p': 2383c98d5d94SLen Brown show_core_only++; 2384c98d5d94SLen Brown break; 2385f9240813SLen Brown case 'P': 2386c98d5d94SLen Brown show_pkg_only++; 2387c98d5d94SLen Brown break; 2388f9240813SLen Brown case 'S': 2389e23da037SLen Brown summary_only++; 2390e23da037SLen Brown break; 2391103a8feaSLen Brown case 'v': 2392103a8feaSLen Brown verbose++; 2393103a8feaSLen Brown break; 2394103a8feaSLen Brown case 'i': 2395103a8feaSLen Brown interval_sec = atoi(optarg); 2396103a8feaSLen Brown break; 2397f9240813SLen Brown case 'c': 23988e180f3cSLen Brown sscanf(optarg, "%x", &extra_delta_offset32); 23998e180f3cSLen Brown break; 2400f9240813SLen Brown case 'C': 24018e180f3cSLen Brown sscanf(optarg, "%x", &extra_delta_offset64); 24028e180f3cSLen Brown break; 24032f32edf1SLen Brown case 'm': 24042f32edf1SLen Brown sscanf(optarg, "%x", &extra_msr_offset32); 24052f32edf1SLen Brown break; 24062f32edf1SLen Brown case 'M': 24072f32edf1SLen Brown sscanf(optarg, "%x", &extra_msr_offset64); 2408103a8feaSLen Brown break; 2409889facbeSLen Brown case 'R': 2410889facbeSLen Brown rapl_verbose++; 2411889facbeSLen Brown break; 2412889facbeSLen Brown case 'T': 2413889facbeSLen Brown tcc_activation_temp_override = atoi(optarg); 2414889facbeSLen Brown break; 24155c56be9aSDirk Brandewie case 'J': 24165c56be9aSDirk Brandewie rapl_joules++; 24175c56be9aSDirk Brandewie break; 24185c56be9aSDirk Brandewie 2419103a8feaSLen Brown default: 2420103a8feaSLen Brown usage(); 2421103a8feaSLen Brown } 2422103a8feaSLen Brown } 2423103a8feaSLen Brown } 2424103a8feaSLen Brown 2425103a8feaSLen Brown int main(int argc, char **argv) 2426103a8feaSLen Brown { 2427103a8feaSLen Brown cmdline(argc, argv); 2428103a8feaSLen Brown 2429889facbeSLen Brown if (verbose) 2430e6f9bb3cSLen Brown fprintf(stderr, "turbostat v3.6 Dec 2, 2013" 2431103a8feaSLen Brown " - Len Brown <lenb@kernel.org>\n"); 2432103a8feaSLen Brown 2433103a8feaSLen Brown turbostat_init(); 2434103a8feaSLen Brown 2435103a8feaSLen Brown /* 2436103a8feaSLen Brown * if any params left, it must be a command to fork 2437103a8feaSLen Brown */ 2438103a8feaSLen Brown if (argc - optind) 2439103a8feaSLen Brown return fork_it(argv + optind); 2440103a8feaSLen Brown else 2441103a8feaSLen Brown turbostat_loop(); 2442103a8feaSLen Brown 2443103a8feaSLen Brown return 0; 2444103a8feaSLen Brown } 2445