/*
 * turbostat -- show CPU frequency and C-state residency
 * on modern Intel turbo-capable processors.
 *
 * Copyright (c) 2012 Intel Corporation.
 * Len Brown <len.brown@intel.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 */

#define _GNU_SOURCE
#include <stdio.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/wait.h>
#include <sys/stat.h>
#include <sys/resource.h>
#include <fcntl.h>
#include <signal.h>
#include <sys/time.h>
#include <stdlib.h>
#include <dirent.h>
#include <string.h>
#include <ctype.h>
#include <sched.h>

#define MSR_TSC	0x10
#define MSR_NEHALEM_PLATFORM_INFO	0xCE
#define MSR_NEHALEM_TURBO_RATIO_LIMIT	0x1AD
#define MSR_APERF	0xE8
#define MSR_MPERF	0xE7
#define MSR_PKG_C2_RESIDENCY	0x60D	/* SNB only */
#define MSR_PKG_C3_RESIDENCY	0x3F8
#define MSR_PKG_C6_RESIDENCY	0x3F9
#define MSR_PKG_C7_RESIDENCY	0x3FA	/* SNB only */
#define MSR_CORE_C3_RESIDENCY	0x3FC
#define MSR_CORE_C6_RESIDENCY	0x3FD
#define MSR_CORE_C7_RESIDENCY	0x3FE	/* SNB only */

char *proc_stat = "/proc/stat";
unsigned int interval_sec = 5;	/* set with -i interval_sec */
unsigned int verbose;		/* set with -v */
unsigned int summary_only;	/* set with -s */
unsigned int skip_c0;
unsigned int skip_c1;
unsigned int do_nhm_cstates;
unsigned int do_snb_cstates;
unsigned int has_aperf;
unsigned int units = 1000000000;	/* Ghz etc */
unsigned int genuine_intel;
unsigned int has_invariant_tsc;
unsigned int do_nehalem_platform_info;
unsigned int do_nehalem_turbo_ratio_limit;
unsigned int extra_msr_offset;
double bclk;
unsigned int show_pkg;
unsigned int show_core;
unsigned int show_cpu;
unsigned int show_pkg_only;
unsigned int show_core_only;
/* output_buffer holds formatted text; outp is the current append position */
char *output_buffer, *outp;

int aperf_mperf_unstable;
int backwards_count;
char *progname;

/* dynamically sized cpu sets and their sizes in bytes (CPU_*_S() macros) */
cpu_set_t *cpu_present_set, *cpu_affinity_set;
size_t cpu_present_setsize, cpu_affinity_setsize;

/* per-thread (logical cpu) counters */
struct thread_data {
	unsigned long long tsc;
	unsigned long long aperf;
	unsigned long long mperf;
	unsigned long long c1;	/* derived */
	unsigned long long extra_msr;
	unsigned int cpu_id;
	unsigned int flags;
#define CPU_IS_FIRST_THREAD_IN_CORE	0x2
#define CPU_IS_FIRST_CORE_IN_PACKAGE	0x4
} *thread_even, *thread_odd;

/* per-core residency counters */
struct core_data {
	unsigned long long c3;
	unsigned long long c6;
	unsigned long long c7;
	unsigned int core_id;
} *core_even, *core_odd;

/* per-package residency counters */
struct pkg_data {
	unsigned long long pc2;
	unsigned long long pc3;
	unsigned long long pc6;
	unsigned long long pc7;
	unsigned int package_id;
} *package_even, *package_odd;

#define ODD_COUNTERS thread_odd, core_odd, package_odd
#define EVEN_COUNTERS thread_even, core_even, package_even

/*
 * Index into the flat counter arrays, which are laid out
 * [package][core][thread] using the dimensions stored in topo.
 * Every macro argument is parenthesized so that arbitrary expressions
 * (e.g. "base + 1" or "cond ? a : b") expand correctly.
 */
#define GET_THREAD(thread_base, thread_no, core_no, pkg_no) \
	((thread_base) + (pkg_no) * topo.num_cores_per_pkg * \
		topo.num_threads_per_core + \
		(core_no) * topo.num_threads_per_core + (thread_no))
#define GET_CORE(core_base, core_no, pkg_no) \
	((core_base) + (pkg_no) * topo.num_cores_per_pkg + (core_no))
#define GET_PKG(pkg_base, pkg_no) ((pkg_base) + (pkg_no))

/* one thread/core/package record each; "average" is filled by compute_average() */
struct system_summary {
	struct thread_data threads;
	struct core_data cores;
	struct pkg_data packages;
} sum, average;


/* system topology dimensions used to size and index the counter arrays */
struct topo_params {
	int num_packages;
	int num_cpus;
	int num_cores;
	int max_cpu_num;
	int num_cores_per_pkg;
	int num_threads_per_core;
} topo;

struct timeval tv_even, tv_odd, tv_delta;

void setup_all_buffers(void);

/*
 * cpu_is_not_present(cpu)
 * return non-zero if cpu is NOT a member of cpu_present_set
 */
int cpu_is_not_present(int cpu)
{
	return !CPU_ISSET_S(cpu, cpu_present_setsize, cpu_present_set);
}
Brown */ 147*c98d5d94SLen Brown 148*c98d5d94SLen Brown int for_all_cpus(int (func)(struct thread_data *, struct core_data *, struct pkg_data *), 149*c98d5d94SLen Brown struct thread_data *thread_base, struct core_data *core_base, struct pkg_data *pkg_base) 150*c98d5d94SLen Brown { 151*c98d5d94SLen Brown int retval, pkg_no, core_no, thread_no; 152*c98d5d94SLen Brown 153*c98d5d94SLen Brown for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) { 154*c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 155*c98d5d94SLen Brown for (thread_no = 0; thread_no < 156*c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 157*c98d5d94SLen Brown struct thread_data *t; 158*c98d5d94SLen Brown struct core_data *c; 159*c98d5d94SLen Brown struct pkg_data *p; 160*c98d5d94SLen Brown 161*c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 162*c98d5d94SLen Brown 163*c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 164*c98d5d94SLen Brown continue; 165*c98d5d94SLen Brown 166*c98d5d94SLen Brown c = GET_CORE(core_base, core_no, pkg_no); 167*c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 168*c98d5d94SLen Brown 169*c98d5d94SLen Brown retval = func(t, c, p); 170*c98d5d94SLen Brown if (retval) 171*c98d5d94SLen Brown return retval; 172*c98d5d94SLen Brown } 173*c98d5d94SLen Brown } 174*c98d5d94SLen Brown } 175d15cf7c1SLen Brown return 0; 176d15cf7c1SLen Brown } 177d15cf7c1SLen Brown 17888c3281fSLen Brown int cpu_migrate(int cpu) 17988c3281fSLen Brown { 180*c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 181*c98d5d94SLen Brown CPU_SET_S(cpu, cpu_affinity_setsize, cpu_affinity_set); 182*c98d5d94SLen Brown if (sched_setaffinity(0, cpu_affinity_setsize, cpu_affinity_set) == -1) 18388c3281fSLen Brown return -1; 18488c3281fSLen Brown else 18588c3281fSLen Brown return 0; 18688c3281fSLen Brown } 18788c3281fSLen Brown 18815aaa346SLen Brown int get_msr(int cpu, off_t offset, unsigned long long *msr) 189103a8feaSLen 
Brown { 190103a8feaSLen Brown ssize_t retval; 191103a8feaSLen Brown char pathname[32]; 192103a8feaSLen Brown int fd; 193103a8feaSLen Brown 194103a8feaSLen Brown sprintf(pathname, "/dev/cpu/%d/msr", cpu); 195103a8feaSLen Brown fd = open(pathname, O_RDONLY); 19615aaa346SLen Brown if (fd < 0) 19715aaa346SLen Brown return -1; 198103a8feaSLen Brown 19915aaa346SLen Brown retval = pread(fd, msr, sizeof *msr, offset); 200103a8feaSLen Brown close(fd); 20115aaa346SLen Brown 20215aaa346SLen Brown if (retval != sizeof *msr) 20315aaa346SLen Brown return -1; 20415aaa346SLen Brown 20515aaa346SLen Brown return 0; 206103a8feaSLen Brown } 207103a8feaSLen Brown 208a829eb4dSLen Brown void print_header(void) 209103a8feaSLen Brown { 210103a8feaSLen Brown if (show_pkg) 211*c98d5d94SLen Brown outp += sprintf(outp, "pk"); 212e23da037SLen Brown if (show_pkg) 213*c98d5d94SLen Brown outp += sprintf(outp, " "); 214103a8feaSLen Brown if (show_core) 215*c98d5d94SLen Brown outp += sprintf(outp, "cor"); 216103a8feaSLen Brown if (show_cpu) 217*c98d5d94SLen Brown outp += sprintf(outp, " CPU"); 218e23da037SLen Brown if (show_pkg || show_core || show_cpu) 219*c98d5d94SLen Brown outp += sprintf(outp, " "); 220103a8feaSLen Brown if (do_nhm_cstates) 221*c98d5d94SLen Brown outp += sprintf(outp, " %%c0"); 222103a8feaSLen Brown if (has_aperf) 223*c98d5d94SLen Brown outp += sprintf(outp, " GHz"); 224*c98d5d94SLen Brown outp += sprintf(outp, " TSC"); 225103a8feaSLen Brown if (do_nhm_cstates) 226*c98d5d94SLen Brown outp += sprintf(outp, " %%c1"); 227103a8feaSLen Brown if (do_nhm_cstates) 228*c98d5d94SLen Brown outp += sprintf(outp, " %%c3"); 229103a8feaSLen Brown if (do_nhm_cstates) 230*c98d5d94SLen Brown outp += sprintf(outp, " %%c6"); 231103a8feaSLen Brown if (do_snb_cstates) 232*c98d5d94SLen Brown outp += sprintf(outp, " %%c7"); 233103a8feaSLen Brown if (do_snb_cstates) 234*c98d5d94SLen Brown outp += sprintf(outp, " %%pc2"); 235103a8feaSLen Brown if (do_nhm_cstates) 236*c98d5d94SLen Brown outp += 
sprintf(outp, " %%pc3"); 237103a8feaSLen Brown if (do_nhm_cstates) 238*c98d5d94SLen Brown outp += sprintf(outp, " %%pc6"); 239103a8feaSLen Brown if (do_snb_cstates) 240*c98d5d94SLen Brown outp += sprintf(outp, " %%pc7"); 241103a8feaSLen Brown if (extra_msr_offset) 242*c98d5d94SLen Brown outp += sprintf(outp, " MSR 0x%x ", extra_msr_offset); 243103a8feaSLen Brown 244*c98d5d94SLen Brown outp += sprintf(outp, "\n"); 245103a8feaSLen Brown } 246103a8feaSLen Brown 247*c98d5d94SLen Brown int dump_counters(struct thread_data *t, struct core_data *c, 248*c98d5d94SLen Brown struct pkg_data *p) 249103a8feaSLen Brown { 250*c98d5d94SLen Brown fprintf(stderr, "t %p, c %p, p %p\n", t, c, p); 251*c98d5d94SLen Brown 252*c98d5d94SLen Brown if (t) { 253*c98d5d94SLen Brown fprintf(stderr, "CPU: %d flags 0x%x\n", t->cpu_id, t->flags); 254*c98d5d94SLen Brown fprintf(stderr, "TSC: %016llX\n", t->tsc); 255*c98d5d94SLen Brown fprintf(stderr, "aperf: %016llX\n", t->aperf); 256*c98d5d94SLen Brown fprintf(stderr, "mperf: %016llX\n", t->mperf); 257*c98d5d94SLen Brown fprintf(stderr, "c1: %016llX\n", t->c1); 258*c98d5d94SLen Brown fprintf(stderr, "msr0x%x: %016llX\n", 259*c98d5d94SLen Brown extra_msr_offset, t->extra_msr); 260103a8feaSLen Brown } 261103a8feaSLen Brown 262*c98d5d94SLen Brown if (c) { 263*c98d5d94SLen Brown fprintf(stderr, "core: %d\n", c->core_id); 264*c98d5d94SLen Brown fprintf(stderr, "c3: %016llX\n", c->c3); 265*c98d5d94SLen Brown fprintf(stderr, "c6: %016llX\n", c->c6); 266*c98d5d94SLen Brown fprintf(stderr, "c7: %016llX\n", c->c7); 267*c98d5d94SLen Brown } 268103a8feaSLen Brown 269*c98d5d94SLen Brown if (p) { 270*c98d5d94SLen Brown fprintf(stderr, "package: %d\n", p->package_id); 271*c98d5d94SLen Brown fprintf(stderr, "pc2: %016llX\n", p->pc2); 272*c98d5d94SLen Brown fprintf(stderr, "pc3: %016llX\n", p->pc3); 273*c98d5d94SLen Brown fprintf(stderr, "pc6: %016llX\n", p->pc6); 274*c98d5d94SLen Brown fprintf(stderr, "pc7: %016llX\n", p->pc7); 275*c98d5d94SLen Brown } 
276*c98d5d94SLen Brown return 0; 277103a8feaSLen Brown } 278103a8feaSLen Brown 279e23da037SLen Brown /* 280e23da037SLen Brown * column formatting convention & formats 281e23da037SLen Brown * package: "pk" 2 columns %2d 282e23da037SLen Brown * core: "cor" 3 columns %3d 283e23da037SLen Brown * CPU: "CPU" 3 columns %3d 284e23da037SLen Brown * GHz: "GHz" 3 columns %3.2 285e23da037SLen Brown * TSC: "TSC" 3 columns %3.2 286e23da037SLen Brown * percentage " %pc3" %6.2 287e23da037SLen Brown */ 288*c98d5d94SLen Brown int format_counters(struct thread_data *t, struct core_data *c, 289*c98d5d94SLen Brown struct pkg_data *p) 290103a8feaSLen Brown { 291103a8feaSLen Brown double interval_float; 292103a8feaSLen Brown 293*c98d5d94SLen Brown /* if showing only 1st thread in core and this isn't one, bail out */ 294*c98d5d94SLen Brown if (show_core_only && !(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 295*c98d5d94SLen Brown return 0; 296*c98d5d94SLen Brown 297*c98d5d94SLen Brown /* if showing only 1st thread in pkg and this isn't one, bail out */ 298*c98d5d94SLen Brown if (show_pkg_only && !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 299*c98d5d94SLen Brown return 0; 300*c98d5d94SLen Brown 301103a8feaSLen Brown interval_float = tv_delta.tv_sec + tv_delta.tv_usec/1000000.0; 302103a8feaSLen Brown 303*c98d5d94SLen Brown /* topo columns, print blanks on 1st (average) line */ 304*c98d5d94SLen Brown if (t == &average.threads) { 305103a8feaSLen Brown if (show_pkg) 306*c98d5d94SLen Brown outp += sprintf(outp, " "); 307e23da037SLen Brown if (show_pkg && show_core) 308*c98d5d94SLen Brown outp += sprintf(outp, " "); 309103a8feaSLen Brown if (show_core) 310*c98d5d94SLen Brown outp += sprintf(outp, " "); 311103a8feaSLen Brown if (show_cpu) 312*c98d5d94SLen Brown outp += sprintf(outp, " " " "); 313103a8feaSLen Brown } else { 314*c98d5d94SLen Brown if (show_pkg) { 315*c98d5d94SLen Brown if (p) 316*c98d5d94SLen Brown outp += sprintf(outp, "%2d", p->package_id); 317*c98d5d94SLen Brown else 
318*c98d5d94SLen Brown outp += sprintf(outp, " "); 319*c98d5d94SLen Brown } 320e23da037SLen Brown if (show_pkg && show_core) 321*c98d5d94SLen Brown outp += sprintf(outp, " "); 322*c98d5d94SLen Brown if (show_core) { 323*c98d5d94SLen Brown if (c) 324*c98d5d94SLen Brown outp += sprintf(outp, "%3d", c->core_id); 325*c98d5d94SLen Brown else 326*c98d5d94SLen Brown outp += sprintf(outp, " "); 327*c98d5d94SLen Brown } 328103a8feaSLen Brown if (show_cpu) 329*c98d5d94SLen Brown outp += sprintf(outp, " %3d", t->cpu_id); 330103a8feaSLen Brown } 331103a8feaSLen Brown 332103a8feaSLen Brown /* %c0 */ 333103a8feaSLen Brown if (do_nhm_cstates) { 334e23da037SLen Brown if (show_pkg || show_core || show_cpu) 335*c98d5d94SLen Brown outp += sprintf(outp, " "); 336103a8feaSLen Brown if (!skip_c0) 337*c98d5d94SLen Brown outp += sprintf(outp, "%6.2f", 100.0 * t->mperf/t->tsc); 338103a8feaSLen Brown else 339*c98d5d94SLen Brown outp += sprintf(outp, " ****"); 340103a8feaSLen Brown } 341103a8feaSLen Brown 342103a8feaSLen Brown /* GHz */ 343103a8feaSLen Brown if (has_aperf) { 344103a8feaSLen Brown if (!aperf_mperf_unstable) { 345*c98d5d94SLen Brown outp += sprintf(outp, " %3.2f", 346*c98d5d94SLen Brown 1.0 * t->tsc / units * t->aperf / 347*c98d5d94SLen Brown t->mperf / interval_float); 348103a8feaSLen Brown } else { 349*c98d5d94SLen Brown if (t->aperf > t->tsc || t->mperf > t->tsc) { 350*c98d5d94SLen Brown outp += sprintf(outp, " ***"); 351103a8feaSLen Brown } else { 352*c98d5d94SLen Brown outp += sprintf(outp, "%3.1f*", 353*c98d5d94SLen Brown 1.0 * t->tsc / 354*c98d5d94SLen Brown units * t->aperf / 355*c98d5d94SLen Brown t->mperf / interval_float); 356103a8feaSLen Brown } 357103a8feaSLen Brown } 358103a8feaSLen Brown } 359103a8feaSLen Brown 360103a8feaSLen Brown /* TSC */ 361*c98d5d94SLen Brown outp += sprintf(outp, "%5.2f", 1.0 * t->tsc/units/interval_float); 362103a8feaSLen Brown 363103a8feaSLen Brown if (do_nhm_cstates) { 364103a8feaSLen Brown if (!skip_c1) 365*c98d5d94SLen Brown outp += 
sprintf(outp, " %6.2f", 100.0 * t->c1/t->tsc); 366103a8feaSLen Brown else 367*c98d5d94SLen Brown outp += sprintf(outp, " ****"); 368103a8feaSLen Brown } 369*c98d5d94SLen Brown 370*c98d5d94SLen Brown /* print per-core data only for 1st thread in core */ 371*c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 372*c98d5d94SLen Brown goto done; 373*c98d5d94SLen Brown 374103a8feaSLen Brown if (do_nhm_cstates) 375*c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * c->c3/t->tsc); 376103a8feaSLen Brown if (do_nhm_cstates) 377*c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * c->c6/t->tsc); 378103a8feaSLen Brown if (do_snb_cstates) 379*c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * c->c7/t->tsc); 380*c98d5d94SLen Brown 381*c98d5d94SLen Brown /* print per-package data only for 1st core in package */ 382*c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 383*c98d5d94SLen Brown goto done; 384*c98d5d94SLen Brown 385103a8feaSLen Brown if (do_snb_cstates) 386*c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc2/t->tsc); 387103a8feaSLen Brown if (do_nhm_cstates) 388*c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc3/t->tsc); 389103a8feaSLen Brown if (do_nhm_cstates) 390*c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc6/t->tsc); 391103a8feaSLen Brown if (do_snb_cstates) 392*c98d5d94SLen Brown outp += sprintf(outp, " %6.2f", 100.0 * p->pc7/t->tsc); 393*c98d5d94SLen Brown done: 394103a8feaSLen Brown if (extra_msr_offset) 395*c98d5d94SLen Brown outp += sprintf(outp, " 0x%016llx", t->extra_msr); 396*c98d5d94SLen Brown outp += sprintf(outp, "\n"); 397*c98d5d94SLen Brown 398*c98d5d94SLen Brown return 0; 399103a8feaSLen Brown } 400103a8feaSLen Brown 401*c98d5d94SLen Brown void flush_stdout() 402103a8feaSLen Brown { 403*c98d5d94SLen Brown fputs(output_buffer, stdout); 404*c98d5d94SLen Brown outp = output_buffer; 405*c98d5d94SLen Brown } 406*c98d5d94SLen Brown void flush_stderr() 
407*c98d5d94SLen Brown { 408*c98d5d94SLen Brown fputs(output_buffer, stderr); 409*c98d5d94SLen Brown outp = output_buffer; 410*c98d5d94SLen Brown } 411*c98d5d94SLen Brown void format_all_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 412*c98d5d94SLen Brown { 413e23da037SLen Brown static int printed; 414103a8feaSLen Brown 415e23da037SLen Brown if (!printed || !summary_only) 416103a8feaSLen Brown print_header(); 417103a8feaSLen Brown 418*c98d5d94SLen Brown if (topo.num_cpus > 1) 419*c98d5d94SLen Brown format_counters(&average.threads, &average.cores, 420*c98d5d94SLen Brown &average.packages); 421103a8feaSLen Brown 422e23da037SLen Brown printed = 1; 423e23da037SLen Brown 424e23da037SLen Brown if (summary_only) 425e23da037SLen Brown return; 426e23da037SLen Brown 427*c98d5d94SLen Brown for_all_cpus(format_counters, t, c, p); 428103a8feaSLen Brown } 429103a8feaSLen Brown 430*c98d5d94SLen Brown void 431*c98d5d94SLen Brown delta_package(struct pkg_data *new, struct pkg_data *old) 432103a8feaSLen Brown { 433*c98d5d94SLen Brown old->pc2 = new->pc2 - old->pc2; 434*c98d5d94SLen Brown old->pc3 = new->pc3 - old->pc3; 435*c98d5d94SLen Brown old->pc6 = new->pc6 - old->pc6; 436*c98d5d94SLen Brown old->pc7 = new->pc7 - old->pc7; 437103a8feaSLen Brown } 438103a8feaSLen Brown 439*c98d5d94SLen Brown void 440*c98d5d94SLen Brown delta_core(struct core_data *new, struct core_data *old) 441*c98d5d94SLen Brown { 442*c98d5d94SLen Brown old->c3 = new->c3 - old->c3; 443*c98d5d94SLen Brown old->c6 = new->c6 - old->c6; 444*c98d5d94SLen Brown old->c7 = new->c7 - old->c7; 445103a8feaSLen Brown } 446*c98d5d94SLen Brown 447*c98d5d94SLen Brown void 448*c98d5d94SLen Brown delta_thread(struct thread_data *new, struct thread_data *old, 449*c98d5d94SLen Brown struct core_data *core_delta) 450*c98d5d94SLen Brown { 451*c98d5d94SLen Brown old->tsc = new->tsc - old->tsc; 452*c98d5d94SLen Brown 453103a8feaSLen Brown /* check for TSC < 1 Mcycles over interval */ 454*c98d5d94SLen Brown 
if (old->tsc < (1000 * 1000)) { 455*c98d5d94SLen Brown fprintf(stderr, "Insanely slow TSC rate, TSC stops in idle?\n"); 456*c98d5d94SLen Brown fprintf(stderr, "You can disable all c-states by booting with \"idle=poll\"\n"); 457*c98d5d94SLen Brown fprintf(stderr, "or just the deep ones with \"processor.max_cstate=1\"\n"); 458103a8feaSLen Brown exit(-3); 459103a8feaSLen Brown } 460103a8feaSLen Brown 461*c98d5d94SLen Brown old->c1 = new->c1 - old->c1; 462*c98d5d94SLen Brown 463*c98d5d94SLen Brown if ((new->aperf > old->aperf) && (new->mperf > old->mperf)) { 464*c98d5d94SLen Brown old->aperf = new->aperf - old->aperf; 465*c98d5d94SLen Brown old->mperf = new->mperf - old->mperf; 466*c98d5d94SLen Brown } else { 467*c98d5d94SLen Brown 468103a8feaSLen Brown if (!aperf_mperf_unstable) { 469103a8feaSLen Brown fprintf(stderr, "%s: APERF or MPERF went backwards *\n", progname); 470103a8feaSLen Brown fprintf(stderr, "* Frequency results do not cover entire interval *\n"); 471103a8feaSLen Brown fprintf(stderr, "* fix this by running Linux-2.6.30 or later *\n"); 472103a8feaSLen Brown 473103a8feaSLen Brown aperf_mperf_unstable = 1; 474103a8feaSLen Brown } 475103a8feaSLen Brown /* 476103a8feaSLen Brown * mperf delta is likely a huge "positive" number 477103a8feaSLen Brown * can not use it for calculating c0 time 478103a8feaSLen Brown */ 479103a8feaSLen Brown skip_c0 = 1; 480103a8feaSLen Brown skip_c1 = 1; 481103a8feaSLen Brown } 482103a8feaSLen Brown 483*c98d5d94SLen Brown 484103a8feaSLen Brown /* 485103a8feaSLen Brown * As mperf and tsc collection are not atomic, 486103a8feaSLen Brown * it is possible for mperf's non-halted cycles 487103a8feaSLen Brown * to exceed TSC's all cycles: show c1 = 0% in that case. 
488103a8feaSLen Brown */ 489*c98d5d94SLen Brown if (old->mperf > old->tsc) 490*c98d5d94SLen Brown old->c1 = 0; 491*c98d5d94SLen Brown else { 492*c98d5d94SLen Brown /* normal case, derive c1 */ 493*c98d5d94SLen Brown old->c1 = old->tsc - old->mperf - core_delta->c3 494*c98d5d94SLen Brown - core_delta->c6 - core_delta->c7; 495*c98d5d94SLen Brown } 496*c98d5d94SLen Brown if (old->mperf == 0) { 497*c98d5d94SLen Brown if (verbose) fprintf(stderr, "cpu%d MPERF 0!\n", old->cpu_id); 498*c98d5d94SLen Brown old->mperf = 1; /* divide by 0 protection */ 499*c98d5d94SLen Brown } 500103a8feaSLen Brown 501103a8feaSLen Brown /* 502103a8feaSLen Brown * for "extra msr", just copy the latest w/o subtracting 503103a8feaSLen Brown */ 504*c98d5d94SLen Brown old->extra_msr = new->extra_msr; 505103a8feaSLen Brown } 506*c98d5d94SLen Brown 507*c98d5d94SLen Brown int delta_cpu(struct thread_data *t, struct core_data *c, 508*c98d5d94SLen Brown struct pkg_data *p, struct thread_data *t2, 509*c98d5d94SLen Brown struct core_data *c2, struct pkg_data *p2) 510*c98d5d94SLen Brown { 511*c98d5d94SLen Brown /* calculate core delta only for 1st thread in core */ 512*c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_THREAD_IN_CORE) 513*c98d5d94SLen Brown delta_core(c, c2); 514*c98d5d94SLen Brown 515*c98d5d94SLen Brown /* always calculate thread delta */ 516*c98d5d94SLen Brown delta_thread(t, t2, c2); /* c2 is core delta */ 517*c98d5d94SLen Brown 518*c98d5d94SLen Brown /* calculate package delta only for 1st core in package */ 519*c98d5d94SLen Brown if (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE) 520*c98d5d94SLen Brown delta_package(p, p2); 521*c98d5d94SLen Brown 522103a8feaSLen Brown return 0; 523103a8feaSLen Brown } 524103a8feaSLen Brown 525*c98d5d94SLen Brown void clear_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 526103a8feaSLen Brown { 527*c98d5d94SLen Brown t->tsc = 0; 528*c98d5d94SLen Brown t->aperf = 0; 529*c98d5d94SLen Brown t->mperf = 0; 530*c98d5d94SLen Brown t->c1 = 0; 
531103a8feaSLen Brown 532*c98d5d94SLen Brown /* tells format_counters to dump all fields from this set */ 533*c98d5d94SLen Brown t->flags = CPU_IS_FIRST_THREAD_IN_CORE | CPU_IS_FIRST_CORE_IN_PACKAGE; 534*c98d5d94SLen Brown 535*c98d5d94SLen Brown c->c3 = 0; 536*c98d5d94SLen Brown c->c6 = 0; 537*c98d5d94SLen Brown c->c7 = 0; 538*c98d5d94SLen Brown 539*c98d5d94SLen Brown p->pc2 = 0; 540*c98d5d94SLen Brown p->pc3 = 0; 541*c98d5d94SLen Brown p->pc6 = 0; 542*c98d5d94SLen Brown p->pc7 = 0; 543103a8feaSLen Brown } 544*c98d5d94SLen Brown int sum_counters(struct thread_data *t, struct core_data *c, 545*c98d5d94SLen Brown struct pkg_data *p) 546103a8feaSLen Brown { 547*c98d5d94SLen Brown average.threads.tsc += t->tsc; 548*c98d5d94SLen Brown average.threads.aperf += t->aperf; 549*c98d5d94SLen Brown average.threads.mperf += t->mperf; 550*c98d5d94SLen Brown average.threads.c1 += t->c1; 55115aaa346SLen Brown 552*c98d5d94SLen Brown /* sum per-core values only for 1st thread in core */ 553*c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 554*c98d5d94SLen Brown return 0; 555*c98d5d94SLen Brown 556*c98d5d94SLen Brown average.cores.c3 += c->c3; 557*c98d5d94SLen Brown average.cores.c6 += c->c6; 558*c98d5d94SLen Brown average.cores.c7 += c->c7; 559*c98d5d94SLen Brown 560*c98d5d94SLen Brown /* sum per-pkg values only for 1st core in pkg */ 561*c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 562*c98d5d94SLen Brown return 0; 563*c98d5d94SLen Brown 564*c98d5d94SLen Brown average.packages.pc2 += p->pc2; 565*c98d5d94SLen Brown average.packages.pc3 += p->pc3; 566*c98d5d94SLen Brown average.packages.pc6 += p->pc6; 567*c98d5d94SLen Brown average.packages.pc7 += p->pc7; 568*c98d5d94SLen Brown 569*c98d5d94SLen Brown return 0; 570*c98d5d94SLen Brown } 571*c98d5d94SLen Brown /* 572*c98d5d94SLen Brown * sum the counters for all cpus in the system 573*c98d5d94SLen Brown * compute the weighted average 574*c98d5d94SLen Brown */ 575*c98d5d94SLen Brown void 
compute_average(struct thread_data *t, struct core_data *c, 576*c98d5d94SLen Brown struct pkg_data *p) 577*c98d5d94SLen Brown { 578*c98d5d94SLen Brown clear_counters(&average.threads, &average.cores, &average.packages); 579*c98d5d94SLen Brown 580*c98d5d94SLen Brown for_all_cpus(sum_counters, t, c, p); 581*c98d5d94SLen Brown 582*c98d5d94SLen Brown average.threads.tsc /= topo.num_cpus; 583*c98d5d94SLen Brown average.threads.aperf /= topo.num_cpus; 584*c98d5d94SLen Brown average.threads.mperf /= topo.num_cpus; 585*c98d5d94SLen Brown average.threads.c1 /= topo.num_cpus; 586*c98d5d94SLen Brown 587*c98d5d94SLen Brown average.cores.c3 /= topo.num_cores; 588*c98d5d94SLen Brown average.cores.c6 /= topo.num_cores; 589*c98d5d94SLen Brown average.cores.c7 /= topo.num_cores; 590*c98d5d94SLen Brown 591*c98d5d94SLen Brown average.packages.pc2 /= topo.num_packages; 592*c98d5d94SLen Brown average.packages.pc3 /= topo.num_packages; 593*c98d5d94SLen Brown average.packages.pc6 /= topo.num_packages; 594*c98d5d94SLen Brown average.packages.pc7 /= topo.num_packages; 595*c98d5d94SLen Brown } 596*c98d5d94SLen Brown 597*c98d5d94SLen Brown static unsigned long long rdtsc(void) 598*c98d5d94SLen Brown { 599*c98d5d94SLen Brown unsigned int low, high; 600*c98d5d94SLen Brown 601*c98d5d94SLen Brown asm volatile("rdtsc" : "=a" (low), "=d" (high)); 602*c98d5d94SLen Brown 603*c98d5d94SLen Brown return low | ((unsigned long long)high) << 32; 604*c98d5d94SLen Brown } 605*c98d5d94SLen Brown 606*c98d5d94SLen Brown 607*c98d5d94SLen Brown /* 608*c98d5d94SLen Brown * get_counters(...) 
609*c98d5d94SLen Brown * migrate to cpu 610*c98d5d94SLen Brown * acquire and record local counters for that cpu 611*c98d5d94SLen Brown */ 612*c98d5d94SLen Brown int get_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p) 613*c98d5d94SLen Brown { 614*c98d5d94SLen Brown int cpu = t->cpu_id; 615*c98d5d94SLen Brown 616*c98d5d94SLen Brown if (cpu_migrate(cpu)) 61715aaa346SLen Brown return -1; 61815aaa346SLen Brown 619*c98d5d94SLen Brown t->tsc = rdtsc(); /* we are running on local CPU of interest */ 62015aaa346SLen Brown 62115aaa346SLen Brown if (has_aperf) { 622*c98d5d94SLen Brown if (get_msr(cpu, MSR_APERF, &t->aperf)) 623*c98d5d94SLen Brown return -3; 624*c98d5d94SLen Brown if (get_msr(cpu, MSR_MPERF, &t->mperf)) 625*c98d5d94SLen Brown return -4; 62688c3281fSLen Brown } 62788c3281fSLen Brown 628*c98d5d94SLen Brown if (extra_msr_offset) 629*c98d5d94SLen Brown if (get_msr(cpu, extra_msr_offset, &t->extra_msr)) 630*c98d5d94SLen Brown return -5; 631*c98d5d94SLen Brown 632*c98d5d94SLen Brown /* collect core counters only for 1st thread in core */ 633*c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE)) 634*c98d5d94SLen Brown return 0; 635*c98d5d94SLen Brown 63615aaa346SLen Brown if (do_nhm_cstates) { 637*c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C3_RESIDENCY, &c->c3)) 638*c98d5d94SLen Brown return -6; 639*c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C6_RESIDENCY, &c->c6)) 640*c98d5d94SLen Brown return -7; 641103a8feaSLen Brown } 64215aaa346SLen Brown 64315aaa346SLen Brown if (do_snb_cstates) 644*c98d5d94SLen Brown if (get_msr(cpu, MSR_CORE_C7_RESIDENCY, &c->c7)) 645*c98d5d94SLen Brown return -8; 646*c98d5d94SLen Brown 647*c98d5d94SLen Brown /* collect package counters only for 1st core in package */ 648*c98d5d94SLen Brown if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) 649*c98d5d94SLen Brown return 0; 65015aaa346SLen Brown 65115aaa346SLen Brown if (do_nhm_cstates) { 652*c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C3_RESIDENCY, 
&p->pc3)) 653*c98d5d94SLen Brown return -9; 654*c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C6_RESIDENCY, &p->pc6)) 655*c98d5d94SLen Brown return -10; 65615aaa346SLen Brown } 65715aaa346SLen Brown if (do_snb_cstates) { 658*c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C2_RESIDENCY, &p->pc2)) 659*c98d5d94SLen Brown return -11; 660*c98d5d94SLen Brown if (get_msr(cpu, MSR_PKG_C7_RESIDENCY, &p->pc7)) 661*c98d5d94SLen Brown return -12; 66215aaa346SLen Brown } 66315aaa346SLen Brown return 0; 664103a8feaSLen Brown } 665103a8feaSLen Brown 666*c98d5d94SLen Brown void print_verbose_header(void) 667103a8feaSLen Brown { 668103a8feaSLen Brown unsigned long long msr; 669103a8feaSLen Brown unsigned int ratio; 670103a8feaSLen Brown 671103a8feaSLen Brown if (!do_nehalem_platform_info) 672103a8feaSLen Brown return; 673103a8feaSLen Brown 67415aaa346SLen Brown get_msr(0, MSR_NEHALEM_PLATFORM_INFO, &msr); 675103a8feaSLen Brown 676103a8feaSLen Brown ratio = (msr >> 40) & 0xFF; 677103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max efficiency\n", 678103a8feaSLen Brown ratio, bclk, ratio * bclk); 679103a8feaSLen Brown 680103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 681103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz TSC frequency\n", 682103a8feaSLen Brown ratio, bclk, ratio * bclk); 683103a8feaSLen Brown 684103a8feaSLen Brown if (verbose > 1) 685103a8feaSLen Brown fprintf(stderr, "MSR_NEHALEM_PLATFORM_INFO: 0x%llx\n", msr); 686103a8feaSLen Brown 687103a8feaSLen Brown if (!do_nehalem_turbo_ratio_limit) 688103a8feaSLen Brown return; 689103a8feaSLen Brown 69015aaa346SLen Brown get_msr(0, MSR_NEHALEM_TURBO_RATIO_LIMIT, &msr); 691103a8feaSLen Brown 692103a8feaSLen Brown ratio = (msr >> 24) & 0xFF; 693103a8feaSLen Brown if (ratio) 694103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 4 active cores\n", 695103a8feaSLen Brown ratio, bclk, ratio * bclk); 696103a8feaSLen Brown 697103a8feaSLen Brown ratio = (msr >> 16) & 0xFF; 698103a8feaSLen Brown if (ratio) 
699103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 3 active cores\n", 700103a8feaSLen Brown ratio, bclk, ratio * bclk); 701103a8feaSLen Brown 702103a8feaSLen Brown ratio = (msr >> 8) & 0xFF; 703103a8feaSLen Brown if (ratio) 704103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 2 active cores\n", 705103a8feaSLen Brown ratio, bclk, ratio * bclk); 706103a8feaSLen Brown 707103a8feaSLen Brown ratio = (msr >> 0) & 0xFF; 708103a8feaSLen Brown if (ratio) 709103a8feaSLen Brown fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 1 active cores\n", 710103a8feaSLen Brown ratio, bclk, ratio * bclk); 711103a8feaSLen Brown 712103a8feaSLen Brown } 713103a8feaSLen Brown 714*c98d5d94SLen Brown void free_all_buffers(void) 715103a8feaSLen Brown { 716*c98d5d94SLen Brown CPU_FREE(cpu_present_set); 717*c98d5d94SLen Brown cpu_present_set = NULL; 718*c98d5d94SLen Brown cpu_present_set = 0; 719103a8feaSLen Brown 720*c98d5d94SLen Brown CPU_FREE(cpu_affinity_set); 721*c98d5d94SLen Brown cpu_affinity_set = NULL; 722*c98d5d94SLen Brown cpu_affinity_setsize = 0; 723103a8feaSLen Brown 724*c98d5d94SLen Brown free(thread_even); 725*c98d5d94SLen Brown free(core_even); 726*c98d5d94SLen Brown free(package_even); 727103a8feaSLen Brown 728*c98d5d94SLen Brown thread_even = NULL; 729*c98d5d94SLen Brown core_even = NULL; 730*c98d5d94SLen Brown package_even = NULL; 731103a8feaSLen Brown 732*c98d5d94SLen Brown free(thread_odd); 733*c98d5d94SLen Brown free(core_odd); 734*c98d5d94SLen Brown free(package_odd); 735103a8feaSLen Brown 736*c98d5d94SLen Brown thread_odd = NULL; 737*c98d5d94SLen Brown core_odd = NULL; 738*c98d5d94SLen Brown package_odd = NULL; 739103a8feaSLen Brown 740*c98d5d94SLen Brown free(output_buffer); 741*c98d5d94SLen Brown output_buffer = NULL; 742*c98d5d94SLen Brown outp = NULL; 743103a8feaSLen Brown } 744103a8feaSLen Brown 745103a8feaSLen Brown /* 746*c98d5d94SLen Brown * cpu_is_first_sibling_in_core(cpu) 747*c98d5d94SLen Brown * return 1 if given CPU is 1st 
HT sibling in the core 748103a8feaSLen Brown */ 749*c98d5d94SLen Brown int cpu_is_first_sibling_in_core(int cpu) 750103a8feaSLen Brown { 751*c98d5d94SLen Brown char path[64]; 752*c98d5d94SLen Brown FILE *filep; 753*c98d5d94SLen Brown int first_cpu; 754103a8feaSLen Brown 755*c98d5d94SLen Brown sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu); 756*c98d5d94SLen Brown filep = fopen(path, "r"); 757*c98d5d94SLen Brown if (filep == NULL) { 758*c98d5d94SLen Brown perror(path); 759103a8feaSLen Brown exit(1); 760103a8feaSLen Brown } 761*c98d5d94SLen Brown fscanf(filep, "%d", &first_cpu); 762*c98d5d94SLen Brown fclose(filep); 763*c98d5d94SLen Brown return (cpu == first_cpu); 764*c98d5d94SLen Brown } 765103a8feaSLen Brown 766*c98d5d94SLen Brown /* 767*c98d5d94SLen Brown * cpu_is_first_core_in_package(cpu) 768*c98d5d94SLen Brown * return 1 if given CPU is 1st core in package 769*c98d5d94SLen Brown */ 770*c98d5d94SLen Brown int cpu_is_first_core_in_package(int cpu) 771*c98d5d94SLen Brown { 772*c98d5d94SLen Brown char path[64]; 773*c98d5d94SLen Brown FILE *filep; 774*c98d5d94SLen Brown int first_cpu; 775*c98d5d94SLen Brown 776*c98d5d94SLen Brown sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/core_siblings_list", cpu); 777*c98d5d94SLen Brown filep = fopen(path, "r"); 778*c98d5d94SLen Brown if (filep == NULL) { 779*c98d5d94SLen Brown perror(path); 780103a8feaSLen Brown exit(1); 781103a8feaSLen Brown } 782*c98d5d94SLen Brown fscanf(filep, "%d", &first_cpu); 783*c98d5d94SLen Brown fclose(filep); 784*c98d5d94SLen Brown return (cpu == first_cpu); 785103a8feaSLen Brown } 786103a8feaSLen Brown 787103a8feaSLen Brown int get_physical_package_id(int cpu) 788103a8feaSLen Brown { 789*c98d5d94SLen Brown char path[80]; 790103a8feaSLen Brown FILE *filep; 791103a8feaSLen Brown int pkg; 792103a8feaSLen Brown 793103a8feaSLen Brown sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/physical_package_id", cpu); 794103a8feaSLen Brown filep = fopen(path, "r"); 
795103a8feaSLen Brown if (filep == NULL) { 796103a8feaSLen Brown perror(path); 797103a8feaSLen Brown exit(1); 798103a8feaSLen Brown } 799103a8feaSLen Brown fscanf(filep, "%d", &pkg); 800103a8feaSLen Brown fclose(filep); 801103a8feaSLen Brown return pkg; 802103a8feaSLen Brown } 803103a8feaSLen Brown 804103a8feaSLen Brown int get_core_id(int cpu) 805103a8feaSLen Brown { 806*c98d5d94SLen Brown char path[80]; 807103a8feaSLen Brown FILE *filep; 808103a8feaSLen Brown int core; 809103a8feaSLen Brown 810103a8feaSLen Brown sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/core_id", cpu); 811103a8feaSLen Brown filep = fopen(path, "r"); 812103a8feaSLen Brown if (filep == NULL) { 813103a8feaSLen Brown perror(path); 814103a8feaSLen Brown exit(1); 815103a8feaSLen Brown } 816103a8feaSLen Brown fscanf(filep, "%d", &core); 817103a8feaSLen Brown fclose(filep); 818103a8feaSLen Brown return core; 819103a8feaSLen Brown } 820103a8feaSLen Brown 821*c98d5d94SLen Brown int get_num_ht_siblings(int cpu) 822*c98d5d94SLen Brown { 823*c98d5d94SLen Brown char path[80]; 824*c98d5d94SLen Brown FILE *filep; 825*c98d5d94SLen Brown int sib1, sib2; 826*c98d5d94SLen Brown int matches; 827*c98d5d94SLen Brown char character; 828*c98d5d94SLen Brown 829*c98d5d94SLen Brown sprintf(path, "/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu); 830*c98d5d94SLen Brown filep = fopen(path, "r"); 831*c98d5d94SLen Brown if (filep == NULL) { 832*c98d5d94SLen Brown perror(path); 833*c98d5d94SLen Brown exit(1); 834*c98d5d94SLen Brown } 835103a8feaSLen Brown /* 836*c98d5d94SLen Brown * file format: 837*c98d5d94SLen Brown * if a pair of number with a character between: 2 siblings (eg. 1-2, or 1,4) 838*c98d5d94SLen Brown * otherwinse 1 sibling (self). 
839*c98d5d94SLen Brown */ 840*c98d5d94SLen Brown matches = fscanf(filep, "%d%c%d\n", &sib1, &character, &sib2); 841*c98d5d94SLen Brown 842*c98d5d94SLen Brown fclose(filep); 843*c98d5d94SLen Brown 844*c98d5d94SLen Brown if (matches == 3) 845*c98d5d94SLen Brown return 2; 846*c98d5d94SLen Brown else 847*c98d5d94SLen Brown return 1; 848*c98d5d94SLen Brown } 849*c98d5d94SLen Brown 850*c98d5d94SLen Brown /* 851*c98d5d94SLen Brown * run func(thread, core, package) in topology order 852*c98d5d94SLen Brown * skip non-present cpus 853103a8feaSLen Brown */ 854103a8feaSLen Brown 855*c98d5d94SLen Brown int for_all_cpus_2(int (func)(struct thread_data *, struct core_data *, 856*c98d5d94SLen Brown struct pkg_data *, struct thread_data *, struct core_data *, 857*c98d5d94SLen Brown struct pkg_data *), struct thread_data *thread_base, 858*c98d5d94SLen Brown struct core_data *core_base, struct pkg_data *pkg_base, 859*c98d5d94SLen Brown struct thread_data *thread_base2, struct core_data *core_base2, 860*c98d5d94SLen Brown struct pkg_data *pkg_base2) 861*c98d5d94SLen Brown { 862*c98d5d94SLen Brown int retval, pkg_no, core_no, thread_no; 863*c98d5d94SLen Brown 864*c98d5d94SLen Brown for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) { 865*c98d5d94SLen Brown for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) { 866*c98d5d94SLen Brown for (thread_no = 0; thread_no < 867*c98d5d94SLen Brown topo.num_threads_per_core; ++thread_no) { 868*c98d5d94SLen Brown struct thread_data *t, *t2; 869*c98d5d94SLen Brown struct core_data *c, *c2; 870*c98d5d94SLen Brown struct pkg_data *p, *p2; 871*c98d5d94SLen Brown 872*c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_no, core_no, pkg_no); 873*c98d5d94SLen Brown 874*c98d5d94SLen Brown if (cpu_is_not_present(t->cpu_id)) 875*c98d5d94SLen Brown continue; 876*c98d5d94SLen Brown 877*c98d5d94SLen Brown t2 = GET_THREAD(thread_base2, thread_no, core_no, pkg_no); 878*c98d5d94SLen Brown 879*c98d5d94SLen Brown c = GET_CORE(core_base, core_no, 
pkg_no); 880*c98d5d94SLen Brown c2 = GET_CORE(core_base2, core_no, pkg_no); 881*c98d5d94SLen Brown 882*c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_no); 883*c98d5d94SLen Brown p2 = GET_PKG(pkg_base2, pkg_no); 884*c98d5d94SLen Brown 885*c98d5d94SLen Brown retval = func(t, c, p, t2, c2, p2); 886*c98d5d94SLen Brown if (retval) 887*c98d5d94SLen Brown return retval; 888*c98d5d94SLen Brown } 889*c98d5d94SLen Brown } 890*c98d5d94SLen Brown } 891*c98d5d94SLen Brown return 0; 892*c98d5d94SLen Brown } 893*c98d5d94SLen Brown 894*c98d5d94SLen Brown /* 895*c98d5d94SLen Brown * run func(cpu) on every cpu in /proc/stat 896*c98d5d94SLen Brown * return max_cpu number 897*c98d5d94SLen Brown */ 898*c98d5d94SLen Brown int for_all_proc_cpus(int (func)(int)) 899103a8feaSLen Brown { 900103a8feaSLen Brown FILE *fp; 901*c98d5d94SLen Brown int cpu_num; 902103a8feaSLen Brown int retval; 903103a8feaSLen Brown 904103a8feaSLen Brown fp = fopen(proc_stat, "r"); 905103a8feaSLen Brown if (fp == NULL) { 906103a8feaSLen Brown perror(proc_stat); 907103a8feaSLen Brown exit(1); 908103a8feaSLen Brown } 909103a8feaSLen Brown 910103a8feaSLen Brown retval = fscanf(fp, "cpu %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n"); 911103a8feaSLen Brown if (retval != 0) { 912103a8feaSLen Brown perror("/proc/stat format"); 913103a8feaSLen Brown exit(1); 914103a8feaSLen Brown } 915103a8feaSLen Brown 916*c98d5d94SLen Brown while (1) { 917*c98d5d94SLen Brown retval = fscanf(fp, "cpu%u %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n", &cpu_num); 918103a8feaSLen Brown if (retval != 1) 919103a8feaSLen Brown break; 920103a8feaSLen Brown 921*c98d5d94SLen Brown retval = func(cpu_num); 922*c98d5d94SLen Brown if (retval) { 923*c98d5d94SLen Brown fclose(fp); 924*c98d5d94SLen Brown return(retval); 925*c98d5d94SLen Brown } 926103a8feaSLen Brown } 927103a8feaSLen Brown fclose(fp); 928*c98d5d94SLen Brown return 0; 929103a8feaSLen Brown } 930103a8feaSLen Brown 931103a8feaSLen Brown void re_initialize(void) 932103a8feaSLen Brown { 
933*c98d5d94SLen Brown free_all_buffers(); 934*c98d5d94SLen Brown setup_all_buffers(); 935*c98d5d94SLen Brown printf("turbostat: re-initialized with num_cpus %d\n", topo.num_cpus); 936103a8feaSLen Brown } 937103a8feaSLen Brown 938*c98d5d94SLen Brown 939103a8feaSLen Brown /* 940*c98d5d94SLen Brown * count_cpus() 941*c98d5d94SLen Brown * remember the last one seen, it will be the max 942103a8feaSLen Brown */ 943*c98d5d94SLen Brown int count_cpus(int cpu) 944103a8feaSLen Brown { 945*c98d5d94SLen Brown if (topo.max_cpu_num < cpu) 946*c98d5d94SLen Brown topo.max_cpu_num = cpu; 947103a8feaSLen Brown 948*c98d5d94SLen Brown topo.num_cpus += 1; 949*c98d5d94SLen Brown return 0; 950103a8feaSLen Brown } 951*c98d5d94SLen Brown int mark_cpu_present(int cpu) 952*c98d5d94SLen Brown { 953*c98d5d94SLen Brown CPU_SET_S(cpu, cpu_present_setsize, cpu_present_set); 95415aaa346SLen Brown return 0; 955103a8feaSLen Brown } 956103a8feaSLen Brown 957103a8feaSLen Brown void turbostat_loop() 958103a8feaSLen Brown { 959*c98d5d94SLen Brown int retval; 960*c98d5d94SLen Brown 961103a8feaSLen Brown restart: 962*c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 963*c98d5d94SLen Brown if (retval) { 964*c98d5d94SLen Brown re_initialize(); 965*c98d5d94SLen Brown goto restart; 966*c98d5d94SLen Brown } 967103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 968103a8feaSLen Brown 969103a8feaSLen Brown while (1) { 970*c98d5d94SLen Brown if (for_all_proc_cpus(cpu_is_not_present)) { 971103a8feaSLen Brown re_initialize(); 972103a8feaSLen Brown goto restart; 973103a8feaSLen Brown } 974103a8feaSLen Brown sleep(interval_sec); 975*c98d5d94SLen Brown retval = for_all_cpus(get_counters, ODD_COUNTERS); 976*c98d5d94SLen Brown if (retval) { 97715aaa346SLen Brown re_initialize(); 97815aaa346SLen Brown goto restart; 97915aaa346SLen Brown } 980103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 981103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 
982*c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 983*c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 984*c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 985*c98d5d94SLen Brown flush_stdout(); 98615aaa346SLen Brown sleep(interval_sec); 987*c98d5d94SLen Brown retval = for_all_cpus(get_counters, EVEN_COUNTERS); 988*c98d5d94SLen Brown if (retval) { 989103a8feaSLen Brown re_initialize(); 990103a8feaSLen Brown goto restart; 991103a8feaSLen Brown } 992103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 993103a8feaSLen Brown timersub(&tv_even, &tv_odd, &tv_delta); 994*c98d5d94SLen Brown for_all_cpus_2(delta_cpu, EVEN_COUNTERS, ODD_COUNTERS); 995*c98d5d94SLen Brown compute_average(ODD_COUNTERS); 996*c98d5d94SLen Brown format_all_counters(ODD_COUNTERS); 997*c98d5d94SLen Brown flush_stdout(); 998103a8feaSLen Brown } 999103a8feaSLen Brown } 1000103a8feaSLen Brown 1001103a8feaSLen Brown void check_dev_msr() 1002103a8feaSLen Brown { 1003103a8feaSLen Brown struct stat sb; 1004103a8feaSLen Brown 1005103a8feaSLen Brown if (stat("/dev/cpu/0/msr", &sb)) { 1006103a8feaSLen Brown fprintf(stderr, "no /dev/cpu/0/msr\n"); 1007103a8feaSLen Brown fprintf(stderr, "Try \"# modprobe msr\"\n"); 1008103a8feaSLen Brown exit(-5); 1009103a8feaSLen Brown } 1010103a8feaSLen Brown } 1011103a8feaSLen Brown 1012103a8feaSLen Brown void check_super_user() 1013103a8feaSLen Brown { 1014103a8feaSLen Brown if (getuid() != 0) { 1015103a8feaSLen Brown fprintf(stderr, "must be root\n"); 1016103a8feaSLen Brown exit(-6); 1017103a8feaSLen Brown } 1018103a8feaSLen Brown } 1019103a8feaSLen Brown 1020103a8feaSLen Brown int has_nehalem_turbo_ratio_limit(unsigned int family, unsigned int model) 1021103a8feaSLen Brown { 1022103a8feaSLen Brown if (!genuine_intel) 1023103a8feaSLen Brown return 0; 1024103a8feaSLen Brown 1025103a8feaSLen Brown if (family != 6) 1026103a8feaSLen Brown return 0; 1027103a8feaSLen Brown 1028103a8feaSLen Brown switch (model) { 
1029103a8feaSLen Brown case 0x1A: /* Core i7, Xeon 5500 series - Bloomfield, Gainstown NHM-EP */ 1030103a8feaSLen Brown case 0x1E: /* Core i7 and i5 Processor - Clarksfield, Lynnfield, Jasper Forest */ 1031103a8feaSLen Brown case 0x1F: /* Core i7 and i5 Processor - Nehalem */ 1032103a8feaSLen Brown case 0x25: /* Westmere Client - Clarkdale, Arrandale */ 1033103a8feaSLen Brown case 0x2C: /* Westmere EP - Gulftown */ 1034103a8feaSLen Brown case 0x2A: /* SNB */ 1035103a8feaSLen Brown case 0x2D: /* SNB Xeon */ 1036553575f1SLen Brown case 0x3A: /* IVB */ 1037553575f1SLen Brown case 0x3D: /* IVB Xeon */ 1038103a8feaSLen Brown return 1; 1039103a8feaSLen Brown case 0x2E: /* Nehalem-EX Xeon - Beckton */ 1040103a8feaSLen Brown case 0x2F: /* Westmere-EX Xeon - Eagleton */ 1041103a8feaSLen Brown default: 1042103a8feaSLen Brown return 0; 1043103a8feaSLen Brown } 1044103a8feaSLen Brown } 1045103a8feaSLen Brown 1046103a8feaSLen Brown int is_snb(unsigned int family, unsigned int model) 1047103a8feaSLen Brown { 1048103a8feaSLen Brown if (!genuine_intel) 1049103a8feaSLen Brown return 0; 1050103a8feaSLen Brown 1051103a8feaSLen Brown switch (model) { 1052103a8feaSLen Brown case 0x2A: 1053103a8feaSLen Brown case 0x2D: 1054650a37f3SLen Brown case 0x3A: /* IVB */ 1055650a37f3SLen Brown case 0x3D: /* IVB Xeon */ 1056103a8feaSLen Brown return 1; 1057103a8feaSLen Brown } 1058103a8feaSLen Brown return 0; 1059103a8feaSLen Brown } 1060103a8feaSLen Brown 1061103a8feaSLen Brown double discover_bclk(unsigned int family, unsigned int model) 1062103a8feaSLen Brown { 1063103a8feaSLen Brown if (is_snb(family, model)) 1064103a8feaSLen Brown return 100.00; 1065103a8feaSLen Brown else 1066103a8feaSLen Brown return 133.33; 1067103a8feaSLen Brown } 1068103a8feaSLen Brown 1069103a8feaSLen Brown void check_cpuid() 1070103a8feaSLen Brown { 1071103a8feaSLen Brown unsigned int eax, ebx, ecx, edx, max_level; 1072103a8feaSLen Brown unsigned int fms, family, model, stepping; 1073103a8feaSLen Brown 
1074103a8feaSLen Brown eax = ebx = ecx = edx = 0; 1075103a8feaSLen Brown 1076103a8feaSLen Brown asm("cpuid" : "=a" (max_level), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0)); 1077103a8feaSLen Brown 1078103a8feaSLen Brown if (ebx == 0x756e6547 && edx == 0x49656e69 && ecx == 0x6c65746e) 1079103a8feaSLen Brown genuine_intel = 1; 1080103a8feaSLen Brown 1081103a8feaSLen Brown if (verbose) 1082103a8feaSLen Brown fprintf(stderr, "%.4s%.4s%.4s ", 1083103a8feaSLen Brown (char *)&ebx, (char *)&edx, (char *)&ecx); 1084103a8feaSLen Brown 1085103a8feaSLen Brown asm("cpuid" : "=a" (fms), "=c" (ecx), "=d" (edx) : "a" (1) : "ebx"); 1086103a8feaSLen Brown family = (fms >> 8) & 0xf; 1087103a8feaSLen Brown model = (fms >> 4) & 0xf; 1088103a8feaSLen Brown stepping = fms & 0xf; 1089103a8feaSLen Brown if (family == 6 || family == 0xf) 1090103a8feaSLen Brown model += ((fms >> 16) & 0xf) << 4; 1091103a8feaSLen Brown 1092103a8feaSLen Brown if (verbose) 1093103a8feaSLen Brown fprintf(stderr, "%d CPUID levels; family:model:stepping 0x%x:%x:%x (%d:%d:%d)\n", 1094103a8feaSLen Brown max_level, family, model, stepping, family, model, stepping); 1095103a8feaSLen Brown 1096103a8feaSLen Brown if (!(edx & (1 << 5))) { 1097103a8feaSLen Brown fprintf(stderr, "CPUID: no MSR\n"); 1098103a8feaSLen Brown exit(1); 1099103a8feaSLen Brown } 1100103a8feaSLen Brown 1101103a8feaSLen Brown /* 1102103a8feaSLen Brown * check max extended function levels of CPUID. 1103103a8feaSLen Brown * This is needed to check for invariant TSC. 1104103a8feaSLen Brown * This check is valid for both Intel and AMD. 
1105103a8feaSLen Brown */ 1106103a8feaSLen Brown ebx = ecx = edx = 0; 1107103a8feaSLen Brown asm("cpuid" : "=a" (max_level), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0x80000000)); 1108103a8feaSLen Brown 1109103a8feaSLen Brown if (max_level < 0x80000007) { 1110103a8feaSLen Brown fprintf(stderr, "CPUID: no invariant TSC (max_level 0x%x)\n", max_level); 1111103a8feaSLen Brown exit(1); 1112103a8feaSLen Brown } 1113103a8feaSLen Brown 1114103a8feaSLen Brown /* 1115103a8feaSLen Brown * Non-Stop TSC is advertised by CPUID.EAX=0x80000007: EDX.bit8 1116103a8feaSLen Brown * this check is valid for both Intel and AMD 1117103a8feaSLen Brown */ 1118103a8feaSLen Brown asm("cpuid" : "=a" (eax), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0x80000007)); 11198209e054SThomas Renninger has_invariant_tsc = edx & (1 << 8); 1120103a8feaSLen Brown 1121103a8feaSLen Brown if (!has_invariant_tsc) { 1122103a8feaSLen Brown fprintf(stderr, "No invariant TSC\n"); 1123103a8feaSLen Brown exit(1); 1124103a8feaSLen Brown } 1125103a8feaSLen Brown 1126103a8feaSLen Brown /* 1127103a8feaSLen Brown * APERF/MPERF is advertised by CPUID.EAX=0x6: ECX.bit0 1128103a8feaSLen Brown * this check is valid for both Intel and AMD 1129103a8feaSLen Brown */ 1130103a8feaSLen Brown 1131103a8feaSLen Brown asm("cpuid" : "=a" (eax), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0x6)); 11328209e054SThomas Renninger has_aperf = ecx & (1 << 0); 1133103a8feaSLen Brown if (!has_aperf) { 1134103a8feaSLen Brown fprintf(stderr, "No APERF MSR\n"); 1135103a8feaSLen Brown exit(1); 1136103a8feaSLen Brown } 1137103a8feaSLen Brown 1138103a8feaSLen Brown do_nehalem_platform_info = genuine_intel && has_invariant_tsc; 1139103a8feaSLen Brown do_nhm_cstates = genuine_intel; /* all Intel w/ non-stop TSC have NHM counters */ 1140103a8feaSLen Brown do_snb_cstates = is_snb(family, model); 1141103a8feaSLen Brown bclk = discover_bclk(family, model); 1142103a8feaSLen Brown 1143103a8feaSLen Brown do_nehalem_turbo_ratio_limit = 
has_nehalem_turbo_ratio_limit(family, model); 1144103a8feaSLen Brown } 1145103a8feaSLen Brown 1146103a8feaSLen Brown 1147103a8feaSLen Brown void usage() 1148103a8feaSLen Brown { 1149103a8feaSLen Brown fprintf(stderr, "%s: [-v] [-M MSR#] [-i interval_sec | command ...]\n", 1150103a8feaSLen Brown progname); 1151103a8feaSLen Brown exit(1); 1152103a8feaSLen Brown } 1153103a8feaSLen Brown 1154103a8feaSLen Brown 1155103a8feaSLen Brown /* 1156103a8feaSLen Brown * in /dev/cpu/ return success for names that are numbers 1157103a8feaSLen Brown * ie. filter out ".", "..", "microcode". 1158103a8feaSLen Brown */ 1159103a8feaSLen Brown int dir_filter(const struct dirent *dirp) 1160103a8feaSLen Brown { 1161103a8feaSLen Brown if (isdigit(dirp->d_name[0])) 1162103a8feaSLen Brown return 1; 1163103a8feaSLen Brown else 1164103a8feaSLen Brown return 0; 1165103a8feaSLen Brown } 1166103a8feaSLen Brown 1167103a8feaSLen Brown int open_dev_cpu_msr(int dummy1) 1168103a8feaSLen Brown { 1169103a8feaSLen Brown return 0; 1170103a8feaSLen Brown } 1171103a8feaSLen Brown 1172*c98d5d94SLen Brown void topology_probe() 1173*c98d5d94SLen Brown { 1174*c98d5d94SLen Brown int i; 1175*c98d5d94SLen Brown int max_core_id = 0; 1176*c98d5d94SLen Brown int max_package_id = 0; 1177*c98d5d94SLen Brown int max_siblings = 0; 1178*c98d5d94SLen Brown struct cpu_topology { 1179*c98d5d94SLen Brown int core_id; 1180*c98d5d94SLen Brown int physical_package_id; 1181*c98d5d94SLen Brown } *cpus; 1182*c98d5d94SLen Brown 1183*c98d5d94SLen Brown /* Initialize num_cpus, max_cpu_num */ 1184*c98d5d94SLen Brown topo.num_cpus = 0; 1185*c98d5d94SLen Brown topo.max_cpu_num = 0; 1186*c98d5d94SLen Brown for_all_proc_cpus(count_cpus); 1187*c98d5d94SLen Brown if (!summary_only && topo.num_cpus > 1) 1188*c98d5d94SLen Brown show_cpu = 1; 1189*c98d5d94SLen Brown 1190*c98d5d94SLen Brown if (verbose > 1) 1191*c98d5d94SLen Brown fprintf(stderr, "num_cpus %d max_cpu_num %d\n", topo.num_cpus, topo.max_cpu_num); 1192*c98d5d94SLen Brown 
1193*c98d5d94SLen Brown cpus = calloc(1, (topo.max_cpu_num + 1) * sizeof(struct cpu_topology)); 1194*c98d5d94SLen Brown if (cpus == NULL) { 1195*c98d5d94SLen Brown perror("calloc cpus"); 1196*c98d5d94SLen Brown exit(1); 1197*c98d5d94SLen Brown } 1198*c98d5d94SLen Brown 1199*c98d5d94SLen Brown /* 1200*c98d5d94SLen Brown * Allocate and initialize cpu_present_set 1201*c98d5d94SLen Brown */ 1202*c98d5d94SLen Brown cpu_present_set = CPU_ALLOC((topo.max_cpu_num + 1)); 1203*c98d5d94SLen Brown if (cpu_present_set == NULL) { 1204*c98d5d94SLen Brown perror("CPU_ALLOC"); 1205*c98d5d94SLen Brown exit(3); 1206*c98d5d94SLen Brown } 1207*c98d5d94SLen Brown cpu_present_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 1208*c98d5d94SLen Brown CPU_ZERO_S(cpu_present_setsize, cpu_present_set); 1209*c98d5d94SLen Brown for_all_proc_cpus(mark_cpu_present); 1210*c98d5d94SLen Brown 1211*c98d5d94SLen Brown /* 1212*c98d5d94SLen Brown * Allocate and initialize cpu_affinity_set 1213*c98d5d94SLen Brown */ 1214*c98d5d94SLen Brown cpu_affinity_set = CPU_ALLOC((topo.max_cpu_num + 1)); 1215*c98d5d94SLen Brown if (cpu_affinity_set == NULL) { 1216*c98d5d94SLen Brown perror("CPU_ALLOC"); 1217*c98d5d94SLen Brown exit(3); 1218*c98d5d94SLen Brown } 1219*c98d5d94SLen Brown cpu_affinity_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1)); 1220*c98d5d94SLen Brown CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set); 1221*c98d5d94SLen Brown 1222*c98d5d94SLen Brown 1223*c98d5d94SLen Brown /* 1224*c98d5d94SLen Brown * For online cpus 1225*c98d5d94SLen Brown * find max_core_id, max_package_id 1226*c98d5d94SLen Brown */ 1227*c98d5d94SLen Brown for (i = 0; i <= topo.max_cpu_num; ++i) { 1228*c98d5d94SLen Brown int siblings; 1229*c98d5d94SLen Brown 1230*c98d5d94SLen Brown if (cpu_is_not_present(i)) { 1231*c98d5d94SLen Brown if (verbose > 1) 1232*c98d5d94SLen Brown fprintf(stderr, "cpu%d NOT PRESENT\n", i); 1233*c98d5d94SLen Brown continue; 1234*c98d5d94SLen Brown } 1235*c98d5d94SLen Brown cpus[i].core_id = 
get_core_id(i); 1236*c98d5d94SLen Brown if (cpus[i].core_id > max_core_id) 1237*c98d5d94SLen Brown max_core_id = cpus[i].core_id; 1238*c98d5d94SLen Brown 1239*c98d5d94SLen Brown cpus[i].physical_package_id = get_physical_package_id(i); 1240*c98d5d94SLen Brown if (cpus[i].physical_package_id > max_package_id) 1241*c98d5d94SLen Brown max_package_id = cpus[i].physical_package_id; 1242*c98d5d94SLen Brown 1243*c98d5d94SLen Brown siblings = get_num_ht_siblings(i); 1244*c98d5d94SLen Brown if (siblings > max_siblings) 1245*c98d5d94SLen Brown max_siblings = siblings; 1246*c98d5d94SLen Brown if (verbose > 1) 1247*c98d5d94SLen Brown fprintf(stderr, "cpu %d pkg %d core %d\n", 1248*c98d5d94SLen Brown i, cpus[i].physical_package_id, cpus[i].core_id); 1249*c98d5d94SLen Brown } 1250*c98d5d94SLen Brown topo.num_cores_per_pkg = max_core_id + 1; 1251*c98d5d94SLen Brown if (verbose > 1) 1252*c98d5d94SLen Brown fprintf(stderr, "max_core_id %d, sizing for %d cores per package\n", 1253*c98d5d94SLen Brown max_core_id, topo.num_cores_per_pkg); 1254*c98d5d94SLen Brown if (!summary_only && topo.num_cores_per_pkg > 1) 1255*c98d5d94SLen Brown show_core = 1; 1256*c98d5d94SLen Brown 1257*c98d5d94SLen Brown topo.num_packages = max_package_id + 1; 1258*c98d5d94SLen Brown if (verbose > 1) 1259*c98d5d94SLen Brown fprintf(stderr, "max_package_id %d, sizing for %d packages\n", 1260*c98d5d94SLen Brown max_package_id, topo.num_packages); 1261*c98d5d94SLen Brown if (!summary_only && topo.num_packages > 1) 1262*c98d5d94SLen Brown show_pkg = 1; 1263*c98d5d94SLen Brown 1264*c98d5d94SLen Brown topo.num_threads_per_core = max_siblings; 1265*c98d5d94SLen Brown if (verbose > 1) 1266*c98d5d94SLen Brown fprintf(stderr, "max_siblings %d\n", max_siblings); 1267*c98d5d94SLen Brown 1268*c98d5d94SLen Brown free(cpus); 1269*c98d5d94SLen Brown } 1270*c98d5d94SLen Brown 1271*c98d5d94SLen Brown void 1272*c98d5d94SLen Brown allocate_counters(struct thread_data **t, struct core_data **c, struct pkg_data **p) 
1273*c98d5d94SLen Brown { 1274*c98d5d94SLen Brown int i; 1275*c98d5d94SLen Brown 1276*c98d5d94SLen Brown *t = calloc(topo.num_threads_per_core * topo.num_cores_per_pkg * 1277*c98d5d94SLen Brown topo.num_packages, sizeof(struct thread_data)); 1278*c98d5d94SLen Brown if (*t == NULL) 1279*c98d5d94SLen Brown goto error; 1280*c98d5d94SLen Brown 1281*c98d5d94SLen Brown for (i = 0; i < topo.num_threads_per_core * 1282*c98d5d94SLen Brown topo.num_cores_per_pkg * topo.num_packages; i++) 1283*c98d5d94SLen Brown (*t)[i].cpu_id = -1; 1284*c98d5d94SLen Brown 1285*c98d5d94SLen Brown *c = calloc(topo.num_cores_per_pkg * topo.num_packages, 1286*c98d5d94SLen Brown sizeof(struct core_data)); 1287*c98d5d94SLen Brown if (*c == NULL) 1288*c98d5d94SLen Brown goto error; 1289*c98d5d94SLen Brown 1290*c98d5d94SLen Brown for (i = 0; i < topo.num_cores_per_pkg * topo.num_packages; i++) 1291*c98d5d94SLen Brown (*c)[i].core_id = -1; 1292*c98d5d94SLen Brown 1293*c98d5d94SLen Brown *p = calloc(topo.num_packages, sizeof(struct pkg_data)); 1294*c98d5d94SLen Brown if (*p == NULL) 1295*c98d5d94SLen Brown goto error; 1296*c98d5d94SLen Brown 1297*c98d5d94SLen Brown for (i = 0; i < topo.num_packages; i++) 1298*c98d5d94SLen Brown (*p)[i].package_id = i; 1299*c98d5d94SLen Brown 1300*c98d5d94SLen Brown return; 1301*c98d5d94SLen Brown error: 1302*c98d5d94SLen Brown perror("calloc counters"); 1303*c98d5d94SLen Brown exit(1); 1304*c98d5d94SLen Brown } 1305*c98d5d94SLen Brown /* 1306*c98d5d94SLen Brown * init_counter() 1307*c98d5d94SLen Brown * 1308*c98d5d94SLen Brown * set cpu_id, core_num, pkg_num 1309*c98d5d94SLen Brown * set FIRST_THREAD_IN_CORE and FIRST_CORE_IN_PACKAGE 1310*c98d5d94SLen Brown * 1311*c98d5d94SLen Brown * increment topo.num_cores when 1st core in pkg seen 1312*c98d5d94SLen Brown */ 1313*c98d5d94SLen Brown void init_counter(struct thread_data *thread_base, struct core_data *core_base, 1314*c98d5d94SLen Brown struct pkg_data *pkg_base, int thread_num, int core_num, 1315*c98d5d94SLen Brown 
int pkg_num, int cpu_id) 1316*c98d5d94SLen Brown { 1317*c98d5d94SLen Brown struct thread_data *t; 1318*c98d5d94SLen Brown struct core_data *c; 1319*c98d5d94SLen Brown struct pkg_data *p; 1320*c98d5d94SLen Brown 1321*c98d5d94SLen Brown t = GET_THREAD(thread_base, thread_num, core_num, pkg_num); 1322*c98d5d94SLen Brown c = GET_CORE(core_base, core_num, pkg_num); 1323*c98d5d94SLen Brown p = GET_PKG(pkg_base, pkg_num); 1324*c98d5d94SLen Brown 1325*c98d5d94SLen Brown t->cpu_id = cpu_id; 1326*c98d5d94SLen Brown if (thread_num == 0) { 1327*c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_THREAD_IN_CORE; 1328*c98d5d94SLen Brown if (cpu_is_first_core_in_package(cpu_id)) 1329*c98d5d94SLen Brown t->flags |= CPU_IS_FIRST_CORE_IN_PACKAGE; 1330*c98d5d94SLen Brown } 1331*c98d5d94SLen Brown 1332*c98d5d94SLen Brown c->core_id = core_num; 1333*c98d5d94SLen Brown p->package_id = pkg_num; 1334*c98d5d94SLen Brown } 1335*c98d5d94SLen Brown 1336*c98d5d94SLen Brown 1337*c98d5d94SLen Brown int initialize_counters(int cpu_id) 1338*c98d5d94SLen Brown { 1339*c98d5d94SLen Brown int my_thread_id, my_core_id, my_package_id; 1340*c98d5d94SLen Brown 1341*c98d5d94SLen Brown my_package_id = get_physical_package_id(cpu_id); 1342*c98d5d94SLen Brown my_core_id = get_core_id(cpu_id); 1343*c98d5d94SLen Brown 1344*c98d5d94SLen Brown if (cpu_is_first_sibling_in_core(cpu_id)) { 1345*c98d5d94SLen Brown my_thread_id = 0; 1346*c98d5d94SLen Brown topo.num_cores++; 1347*c98d5d94SLen Brown } else { 1348*c98d5d94SLen Brown my_thread_id = 1; 1349*c98d5d94SLen Brown } 1350*c98d5d94SLen Brown 1351*c98d5d94SLen Brown init_counter(EVEN_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 1352*c98d5d94SLen Brown init_counter(ODD_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id); 1353*c98d5d94SLen Brown return 0; 1354*c98d5d94SLen Brown } 1355*c98d5d94SLen Brown 1356*c98d5d94SLen Brown void allocate_output_buffer() 1357*c98d5d94SLen Brown { 1358*c98d5d94SLen Brown output_buffer = calloc(1, (1 + topo.num_cpus) 
* 128); 1359*c98d5d94SLen Brown outp = output_buffer; 1360*c98d5d94SLen Brown if (outp == NULL) { 1361*c98d5d94SLen Brown perror("calloc"); 1362*c98d5d94SLen Brown exit(-1); 1363*c98d5d94SLen Brown } 1364*c98d5d94SLen Brown } 1365*c98d5d94SLen Brown 1366*c98d5d94SLen Brown void setup_all_buffers(void) 1367*c98d5d94SLen Brown { 1368*c98d5d94SLen Brown topology_probe(); 1369*c98d5d94SLen Brown allocate_counters(&thread_even, &core_even, &package_even); 1370*c98d5d94SLen Brown allocate_counters(&thread_odd, &core_odd, &package_odd); 1371*c98d5d94SLen Brown allocate_output_buffer(); 1372*c98d5d94SLen Brown for_all_proc_cpus(initialize_counters); 1373*c98d5d94SLen Brown } 1374103a8feaSLen Brown void turbostat_init() 1375103a8feaSLen Brown { 1376103a8feaSLen Brown check_cpuid(); 1377103a8feaSLen Brown 1378103a8feaSLen Brown check_dev_msr(); 1379103a8feaSLen Brown check_super_user(); 1380103a8feaSLen Brown 1381*c98d5d94SLen Brown setup_all_buffers(); 1382103a8feaSLen Brown 1383103a8feaSLen Brown if (verbose) 1384*c98d5d94SLen Brown print_verbose_header(); 1385103a8feaSLen Brown } 1386103a8feaSLen Brown 1387103a8feaSLen Brown int fork_it(char **argv) 1388103a8feaSLen Brown { 1389103a8feaSLen Brown pid_t child_pid; 1390d15cf7c1SLen Brown 1391*c98d5d94SLen Brown for_all_cpus(get_counters, EVEN_COUNTERS); 1392d15cf7c1SLen Brown /* clear affinity side-effect of get_counters() */ 1393d15cf7c1SLen Brown sched_setaffinity(0, cpu_present_setsize, cpu_present_set); 1394103a8feaSLen Brown gettimeofday(&tv_even, (struct timezone *)NULL); 1395103a8feaSLen Brown 1396103a8feaSLen Brown child_pid = fork(); 1397103a8feaSLen Brown if (!child_pid) { 1398103a8feaSLen Brown /* child */ 1399103a8feaSLen Brown execvp(argv[0], argv); 1400103a8feaSLen Brown } else { 1401103a8feaSLen Brown int status; 1402103a8feaSLen Brown 1403103a8feaSLen Brown /* parent */ 1404103a8feaSLen Brown if (child_pid == -1) { 1405103a8feaSLen Brown perror("fork"); 1406103a8feaSLen Brown exit(1); 1407103a8feaSLen Brown 
} 1408103a8feaSLen Brown 1409103a8feaSLen Brown signal(SIGINT, SIG_IGN); 1410103a8feaSLen Brown signal(SIGQUIT, SIG_IGN); 1411103a8feaSLen Brown if (waitpid(child_pid, &status, 0) == -1) { 1412103a8feaSLen Brown perror("wait"); 1413103a8feaSLen Brown exit(1); 1414103a8feaSLen Brown } 1415103a8feaSLen Brown } 1416*c98d5d94SLen Brown /* 1417*c98d5d94SLen Brown * n.b. fork_it() does not check for errors from for_all_cpus() 1418*c98d5d94SLen Brown * because re-starting is problematic when forking 1419*c98d5d94SLen Brown */ 1420*c98d5d94SLen Brown for_all_cpus(get_counters, ODD_COUNTERS); 1421103a8feaSLen Brown gettimeofday(&tv_odd, (struct timezone *)NULL); 1422103a8feaSLen Brown timersub(&tv_odd, &tv_even, &tv_delta); 1423*c98d5d94SLen Brown for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS); 1424*c98d5d94SLen Brown compute_average(EVEN_COUNTERS); 1425*c98d5d94SLen Brown format_all_counters(EVEN_COUNTERS); 1426*c98d5d94SLen Brown flush_stderr(); 1427103a8feaSLen Brown 14286eab04a8SJustin P. 
Mattock fprintf(stderr, "%.6f sec\n", tv_delta.tv_sec + tv_delta.tv_usec/1000000.0); 1429103a8feaSLen Brown 1430103a8feaSLen Brown return 0; 1431103a8feaSLen Brown } 1432103a8feaSLen Brown 1433103a8feaSLen Brown void cmdline(int argc, char **argv) 1434103a8feaSLen Brown { 1435103a8feaSLen Brown int opt; 1436103a8feaSLen Brown 1437103a8feaSLen Brown progname = argv[0]; 1438103a8feaSLen Brown 1439*c98d5d94SLen Brown while ((opt = getopt(argc, argv, "+cpsvi:M:")) != -1) { 1440103a8feaSLen Brown switch (opt) { 1441*c98d5d94SLen Brown case 'c': 1442*c98d5d94SLen Brown show_core_only++; 1443*c98d5d94SLen Brown break; 1444*c98d5d94SLen Brown case 'p': 1445*c98d5d94SLen Brown show_pkg_only++; 1446*c98d5d94SLen Brown break; 1447e23da037SLen Brown case 's': 1448e23da037SLen Brown summary_only++; 1449e23da037SLen Brown break; 1450103a8feaSLen Brown case 'v': 1451103a8feaSLen Brown verbose++; 1452103a8feaSLen Brown break; 1453103a8feaSLen Brown case 'i': 1454103a8feaSLen Brown interval_sec = atoi(optarg); 1455103a8feaSLen Brown break; 1456103a8feaSLen Brown case 'M': 1457103a8feaSLen Brown sscanf(optarg, "%x", &extra_msr_offset); 1458103a8feaSLen Brown if (verbose > 1) 1459103a8feaSLen Brown fprintf(stderr, "MSR 0x%X\n", extra_msr_offset); 1460103a8feaSLen Brown break; 1461103a8feaSLen Brown default: 1462103a8feaSLen Brown usage(); 1463103a8feaSLen Brown } 1464103a8feaSLen Brown } 1465103a8feaSLen Brown } 1466103a8feaSLen Brown 1467103a8feaSLen Brown int main(int argc, char **argv) 1468103a8feaSLen Brown { 1469103a8feaSLen Brown cmdline(argc, argv); 1470103a8feaSLen Brown 1471103a8feaSLen Brown if (verbose > 1) 1472*c98d5d94SLen Brown fprintf(stderr, "turbostat v2.0 May 16, 2012" 1473103a8feaSLen Brown " - Len Brown <lenb@kernel.org>\n"); 1474103a8feaSLen Brown 1475103a8feaSLen Brown turbostat_init(); 1476103a8feaSLen Brown 1477103a8feaSLen Brown /* 1478103a8feaSLen Brown * if any params left, it must be a command to fork 1479103a8feaSLen Brown */ 1480103a8feaSLen Brown if 
(argc - optind) 1481103a8feaSLen Brown return fork_it(argv + optind); 1482103a8feaSLen Brown else 1483103a8feaSLen Brown turbostat_loop(); 1484103a8feaSLen Brown 1485103a8feaSLen Brown return 0; 1486103a8feaSLen Brown } 1487