1b47b5b34SRafael Vanoni /* 2b47b5b34SRafael Vanoni * Copyright 2009, Intel Corporation 3b47b5b34SRafael Vanoni * Copyright 2009, Sun Microsystems, Inc 4b47b5b34SRafael Vanoni * 5b47b5b34SRafael Vanoni * This file is part of PowerTOP 6b47b5b34SRafael Vanoni * 7b47b5b34SRafael Vanoni * This program file is free software; you can redistribute it and/or modify it 8b47b5b34SRafael Vanoni * under the terms of the GNU General Public License as published by the 9b47b5b34SRafael Vanoni * Free Software Foundation; version 2 of the License. 10b47b5b34SRafael Vanoni * 11b47b5b34SRafael Vanoni * This program is distributed in the hope that it will be useful, but WITHOUT 12b47b5b34SRafael Vanoni * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 13b47b5b34SRafael Vanoni * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 14b47b5b34SRafael Vanoni * for more details. 15b47b5b34SRafael Vanoni * 16b47b5b34SRafael Vanoni * You should have received a copy of the GNU General Public License 17b47b5b34SRafael Vanoni * along with this program in a file named COPYING; if not, write to the 18b47b5b34SRafael Vanoni * Free Software Foundation, Inc., 19b47b5b34SRafael Vanoni * 51 Franklin Street, Fifth Floor, 20b47b5b34SRafael Vanoni * Boston, MA 02110-1301 USA 21b47b5b34SRafael Vanoni * 22b47b5b34SRafael Vanoni * Authors: 23b47b5b34SRafael Vanoni * Arjan van de Ven <arjan@linux.intel.com> 24b47b5b34SRafael Vanoni * Eric C Saxe <eric.saxe@sun.com> 25b47b5b34SRafael Vanoni * Aubrey Li <aubrey.li@intel.com> 26b47b5b34SRafael Vanoni */ 27b47b5b34SRafael Vanoni 28b47b5b34SRafael Vanoni /* 29b47b5b34SRafael Vanoni * GPL Disclaimer 30b47b5b34SRafael Vanoni * 31b47b5b34SRafael Vanoni * For the avoidance of doubt, except that if any license choice other 32b47b5b34SRafael Vanoni * than GPL or LGPL is available it will apply instead, Sun elects to 33b47b5b34SRafael Vanoni * use only the General Public License version 2 (GPLv2) at this time 34b47b5b34SRafael Vanoni * for any software where a choice of GPL license versions is made 35b47b5b34SRafael Vanoni * available with the language indicating that GPLv2 or any later 36b47b5b34SRafael Vanoni * version may be used, or where a choice of which version of the GPL 37b47b5b34SRafael Vanoni * is applied is otherwise unspecified. 38b47b5b34SRafael Vanoni */ 39b47b5b34SRafael Vanoni 40b47b5b34SRafael Vanoni #include <stdlib.h> 41b47b5b34SRafael Vanoni #include <string.h> 42b47b5b34SRafael Vanoni #include <dtrace.h> 43b47b5b34SRafael Vanoni #include <kstat.h> 44b47b5b34SRafael Vanoni #include <errno.h> 45b47b5b34SRafael Vanoni #include "powertop.h" 46b47b5b34SRafael Vanoni 47*636423dbSRafael Vanoni #define HZ2MHZ(speed) ((speed) / MICROSEC) 48b47b5b34SRafael Vanoni #define DTP_ARG_COUNT 2 49b47b5b34SRafael Vanoni #define DTP_ARG_LENGTH 5 50b47b5b34SRafael Vanoni 51b47b5b34SRafael Vanoni static uint64_t max_cpufreq = 0; 52b47b5b34SRafael Vanoni static dtrace_hdl_t *dtp; 53b47b5b34SRafael Vanoni static char **dtp_argv; 54b47b5b34SRafael Vanoni 55b47b5b34SRafael Vanoni /* 56b47b5b34SRafael Vanoni * Enabling PM through /etc/power.conf 57b47b5b34SRafael Vanoni * See suggest_p_state() 58b47b5b34SRafael Vanoni */ 59b47b5b34SRafael Vanoni static char default_conf[] = "/etc/power.conf"; 60b47b5b34SRafael Vanoni static char default_pmconf[] = "/usr/sbin/pmconfig"; 61b47b5b34SRafael Vanoni static char cpupm_enable[] = " echo cpupm enable >> /etc/power.conf"; 62b47b5b34SRafael Vanoni static char cpupm_treshold[] = " echo cpu-threshold 1s >> /etc/power.conf"; 63b47b5b34SRafael Vanoni 64b47b5b34SRafael Vanoni /* 65b47b5b34SRafael Vanoni * Buffer containing DTrace program to track CPU frequency transitions 66b47b5b34SRafael Vanoni */ 67b47b5b34SRafael Vanoni static const char *dtp_cpufreq = 68b47b5b34SRafael Vanoni "hrtime_t last[$0];" 69b47b5b34SRafael Vanoni "" 70b47b5b34SRafael Vanoni "BEGIN" 71b47b5b34SRafael Vanoni "{" 72b47b5b34SRafael Vanoni " begin = timestamp;" 73b47b5b34SRafael Vanoni "}" 74b47b5b34SRafael Vanoni "" 75b47b5b34SRafael Vanoni ":::cpu-change-speed" 76b47b5b34SRafael Vanoni "/last[(processorid_t)arg0] != 0/" 77b47b5b34SRafael Vanoni "{" 78b47b5b34SRafael Vanoni " this->cpu = (processorid_t)arg0;" 79*636423dbSRafael Vanoni " this->oldspeed = (uint64_t)arg1;" 80b47b5b34SRafael Vanoni " @times[this->cpu, this->oldspeed] = sum(timestamp - last[this->cpu]);" 81b47b5b34SRafael Vanoni " last[this->cpu] = timestamp;" 82b47b5b34SRafael Vanoni "}" 83b47b5b34SRafael Vanoni ":::cpu-change-speed" 84b47b5b34SRafael Vanoni "/last[(processorid_t)arg0] == 0/" 85b47b5b34SRafael Vanoni "{" 86b47b5b34SRafael Vanoni " this->cpu = (processorid_t)arg0;" 87*636423dbSRafael Vanoni " this->oldspeed = (uint64_t)arg1;" 88b47b5b34SRafael Vanoni " @times[this->cpu, this->oldspeed] = sum(timestamp - begin);" 89b47b5b34SRafael Vanoni " last[this->cpu] = timestamp;" 90b47b5b34SRafael Vanoni "}"; 91b47b5b34SRafael Vanoni 92b47b5b34SRafael Vanoni /* 93b47b5b34SRafael Vanoni * Same as above, but only for a specific CPU 94b47b5b34SRafael Vanoni */ 95b47b5b34SRafael Vanoni static const char *dtp_cpufreq_c = 96b47b5b34SRafael Vanoni "hrtime_t last;" 97b47b5b34SRafael Vanoni "" 98b47b5b34SRafael Vanoni "BEGIN" 99b47b5b34SRafael Vanoni "{" 100b47b5b34SRafael Vanoni " begin = timestamp;" 101b47b5b34SRafael Vanoni "}" 102b47b5b34SRafael Vanoni "" 103b47b5b34SRafael Vanoni ":::cpu-change-speed" 104b47b5b34SRafael Vanoni "/(processorid_t)arg0 == $1 &&" 105b47b5b34SRafael Vanoni " last != 0/" 106b47b5b34SRafael Vanoni "{" 107b47b5b34SRafael Vanoni " this->cpu = (processorid_t)arg0;" 108*636423dbSRafael Vanoni " this->oldspeed = (uint64_t)arg1;" 109b47b5b34SRafael Vanoni " @times[this->cpu, this->oldspeed] = sum(timestamp - last);" 110b47b5b34SRafael Vanoni " last = timestamp;" 111b47b5b34SRafael Vanoni "}" 112b47b5b34SRafael Vanoni ":::cpu-change-speed" 113b47b5b34SRafael Vanoni "/(processorid_t)arg0 == $1 &&" 114b47b5b34SRafael Vanoni " last == 0/" 115b47b5b34SRafael Vanoni "{" 116b47b5b34SRafael Vanoni " this->cpu = (processorid_t)arg0;" 117*636423dbSRafael Vanoni " this->oldspeed = (uint64_t)arg1;" 118b47b5b34SRafael Vanoni " @times[this->cpu, this->oldspeed] = sum(timestamp - begin);" 119b47b5b34SRafael Vanoni " last = timestamp;" 120b47b5b34SRafael Vanoni "}"; 121b47b5b34SRafael Vanoni 122b47b5b34SRafael Vanoni static int pt_cpufreq_setup(void); 123b47b5b34SRafael Vanoni static int pt_cpufreq_snapshot(void); 124b47b5b34SRafael Vanoni static int pt_cpufreq_dtrace_walk(const dtrace_aggdata_t *, void *); 125b47b5b34SRafael Vanoni static void pt_cpufreq_stat_account(double, uint_t); 126b47b5b34SRafael Vanoni static int pt_cpufreq_snapshot_cpu(kstat_ctl_t *, 127b47b5b34SRafael Vanoni uint_t); 128b47b5b34SRafael Vanoni 129b47b5b34SRafael Vanoni static int 130b47b5b34SRafael Vanoni pt_cpufreq_setup(void) 131b47b5b34SRafael Vanoni { 132b47b5b34SRafael Vanoni if ((dtp_argv = malloc(sizeof (char *) * DTP_ARG_COUNT)) == NULL) 133b47b5b34SRafael Vanoni return (EXIT_FAILURE); 134b47b5b34SRafael Vanoni 135b47b5b34SRafael Vanoni if ((dtp_argv[0] = malloc(sizeof (char) * DTP_ARG_LENGTH)) == NULL) { 136b47b5b34SRafael Vanoni free(dtp_argv); 137b47b5b34SRafael Vanoni return (EXIT_FAILURE); 138b47b5b34SRafael Vanoni } 139b47b5b34SRafael Vanoni 140b47b5b34SRafael Vanoni (void) snprintf(dtp_argv[0], 5, "%d\0", g_ncpus_observed); 141b47b5b34SRafael Vanoni 142*636423dbSRafael Vanoni if (PT_ON_CPU) { 143b47b5b34SRafael Vanoni if ((dtp_argv[1] = malloc(sizeof (char) * DTP_ARG_LENGTH)) 144b47b5b34SRafael Vanoni == NULL) { 145b47b5b34SRafael Vanoni free(dtp_argv[0]); 146b47b5b34SRafael Vanoni free(dtp_argv); 147b47b5b34SRafael Vanoni return (EXIT_FAILURE); 148b47b5b34SRafael Vanoni } 149b47b5b34SRafael Vanoni (void) snprintf(dtp_argv[1], 5, "%d\0", g_observed_cpu); 150b47b5b34SRafael Vanoni } 151b47b5b34SRafael Vanoni 152b47b5b34SRafael Vanoni return (0); 153b47b5b34SRafael Vanoni } 154b47b5b34SRafael Vanoni 155b47b5b34SRafael Vanoni /* 156b47b5b34SRafael Vanoni * Perform setup necessary to enumerate and track CPU speed changes 157b47b5b34SRafael Vanoni */ 158b47b5b34SRafael Vanoni int 159b47b5b34SRafael Vanoni pt_cpufreq_stat_prepare(void) 160b47b5b34SRafael Vanoni { 161b47b5b34SRafael Vanoni dtrace_prog_t *prog; 162b47b5b34SRafael Vanoni dtrace_proginfo_t info; 163b47b5b34SRafael Vanoni dtrace_optval_t statustime; 164b47b5b34SRafael Vanoni kstat_ctl_t *kc; 165b47b5b34SRafael Vanoni kstat_t *ksp; 166b47b5b34SRafael Vanoni kstat_named_t *knp; 167b47b5b34SRafael Vanoni freq_state_info_t *state; 168b47b5b34SRafael Vanoni char *s, *token, *prog_ptr; 169b47b5b34SRafael Vanoni int err; 170b47b5b34SRafael Vanoni 171b47b5b34SRafael Vanoni if ((err = pt_cpufreq_setup()) != 0) { 172b47b5b34SRafael Vanoni pt_error("%s : failed to setup", __FILE__); 173b47b5b34SRafael Vanoni return (errno); 174b47b5b34SRafael Vanoni } 175b47b5b34SRafael Vanoni 176b47b5b34SRafael Vanoni state = g_pstate_info; 177b47b5b34SRafael Vanoni if ((g_cpu_power_states = calloc((size_t)g_ncpus, 178b47b5b34SRafael Vanoni sizeof (cpu_power_info_t))) == NULL) 179b47b5b34SRafael Vanoni return (-1); 180b47b5b34SRafael Vanoni 181b47b5b34SRafael Vanoni /* 182b47b5b34SRafael Vanoni * Enumerate the CPU frequencies 183b47b5b34SRafael Vanoni */ 184b47b5b34SRafael Vanoni if ((kc = kstat_open()) == NULL) 185b47b5b34SRafael Vanoni return (errno); 186b47b5b34SRafael Vanoni 187b47b5b34SRafael Vanoni ksp = kstat_lookup(kc, "cpu_info", g_cpu_table[g_observed_cpu], NULL); 188b47b5b34SRafael Vanoni 189b47b5b34SRafael Vanoni if (ksp == NULL) { 190b47b5b34SRafael Vanoni err = errno; 191b47b5b34SRafael Vanoni (void) kstat_close(kc); 192b47b5b34SRafael Vanoni return (err); 193b47b5b34SRafael Vanoni } 194b47b5b34SRafael Vanoni 195b47b5b34SRafael Vanoni (void) kstat_read(kc, ksp, NULL); 196b47b5b34SRafael Vanoni 197b47b5b34SRafael Vanoni knp = kstat_data_lookup(ksp, "supported_frequencies_Hz"); 198b47b5b34SRafael Vanoni s = knp->value.str.addr.ptr; 199b47b5b34SRafael Vanoni 200b47b5b34SRafael Vanoni g_npstates = 0; 201b47b5b34SRafael Vanoni 202b47b5b34SRafael Vanoni for (token = strtok(s, ":"), s = NULL; 203b47b5b34SRafael Vanoni NULL != token && g_npstates < NSTATES; 204b47b5b34SRafael Vanoni token = strtok(NULL, ":")) { 205b47b5b34SRafael Vanoni 206b47b5b34SRafael Vanoni state->speed = HZ2MHZ(atoll(token)); 207b47b5b34SRafael Vanoni 208b47b5b34SRafael Vanoni if (state->speed > max_cpufreq) 209b47b5b34SRafael Vanoni max_cpufreq = state->speed; 210b47b5b34SRafael Vanoni 211b47b5b34SRafael Vanoni state->total_time = (uint64_t)0; 212b47b5b34SRafael Vanoni 213b47b5b34SRafael Vanoni g_npstates++; 214b47b5b34SRafael Vanoni state++; 215b47b5b34SRafael Vanoni } 216b47b5b34SRafael Vanoni 217b47b5b34SRafael Vanoni if (token != NULL) 218b47b5b34SRafael Vanoni pt_error("%s : exceeded NSTATES\n", __FILE__); 219b47b5b34SRafael Vanoni 220b47b5b34SRafael Vanoni (void) kstat_close(kc); 221b47b5b34SRafael Vanoni 222b47b5b34SRafael Vanoni /* 223b47b5b34SRafael Vanoni * Return if speed transition is not supported 224b47b5b34SRafael Vanoni */ 225b47b5b34SRafael Vanoni if (g_npstates < 2) 226b47b5b34SRafael Vanoni return (-1); 227b47b5b34SRafael Vanoni 228b47b5b34SRafael Vanoni /* 229b47b5b34SRafael Vanoni * Setup DTrace to look for CPU frequency changes 230b47b5b34SRafael Vanoni */ 231b47b5b34SRafael Vanoni if ((dtp = dtrace_open(DTRACE_VERSION, 0, &err)) == NULL) { 232b47b5b34SRafael Vanoni pt_error("%s : cannot open dtrace library: %s\n", __FILE__, 233b47b5b34SRafael Vanoni dtrace_errmsg(NULL, err)); 234b47b5b34SRafael Vanoni return (-2); 235b47b5b34SRafael Vanoni } 236b47b5b34SRafael Vanoni 237b47b5b34SRafael Vanoni /* 238b47b5b34SRafael Vanoni * Execute different scripts (defined above) depending on 239b47b5b34SRafael Vanoni * user specified options. Default mode uses dtp_cpufreq. 240b47b5b34SRafael Vanoni */ 241*636423dbSRafael Vanoni if (PT_ON_CPU) 242b47b5b34SRafael Vanoni prog_ptr = (char *)dtp_cpufreq_c; 243b47b5b34SRafael Vanoni else 244b47b5b34SRafael Vanoni prog_ptr = (char *)dtp_cpufreq; 245b47b5b34SRafael Vanoni 246b47b5b34SRafael Vanoni if ((prog = dtrace_program_strcompile(dtp, prog_ptr, 247b47b5b34SRafael Vanoni DTRACE_PROBESPEC_NAME, 0, (1 + g_argc), dtp_argv)) == NULL) { 248b47b5b34SRafael Vanoni pt_error("%s : cpu-change-speed probe unavailable\n", __FILE__); 249b47b5b34SRafael Vanoni return (dtrace_errno(dtp)); 250b47b5b34SRafael Vanoni } 251b47b5b34SRafael Vanoni 252b47b5b34SRafael Vanoni if (dtrace_program_exec(dtp, prog, &info) == -1) { 253b47b5b34SRafael Vanoni pt_error("%s : failed to enable speed probe\n", __FILE__); 254b47b5b34SRafael Vanoni return (dtrace_errno(dtp)); 255b47b5b34SRafael Vanoni } 256b47b5b34SRafael Vanoni 257b47b5b34SRafael Vanoni if (dtrace_setopt(dtp, "aggsize", "128k") == -1) { 258b47b5b34SRafael Vanoni pt_error("%s : failed to set speed 'aggsize'\n", __FILE__); 259b47b5b34SRafael Vanoni } 260b47b5b34SRafael Vanoni 261b47b5b34SRafael Vanoni if (dtrace_setopt(dtp, "aggrate", "0") == -1) { 262b47b5b34SRafael Vanoni pt_error("%s : failed to set speed 'aggrate'\n", __FILE__); 263b47b5b34SRafael Vanoni } 264b47b5b34SRafael Vanoni 265b47b5b34SRafael Vanoni if (dtrace_setopt(dtp, "aggpercpu", 0) == -1) { 266b47b5b34SRafael Vanoni pt_error("%s : failed to set speed 'aggpercpu'\n", __FILE__); 267b47b5b34SRafael Vanoni } 268b47b5b34SRafael Vanoni 269b47b5b34SRafael Vanoni if (dtrace_go(dtp) != 0) { 270b47b5b34SRafael Vanoni pt_error("%s : failed to start speed observation", __FILE__); 271b47b5b34SRafael Vanoni return (dtrace_errno(dtp)); 272b47b5b34SRafael Vanoni } 273b47b5b34SRafael Vanoni 274b47b5b34SRafael Vanoni if (dtrace_getopt(dtp, "statusrate", &statustime) == -1) { 275b47b5b34SRafael Vanoni pt_error("%s : failed to get speed 'statusrate'\n", __FILE__); 276b47b5b34SRafael Vanoni return (dtrace_errno(dtp)); 277b47b5b34SRafael Vanoni } 278b47b5b34SRafael Vanoni 279b47b5b34SRafael Vanoni return (0); 280b47b5b34SRafael Vanoni } 281b47b5b34SRafael Vanoni 282b47b5b34SRafael Vanoni /* 283b47b5b34SRafael Vanoni * The DTrace probes have already been enabled, and are tracking 284b47b5b34SRafael Vanoni * CPU speed transitions. Take a snapshot of the aggregations, and 285b47b5b34SRafael Vanoni * look for any CPUs that have made a speed transition over the last 286b47b5b34SRafael Vanoni * sampling interval. Note that the aggregations may be empty if no 287b47b5b34SRafael Vanoni * speed transitions took place over the last interval. In that case, 288b47b5b34SRafael Vanoni * notate that we have already accounted for the time, so that when 289b47b5b34SRafael Vanoni * we do encounter a speed transition in a future sampling interval 290b47b5b34SRafael Vanoni * we can subtract that time back out. 291b47b5b34SRafael Vanoni */ 292b47b5b34SRafael Vanoni int 293b47b5b34SRafael Vanoni pt_cpufreq_stat_collect(double interval) 294b47b5b34SRafael Vanoni { 295b47b5b34SRafael Vanoni int i, ret; 296b47b5b34SRafael Vanoni 297b47b5b34SRafael Vanoni /* 298b47b5b34SRafael Vanoni * Zero out the interval time reported by DTrace for 299b47b5b34SRafael Vanoni * this interval 300b47b5b34SRafael Vanoni */ 301b47b5b34SRafael Vanoni for (i = 0; i < g_npstates; i++) 302b47b5b34SRafael Vanoni g_pstate_info[i].total_time = 0; 303b47b5b34SRafael Vanoni 304b47b5b34SRafael Vanoni for (i = 0; i < g_ncpus; i++) 305b47b5b34SRafael Vanoni g_cpu_power_states[i].dtrace_time = 0; 306b47b5b34SRafael Vanoni 307b47b5b34SRafael Vanoni if (dtrace_status(dtp) == -1) 308b47b5b34SRafael Vanoni return (-1); 309b47b5b34SRafael Vanoni 310b47b5b34SRafael Vanoni if (dtrace_aggregate_snap(dtp) != 0) 311b47b5b34SRafael Vanoni pt_error("%s : failed to add to stats aggregation", __FILE__); 312b47b5b34SRafael Vanoni 313b47b5b34SRafael Vanoni if (dtrace_aggregate_walk_keyvarsorted(dtp, pt_cpufreq_dtrace_walk, 314b47b5b34SRafael Vanoni NULL) != 0) 315b47b5b34SRafael Vanoni pt_error("%s : failed to sort stats aggregation", __FILE__); 316b47b5b34SRafael Vanoni 317b47b5b34SRafael Vanoni dtrace_aggregate_clear(dtp); 318b47b5b34SRafael Vanoni 319b47b5b34SRafael Vanoni if ((ret = pt_cpufreq_snapshot()) != 0) { 320b47b5b34SRafael Vanoni pt_error("%s : failed to add to stats aggregation", __FILE__); 321b47b5b34SRafael Vanoni return (ret); 322b47b5b34SRafael Vanoni } 323b47b5b34SRafael Vanoni 324b47b5b34SRafael Vanoni switch (g_op_mode) { 325*636423dbSRafael Vanoni case PT_MODE_CPU: 326b47b5b34SRafael Vanoni pt_cpufreq_stat_account(interval, g_observed_cpu); 327b47b5b34SRafael Vanoni break; 328*636423dbSRafael Vanoni case PT_MODE_DEFAULT: 329b47b5b34SRafael Vanoni default: 330b47b5b34SRafael Vanoni for (i = 0; i < g_ncpus_observed; i++) 331b47b5b34SRafael Vanoni pt_cpufreq_stat_account(interval, i); 332b47b5b34SRafael Vanoni break; 333b47b5b34SRafael Vanoni } 334b47b5b34SRafael Vanoni 335b47b5b34SRafael Vanoni return (0); 336b47b5b34SRafael Vanoni } 337b47b5b34SRafael Vanoni 338b47b5b34SRafael Vanoni static void 339b47b5b34SRafael Vanoni pt_cpufreq_stat_account(double interval, uint_t cpu) 340b47b5b34SRafael Vanoni { 341*636423dbSRafael Vanoni cpu_power_info_t *cpu_pow; 342b47b5b34SRafael Vanoni uint64_t speed; 343b47b5b34SRafael Vanoni hrtime_t duration; 344b47b5b34SRafael Vanoni int i; 345b47b5b34SRafael Vanoni 346b47b5b34SRafael Vanoni cpu_pow = &g_cpu_power_states[cpu]; 347b47b5b34SRafael Vanoni speed = cpu_pow->current_pstate; 348b47b5b34SRafael Vanoni 349*636423dbSRafael Vanoni duration = (hrtime_t)(interval * NANOSEC) - cpu_pow->dtrace_time; 350*636423dbSRafael Vanoni 351*636423dbSRafael Vanoni /* 352*636423dbSRafael Vanoni * 'duration' may be a negative value when we're using or forcing a 353*636423dbSRafael Vanoni * small interval, and the amount of time already accounted ends up 354*636423dbSRafael Vanoni * being larger than the the former. 355*636423dbSRafael Vanoni */ 356*636423dbSRafael Vanoni if (duration < 0) 357*636423dbSRafael Vanoni return; 358b47b5b34SRafael Vanoni 359b47b5b34SRafael Vanoni for (i = 0; i < g_npstates; i++) { 360b47b5b34SRafael Vanoni if (g_pstate_info[i].speed == speed) { 361b47b5b34SRafael Vanoni g_pstate_info[i].total_time += duration; 362b47b5b34SRafael Vanoni cpu_pow->time_accounted += duration; 363*636423dbSRafael Vanoni cpu_pow->speed_accounted = speed; 364b47b5b34SRafael Vanoni } 365b47b5b34SRafael Vanoni } 366b47b5b34SRafael Vanoni } 367b47b5b34SRafael Vanoni 368b47b5b34SRafael Vanoni /* 369b47b5b34SRafael Vanoni * Take a snapshot of each CPU's speed by looking through the cpu_info kstats. 370b47b5b34SRafael Vanoni */ 371b47b5b34SRafael Vanoni static int 372b47b5b34SRafael Vanoni pt_cpufreq_snapshot(void) 373b47b5b34SRafael Vanoni { 374b47b5b34SRafael Vanoni kstat_ctl_t *kc; 375b47b5b34SRafael Vanoni int ret; 376b47b5b34SRafael Vanoni uint_t i; 377b47b5b34SRafael Vanoni 378b47b5b34SRafael Vanoni if ((kc = kstat_open()) == NULL) 379b47b5b34SRafael Vanoni return (errno); 380b47b5b34SRafael Vanoni 381b47b5b34SRafael Vanoni switch (g_op_mode) { 382*636423dbSRafael Vanoni case PT_MODE_CPU: 383b47b5b34SRafael Vanoni ret = pt_cpufreq_snapshot_cpu(kc, g_observed_cpu); 384b47b5b34SRafael Vanoni break; 385*636423dbSRafael Vanoni case PT_MODE_DEFAULT: 386b47b5b34SRafael Vanoni default: 387b47b5b34SRafael Vanoni for (i = 0; i < g_ncpus_observed; i++) 388b47b5b34SRafael Vanoni if ((ret = pt_cpufreq_snapshot_cpu(kc, i)) != 0) 389b47b5b34SRafael Vanoni break; 390b47b5b34SRafael Vanoni break; 391b47b5b34SRafael Vanoni } 392b47b5b34SRafael Vanoni 393b47b5b34SRafael Vanoni if (kstat_close(kc) != 0) 394b47b5b34SRafael Vanoni pt_error("%s : couldn't close kstat\n", __FILE__); 395b47b5b34SRafael Vanoni 396b47b5b34SRafael Vanoni return (ret); 397b47b5b34SRafael Vanoni } 398b47b5b34SRafael Vanoni 399b47b5b34SRafael Vanoni static int 400b47b5b34SRafael Vanoni pt_cpufreq_snapshot_cpu(kstat_ctl_t *kc, uint_t cpu) 401b47b5b34SRafael Vanoni { 402b47b5b34SRafael Vanoni kstat_t *ksp; 403b47b5b34SRafael Vanoni kstat_named_t *knp; 404b47b5b34SRafael Vanoni 405b47b5b34SRafael Vanoni ksp = kstat_lookup(kc, "cpu_info", g_cpu_table[cpu], NULL); 406b47b5b34SRafael Vanoni if (ksp == NULL) { 407b47b5b34SRafael Vanoni pt_error("%s : couldn't find cpu_info kstat for CPU " 408b47b5b34SRafael Vanoni "%d\n", __FILE__, cpu); 409b47b5b34SRafael Vanoni return (1); 410b47b5b34SRafael Vanoni } 411b47b5b34SRafael Vanoni 412b47b5b34SRafael Vanoni if (kstat_read(kc, ksp, NULL) == -1) { 413b47b5b34SRafael Vanoni pt_error("%s : couldn't read cpu_info kstat for " 414b47b5b34SRafael Vanoni "CPU %d\n", __FILE__, cpu); 415b47b5b34SRafael Vanoni return (2); 416b47b5b34SRafael Vanoni } 417b47b5b34SRafael Vanoni 418b47b5b34SRafael Vanoni knp = kstat_data_lookup(ksp, "current_clock_Hz"); 419b47b5b34SRafael Vanoni if (knp == NULL) { 420b47b5b34SRafael Vanoni pt_error("%s : couldn't find current_clock_Hz " 421b47b5b34SRafael Vanoni "kstat for CPU %d\n", __FILE__, cpu); 422b47b5b34SRafael Vanoni return (3); 423b47b5b34SRafael Vanoni } 424b47b5b34SRafael Vanoni 425b47b5b34SRafael Vanoni g_cpu_power_states[cpu].current_pstate = HZ2MHZ(knp->value.ui64); 426b47b5b34SRafael Vanoni 427b47b5b34SRafael Vanoni return (0); 428b47b5b34SRafael Vanoni } 429b47b5b34SRafael Vanoni 430b47b5b34SRafael Vanoni /* 431b47b5b34SRafael Vanoni * DTrace aggregation walker that sorts through a snapshot of the 432b47b5b34SRafael Vanoni * aggregation data collected during firings of the cpu-change-speed 433b47b5b34SRafael Vanoni * probe. 434b47b5b34SRafael Vanoni */ 435b47b5b34SRafael Vanoni /*ARGSUSED*/ 436b47b5b34SRafael Vanoni static int 437b47b5b34SRafael Vanoni pt_cpufreq_dtrace_walk(const dtrace_aggdata_t *data, void *arg) 438b47b5b34SRafael Vanoni { 439b47b5b34SRafael Vanoni dtrace_aggdesc_t *aggdesc = data->dtada_desc; 440b47b5b34SRafael Vanoni dtrace_recdesc_t *cpu_rec, *speed_rec; 441*636423dbSRafael Vanoni cpu_power_info_t *cp; 442b47b5b34SRafael Vanoni int32_t cpu; 443b47b5b34SRafael Vanoni uint64_t speed; 444*636423dbSRafael Vanoni hrtime_t res; 445b47b5b34SRafael Vanoni int i; 446b47b5b34SRafael Vanoni 447b47b5b34SRafael Vanoni if (strcmp(aggdesc->dtagd_name, "times") == 0) { 448b47b5b34SRafael Vanoni cpu_rec = &aggdesc->dtagd_rec[1]; 449b47b5b34SRafael Vanoni speed_rec = &aggdesc->dtagd_rec[2]; 450b47b5b34SRafael Vanoni 451b47b5b34SRafael Vanoni /* LINTED - alignment */ 452b47b5b34SRafael Vanoni cpu = *(int32_t *)(data->dtada_data + cpu_rec->dtrd_offset); 453*636423dbSRafael Vanoni 454*636423dbSRafael Vanoni /* LINTED - alignment */ 455*636423dbSRafael Vanoni res = *((hrtime_t *)(data->dtada_percpu[cpu])); 456*636423dbSRafael Vanoni 457b47b5b34SRafael Vanoni /* LINTED - alignment */ 458b47b5b34SRafael Vanoni speed = *(uint64_t *)(data->dtada_data + 459b47b5b34SRafael Vanoni speed_rec->dtrd_offset); 460b47b5b34SRafael Vanoni 461*636423dbSRafael Vanoni if (speed == 0) 462b47b5b34SRafael Vanoni speed = max_cpufreq; 463*636423dbSRafael Vanoni else 464*636423dbSRafael Vanoni speed = HZ2MHZ(speed); 465b47b5b34SRafael Vanoni 466b47b5b34SRafael Vanoni /* 467b47b5b34SRafael Vanoni * We have an aggregation record for "cpu" being at "speed" 468b47b5b34SRafael Vanoni * for an interval of "n" nanoseconds. The reported interval 469b47b5b34SRafael Vanoni * may exceed the powertop sampling interval, since we only 470b47b5b34SRafael Vanoni * notice during potentially infrequent firings of the 471b47b5b34SRafael Vanoni * "speed change" DTrace probe. In this case powertop would 472b47b5b34SRafael Vanoni * have already accounted for the portions of the interval 473b47b5b34SRafael Vanoni * that happened during prior powertop samplings, so subtract 474b47b5b34SRafael Vanoni * out time already accounted. 475b47b5b34SRafael Vanoni */ 476*636423dbSRafael Vanoni cp = &g_cpu_power_states[cpu]; 477b47b5b34SRafael Vanoni 478b47b5b34SRafael Vanoni for (i = 0; i < g_npstates; i++) { 479b47b5b34SRafael Vanoni if (g_pstate_info[i].speed == speed) { 480*636423dbSRafael Vanoni 481*636423dbSRafael Vanoni if (cp->time_accounted > 0 && 482*636423dbSRafael Vanoni cp->speed_accounted == speed) { 483*636423dbSRafael Vanoni if (res > cp->time_accounted) { 484*636423dbSRafael Vanoni res -= cp->time_accounted; 485*636423dbSRafael Vanoni cp->time_accounted = 0; 486*636423dbSRafael Vanoni cp->speed_accounted = 0; 487*636423dbSRafael Vanoni } else { 488*636423dbSRafael Vanoni return (DTRACE_AGGWALK_NEXT); 489b47b5b34SRafael Vanoni } 490b47b5b34SRafael Vanoni } 491*636423dbSRafael Vanoni 492*636423dbSRafael Vanoni g_pstate_info[i].total_time += res; 493*636423dbSRafael Vanoni cp->dtrace_time += res; 494b47b5b34SRafael Vanoni } 495b47b5b34SRafael Vanoni } 496b47b5b34SRafael Vanoni } 497*636423dbSRafael Vanoni 498b47b5b34SRafael Vanoni return (DTRACE_AGGWALK_NEXT); 499b47b5b34SRafael Vanoni } 500b47b5b34SRafael Vanoni 501b47b5b34SRafael Vanoni /* 502b47b5b34SRafael Vanoni * Used as a suggestion, sets PM in /etc/power.conf and 503b47b5b34SRafael Vanoni * a 1sec threshold, then calls /usr/sbin/pmconfig 504b47b5b34SRafael Vanoni */ 505b47b5b34SRafael Vanoni void 506b47b5b34SRafael Vanoni enable_p_state(void) 507b47b5b34SRafael Vanoni { 508b47b5b34SRafael Vanoni (void) system(cpupm_enable); 509b47b5b34SRafael Vanoni (void) system(cpupm_treshold); 510b47b5b34SRafael Vanoni (void) system(default_pmconf); 511b47b5b34SRafael Vanoni } 512b47b5b34SRafael Vanoni 513b47b5b34SRafael Vanoni /* 514b47b5b34SRafael Vanoni * Checks if PM is enabled in /etc/power.conf, enabling if not 515b47b5b34SRafael Vanoni */ 516b47b5b34SRafael Vanoni void 517b47b5b34SRafael Vanoni suggest_p_state(void) 518b47b5b34SRafael Vanoni { 519b47b5b34SRafael Vanoni char line[1024]; 520b47b5b34SRafael Vanoni FILE *file; 521b47b5b34SRafael Vanoni 522b47b5b34SRafael Vanoni /* 523b47b5b34SRafael Vanoni * Return if speed transition is not supported 524b47b5b34SRafael Vanoni */ 525b47b5b34SRafael Vanoni if (g_npstates < 2) 526b47b5b34SRafael Vanoni return; 527b47b5b34SRafael Vanoni 528b47b5b34SRafael Vanoni file = fopen(default_conf, "r"); 529b47b5b34SRafael Vanoni 530b47b5b34SRafael Vanoni if (!file) 531b47b5b34SRafael Vanoni return; 532b47b5b34SRafael Vanoni 533b47b5b34SRafael Vanoni (void) memset(line, 0, 1024); 534b47b5b34SRafael Vanoni 535b47b5b34SRafael Vanoni while (fgets(line, 1023, file)) { 536b47b5b34SRafael Vanoni if (strstr(line, "cpupm")) { 537b47b5b34SRafael Vanoni if (strstr(line, "enable")) { 538b47b5b34SRafael Vanoni (void) fclose(file); 539b47b5b34SRafael Vanoni return; 540b47b5b34SRafael Vanoni } 541b47b5b34SRafael Vanoni } 542b47b5b34SRafael Vanoni } 543b47b5b34SRafael Vanoni 544b47b5b34SRafael Vanoni add_suggestion("Suggestion: enable CPU power management by " 545b47b5b34SRafael Vanoni "pressing the P key", 40, 'P', "P - Enable p-state", 546b47b5b34SRafael Vanoni enable_p_state); 547b47b5b34SRafael Vanoni 548b47b5b34SRafael Vanoni (void) fclose(file); 549b47b5b34SRafael Vanoni } 550