/* * Copyright 2009, Intel Corporation * Copyright 2009, Sun Microsystems, Inc * * This file is part of PowerTOP * * This program file is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License as published by the * Free Software Foundation; version 2 of the License. * * This program is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * for more details. * * You should have received a copy of the GNU General Public License * along with this program in a file named COPYING; if not, write to the * Free Software Foundation, Inc., * 51 Franklin Street, Fifth Floor, * Boston, MA 02110-1301 USA * * Authors: * Arjan van de Ven * Eric C Saxe * Aubrey Li */ /* * GPL Disclaimer * * For the avoidance of doubt, except that if any license choice other * than GPL or LGPL is available it will apply instead, Sun elects to * use only the General Public License version 2 (GPLv2) at this time * for any software where a choice of GPL license versions is made * available with the language indicating that GPLv2 or any later * version may be used, or where a choice of which version of the GPL * is applied is otherwise unspecified. */ #include #include #include "powertop.h" static dtrace_hdl_t *dtp; /* * Buffer containing DTrace program to track CPU idle state transitions */ static const char *dtp_cpuidle = ":::idle-state-transition" "/arg0 != 0/" "{" " self->start = timestamp;" " self->state = arg0;" "}" "" ":::idle-state-transition" "/arg0 == 0 && self->start/" "{" " @number[self->state] = count();" " @times[self->state] = sum((timestamp - self->start)/1000000);" " self->start = 0;" " self->state = 0;" "}"; /* * Same as above but only for a specific CPU */ static const char *dtp_cpuidle_c = ":::idle-state-transition" "/cpu == $0 &&" " arg0 != 0/" "{" " self->start = timestamp;" " self->state = arg0;" "}" "" ":::idle-state-transition" "/cpu == $0 &&" " arg0 == 0 && self->start/" "{" " @number[self->state] = count();" " @times[self->state] = sum((timestamp - self->start)/1000000);" " self->start = 0;" " self->state = 0;" "}"; static int pt_cpuidle_dtrace_walk(const dtrace_aggdata_t *, void *); /* * Perform setup necessary to track CPU idle state transitions */ int pt_cpuidle_stat_prepare(void) { dtrace_prog_t *prog; dtrace_proginfo_t info; dtrace_optval_t statustime; int err; char *prog_ptr; if ((dtp = dtrace_open(DTRACE_VERSION, 0, &err)) == NULL) { pt_error("%s : cannot open dtrace library: %s\n", __FILE__, dtrace_errmsg(NULL, err)); return (-1); } /* * Execute different scripts (defined above) depending on * user specified options. */ if (PTOP_ON_CPU) prog_ptr = (char *)dtp_cpuidle_c; else prog_ptr = (char *)dtp_cpuidle; if ((prog = dtrace_program_strcompile(dtp, prog_ptr, DTRACE_PROBESPEC_NAME, 0, g_argc, g_argv)) == NULL) { pt_error("%s : C-State DTrace probes unavailable\n", __FILE__); return (dtrace_errno(dtp)); } if (dtrace_program_exec(dtp, prog, &info) == -1) { pt_error("%s : failed to enable C State probes\n", __FILE__); return (dtrace_errno(dtp)); } if (dtrace_setopt(dtp, "aggsize", "128k") == -1) { pt_error("%s : failed to set C-state 'aggsize'\n", __FILE__); } if (dtrace_setopt(dtp, "aggrate", "0") == -1) { pt_error("%s : failed to set C-state'aggrate'\n", __FILE__); } if (dtrace_setopt(dtp, "aggpercpu", 0) == -1) { pt_error("%s : failed to set C-state 'aggpercpu'\n", __FILE__); } if (dtrace_go(dtp) != 0) { pt_error("%s : failed to start C-state observation", __FILE__); return (dtrace_errno(dtp)); } if (dtrace_getopt(dtp, "statusrate", &statustime) == -1) { pt_error("%s : failed to get C-state 'statusrate'\n", __FILE__); return (dtrace_errno(dtp)); } return (0); } /* * The DTrace probes have been enabled, and are tracking CPU idle state * transitions. Take a snapshot of the aggregations, and invoke the aggregation * walker to process any records. The walker does most of the accounting work * chalking up time spent into the g_cstate_info structure. */ int pt_cpuidle_stat_collect(double interval) { int i; hrtime_t t = 0; /* * Zero out the interval time reported by DTrace for * this interval */ for (i = 0; i < NSTATES; i++) { g_cstate_info[i].total_time = 0; g_cstate_info[i].events = 0; } /* * Assume that all the time spent in this interval will * be the default "0" state. The DTrace walker will reallocate * time out of the default bucket as it processes aggregation * records for time spent in other states. */ g_cstate_info[0].total_time = (long)(interval * g_ncpus_observed * 1000); if (dtrace_status(dtp) == -1) return (-1); if (dtrace_aggregate_snap(dtp) != 0) pt_error("%s : failed to add to aggregation", __FILE__); if (dtrace_aggregate_walk_keyvarsorted(dtp, pt_cpuidle_dtrace_walk, NULL) != 0) pt_error("%s : failed to sort aggregation", __FILE__); dtrace_aggregate_clear(dtp); /* * Populate g_cstate_info with the correct amount of time spent * in each C state and update the number of C states in g_max_cstate */ g_total_c_time = 0; for (i = 0; i < NSTATES; i++) { if (g_cstate_info[i].total_time > 0) { g_total_c_time += g_cstate_info[i].total_time; if (i > g_max_cstate) g_max_cstate = i; if (g_cstate_info[i].last_time > t) { t = g_cstate_info[i].last_time; g_longest_cstate = i; } } } return (0); } /* * DTrace aggregation walker that sorts through a snapshot of data records * collected during firings of the idle-state-transition probe. * * XXX A way of querying the current idle state for a CPU is needed in addition * to logic similar to that in cpufreq.c */ /*ARGSUSED*/ static int pt_cpuidle_dtrace_walk(const dtrace_aggdata_t *data, void *arg) { dtrace_aggdesc_t *aggdesc = data->dtada_desc; dtrace_recdesc_t *rec; uint64_t n = 0; int32_t state; int i; rec = &aggdesc->dtagd_rec[1]; /* LINTED - alignment */ state = *(int32_t *)(data->dtada_data + rec->dtrd_offset); if (strcmp(aggdesc->dtagd_name, "number") == 0) { for (i = 0; i < g_ncpus; i++) { /* LINTED - alignment */ n += *((uint64_t *)(data->dtada_percpu[i])); } g_total_events += n; g_cstate_info[state].events += n; } else if (strcmp(aggdesc->dtagd_name, "times") == 0) { for (i = 0; i < g_ncpus; i++) { /* LINTED - alignment */ n += *((uint64_t *)(data->dtada_percpu[i])); } g_cstate_info[state].last_time = n; g_cstate_info[state].total_time += n; if (g_cstate_info[0].total_time >= n) g_cstate_info[0].total_time -= n; } return (DTRACE_AGGWALK_NEXT); }