xref: /titanic_51/usr/src/cmd/powertop/common/cpuidle.c (revision 2d83778a2c10c425b98c41d254f85f0e384d4dac)
1b47b5b34SRafael Vanoni /*
2b47b5b34SRafael Vanoni  * Copyright 2009, Intel Corporation
3b47b5b34SRafael Vanoni  * Copyright 2009, Sun Microsystems, Inc
4b47b5b34SRafael Vanoni  *
5b47b5b34SRafael Vanoni  * This file is part of PowerTOP
6b47b5b34SRafael Vanoni  *
7b47b5b34SRafael Vanoni  * This program file is free software; you can redistribute it and/or modify it
8b47b5b34SRafael Vanoni  * under the terms of the GNU General Public License as published by the
9b47b5b34SRafael Vanoni  * Free Software Foundation; version 2 of the License.
10b47b5b34SRafael Vanoni  *
11b47b5b34SRafael Vanoni  * This program is distributed in the hope that it will be useful, but WITHOUT
12b47b5b34SRafael Vanoni  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13b47b5b34SRafael Vanoni  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
14b47b5b34SRafael Vanoni  * for more details.
15b47b5b34SRafael Vanoni  *
16b47b5b34SRafael Vanoni  * You should have received a copy of the GNU General Public License
17b47b5b34SRafael Vanoni  * along with this program in a file named COPYING; if not, write to the
18b47b5b34SRafael Vanoni  * Free Software Foundation, Inc.,
19b47b5b34SRafael Vanoni  * 51 Franklin Street, Fifth Floor,
20b47b5b34SRafael Vanoni  * Boston, MA 02110-1301 USA
21b47b5b34SRafael Vanoni  *
22b47b5b34SRafael Vanoni  * Authors:
23b47b5b34SRafael Vanoni  *	Arjan van de Ven <arjan@linux.intel.com>
24b47b5b34SRafael Vanoni  *	Eric C Saxe <eric.saxe@sun.com>
25b47b5b34SRafael Vanoni  *	Aubrey Li <aubrey.li@intel.com>
26b47b5b34SRafael Vanoni  */
27b47b5b34SRafael Vanoni 
28b47b5b34SRafael Vanoni /*
29b47b5b34SRafael Vanoni  * GPL Disclaimer
30b47b5b34SRafael Vanoni  *
31b47b5b34SRafael Vanoni  * For the avoidance of doubt, except that if any license choice other
32b47b5b34SRafael Vanoni  * than GPL or LGPL is available it will apply instead, Sun elects to
33b47b5b34SRafael Vanoni  * use only the General Public License version 2 (GPLv2) at this time
34b47b5b34SRafael Vanoni  * for any software where a choice of GPL license versions is made
35b47b5b34SRafael Vanoni  * available with the language indicating that GPLv2 or any later
36b47b5b34SRafael Vanoni  * version may be used, or where a choice of which version of the GPL
37b47b5b34SRafael Vanoni  * is applied is otherwise unspecified.
38b47b5b34SRafael Vanoni  */
39b47b5b34SRafael Vanoni 
40b47b5b34SRafael Vanoni #include <string.h>
41b47b5b34SRafael Vanoni #include <dtrace.h>
42b47b5b34SRafael Vanoni #include "powertop.h"
43b47b5b34SRafael Vanoni 
44636423dbSRafael Vanoni #define	S2NS(x)		((x) * (NANOSEC))
45636423dbSRafael Vanoni 
46b47b5b34SRafael Vanoni static dtrace_hdl_t 	*dtp;
47b47b5b34SRafael Vanoni 
48b47b5b34SRafael Vanoni /*
49b47b5b34SRafael Vanoni  * Buffer containing DTrace program to track CPU idle state transitions
50b47b5b34SRafael Vanoni  */
51b47b5b34SRafael Vanoni static const char *dtp_cpuidle =
52b47b5b34SRafael Vanoni ":::idle-state-transition"
53b47b5b34SRafael Vanoni "/arg0 != 0/"
54b47b5b34SRafael Vanoni "{"
55b47b5b34SRafael Vanoni "	self->start = timestamp;"
56b47b5b34SRafael Vanoni "	self->state = arg0;"
57b47b5b34SRafael Vanoni "}"
58b47b5b34SRafael Vanoni ""
59b47b5b34SRafael Vanoni ":::idle-state-transition"
60b47b5b34SRafael Vanoni "/arg0 == 0 && self->start/"
61b47b5b34SRafael Vanoni "{"
62b47b5b34SRafael Vanoni "	@number[self->state] = count();"
63636423dbSRafael Vanoni "	@times[self->state] = sum(timestamp - self->start);"
64b47b5b34SRafael Vanoni "	self->start = 0;"
65b47b5b34SRafael Vanoni "	self->state = 0;"
66b47b5b34SRafael Vanoni "}";
67b47b5b34SRafael Vanoni 
68b47b5b34SRafael Vanoni /*
69b47b5b34SRafael Vanoni  * Same as above but only for a specific CPU
70b47b5b34SRafael Vanoni  */
71b47b5b34SRafael Vanoni static const char *dtp_cpuidle_c =
72b47b5b34SRafael Vanoni ":::idle-state-transition"
73b47b5b34SRafael Vanoni "/cpu == $0 &&"
74b47b5b34SRafael Vanoni " arg0 != 0/"
75b47b5b34SRafael Vanoni "{"
76b47b5b34SRafael Vanoni "	self->start = timestamp;"
77b47b5b34SRafael Vanoni "	self->state = arg0;"
78b47b5b34SRafael Vanoni "}"
79b47b5b34SRafael Vanoni ""
80b47b5b34SRafael Vanoni ":::idle-state-transition"
81b47b5b34SRafael Vanoni "/cpu == $0 &&"
82b47b5b34SRafael Vanoni " arg0 == 0 && self->start/"
83b47b5b34SRafael Vanoni "{"
84b47b5b34SRafael Vanoni "	@number[self->state] = count();"
85636423dbSRafael Vanoni "	@times[self->state] = sum(timestamp - self->start);"
86b47b5b34SRafael Vanoni "	self->start = 0;"
87b47b5b34SRafael Vanoni "	self->state = 0;"
88b47b5b34SRafael Vanoni "}";
89b47b5b34SRafael Vanoni 
90b47b5b34SRafael Vanoni static int 	pt_cpuidle_dtrace_walk(const dtrace_aggdata_t *, void *);
91b47b5b34SRafael Vanoni 
92b47b5b34SRafael Vanoni /*
93b47b5b34SRafael Vanoni  * Perform setup necessary to track CPU idle state transitions
94b47b5b34SRafael Vanoni  */
95b47b5b34SRafael Vanoni int
96b47b5b34SRafael Vanoni pt_cpuidle_stat_prepare(void)
97b47b5b34SRafael Vanoni {
98b47b5b34SRafael Vanoni 	dtrace_prog_t 		*prog;
99b47b5b34SRafael Vanoni 	dtrace_proginfo_t 	info;
100b47b5b34SRafael Vanoni 	dtrace_optval_t 	statustime;
101b47b5b34SRafael Vanoni 	int 			err;
102b47b5b34SRafael Vanoni 	char			*prog_ptr;
103b47b5b34SRafael Vanoni 
104b47b5b34SRafael Vanoni 	if ((dtp = dtrace_open(DTRACE_VERSION, 0, &err)) == NULL) {
105*2d83778aSRafael Vanoni 		pt_error("cannot open dtrace library for the %s report: %s\n",
106*2d83778aSRafael Vanoni 		    g_msg_idle_state, dtrace_errmsg(NULL, err));
107b47b5b34SRafael Vanoni 		return (-1);
108b47b5b34SRafael Vanoni 	}
109b47b5b34SRafael Vanoni 
110b47b5b34SRafael Vanoni 	/*
111b47b5b34SRafael Vanoni 	 * Execute different scripts (defined above) depending on
112b47b5b34SRafael Vanoni 	 * user specified options.
113b47b5b34SRafael Vanoni 	 */
114636423dbSRafael Vanoni 	if (PT_ON_CPU)
115b47b5b34SRafael Vanoni 		prog_ptr = (char *)dtp_cpuidle_c;
116b47b5b34SRafael Vanoni 	else
117b47b5b34SRafael Vanoni 		prog_ptr = (char *)dtp_cpuidle;
118b47b5b34SRafael Vanoni 
119b47b5b34SRafael Vanoni 	if ((prog = dtrace_program_strcompile(dtp, prog_ptr,
120b47b5b34SRafael Vanoni 	    DTRACE_PROBESPEC_NAME, 0, g_argc, g_argv)) == NULL) {
121*2d83778aSRafael Vanoni 		pt_error("failed to compile %s program\n", g_msg_idle_state);
122b47b5b34SRafael Vanoni 		return (dtrace_errno(dtp));
123b47b5b34SRafael Vanoni 	}
124b47b5b34SRafael Vanoni 
125b47b5b34SRafael Vanoni 	if (dtrace_program_exec(dtp, prog, &info) == -1) {
126*2d83778aSRafael Vanoni 		pt_error("failed to enable %s probes\n", g_msg_idle_state);
127b47b5b34SRafael Vanoni 		return (dtrace_errno(dtp));
128b47b5b34SRafael Vanoni 	}
129b47b5b34SRafael Vanoni 
130*2d83778aSRafael Vanoni 	if (dtrace_setopt(dtp, "aggsize", "128k") == -1)
131*2d83778aSRafael Vanoni 		pt_error("failed to set %s 'aggsize'\n", g_msg_idle_state);
132b47b5b34SRafael Vanoni 
133*2d83778aSRafael Vanoni 	if (dtrace_setopt(dtp, "aggrate", "0") == -1)
134*2d83778aSRafael Vanoni 		pt_error("failed to set %s 'aggrate'\n", g_msg_idle_state);
135b47b5b34SRafael Vanoni 
136*2d83778aSRafael Vanoni 	if (dtrace_setopt(dtp, "aggpercpu", 0) == -1)
137*2d83778aSRafael Vanoni 		pt_error("failed to set %s 'aggpercpu'\n", g_msg_idle_state);
138b47b5b34SRafael Vanoni 
139b47b5b34SRafael Vanoni 	if (dtrace_go(dtp) != 0) {
140*2d83778aSRafael Vanoni 		pt_error("failed to start %s observation\n", g_msg_idle_state);
141b47b5b34SRafael Vanoni 		return (dtrace_errno(dtp));
142b47b5b34SRafael Vanoni 	}
143b47b5b34SRafael Vanoni 
144b47b5b34SRafael Vanoni 	if (dtrace_getopt(dtp, "statusrate", &statustime) == -1) {
145*2d83778aSRafael Vanoni 		pt_error("failed to get %s 'statusrate'\n", g_msg_idle_state);
146b47b5b34SRafael Vanoni 		return (dtrace_errno(dtp));
147b47b5b34SRafael Vanoni 	}
148b47b5b34SRafael Vanoni 
149b47b5b34SRafael Vanoni 	return (0);
150b47b5b34SRafael Vanoni }
151b47b5b34SRafael Vanoni 
152b47b5b34SRafael Vanoni /*
153b47b5b34SRafael Vanoni  * The DTrace probes have been enabled, and are tracking CPU idle state
154b47b5b34SRafael Vanoni  * transitions. Take a snapshot of the aggregations, and invoke the aggregation
155b47b5b34SRafael Vanoni  * walker to process any records. The walker does most of the accounting work
156b47b5b34SRafael Vanoni  * chalking up time spent into the g_cstate_info structure.
157b47b5b34SRafael Vanoni  */
158b47b5b34SRafael Vanoni int
159b47b5b34SRafael Vanoni pt_cpuidle_stat_collect(double interval)
160b47b5b34SRafael Vanoni {
161b47b5b34SRafael Vanoni 	int i;
162b47b5b34SRafael Vanoni 	hrtime_t t = 0;
163b47b5b34SRafael Vanoni 
164b47b5b34SRafael Vanoni 	/*
165b47b5b34SRafael Vanoni 	 * Assume that all the time spent in this interval will
166b47b5b34SRafael Vanoni 	 * be the default "0" state. The DTrace walker will reallocate
167b47b5b34SRafael Vanoni 	 * time out of the default bucket as it processes aggregation
168b47b5b34SRafael Vanoni 	 * records for time spent in other states.
169b47b5b34SRafael Vanoni 	 */
170636423dbSRafael Vanoni 	g_cstate_info[0].total_time = (uint64_t)S2NS(interval *
171636423dbSRafael Vanoni 	    g_ncpus_observed);
172b47b5b34SRafael Vanoni 
173b47b5b34SRafael Vanoni 	if (dtrace_status(dtp) == -1)
174b47b5b34SRafael Vanoni 		return (-1);
175b47b5b34SRafael Vanoni 
176b47b5b34SRafael Vanoni 	if (dtrace_aggregate_snap(dtp) != 0)
177*2d83778aSRafael Vanoni 		pt_error("failed to collect data for %s\n", g_msg_idle_state);
178b47b5b34SRafael Vanoni 
179b47b5b34SRafael Vanoni 	if (dtrace_aggregate_walk_keyvarsorted(dtp, pt_cpuidle_dtrace_walk,
180b47b5b34SRafael Vanoni 	    NULL) != 0)
181*2d83778aSRafael Vanoni 		pt_error("failed to sort %s data\n", g_msg_idle_state);
182b47b5b34SRafael Vanoni 
183b47b5b34SRafael Vanoni 	dtrace_aggregate_clear(dtp);
184b47b5b34SRafael Vanoni 
185b47b5b34SRafael Vanoni 	/*
186b47b5b34SRafael Vanoni 	 * Populate g_cstate_info with the correct amount of time spent
187b47b5b34SRafael Vanoni 	 * in each C state and update the number of C states in g_max_cstate
188b47b5b34SRafael Vanoni 	 */
189b47b5b34SRafael Vanoni 	g_total_c_time = 0;
190b47b5b34SRafael Vanoni 	for (i = 0; i < NSTATES; i++) {
191b47b5b34SRafael Vanoni 		if (g_cstate_info[i].total_time > 0) {
192b47b5b34SRafael Vanoni 			g_total_c_time += g_cstate_info[i].total_time;
193b47b5b34SRafael Vanoni 			if (i > g_max_cstate)
194b47b5b34SRafael Vanoni 				g_max_cstate = i;
195b47b5b34SRafael Vanoni 			if (g_cstate_info[i].last_time > t) {
196b47b5b34SRafael Vanoni 				t = g_cstate_info[i].last_time;
197b47b5b34SRafael Vanoni 				g_longest_cstate = i;
198b47b5b34SRafael Vanoni 			}
199b47b5b34SRafael Vanoni 		}
200b47b5b34SRafael Vanoni 	}
201b47b5b34SRafael Vanoni 
202b47b5b34SRafael Vanoni 	return (0);
203b47b5b34SRafael Vanoni }
204b47b5b34SRafael Vanoni 
205b47b5b34SRafael Vanoni /*
206b47b5b34SRafael Vanoni  * DTrace aggregation walker that sorts through a snapshot of data records
207b47b5b34SRafael Vanoni  * collected during firings of the idle-state-transition probe.
208b47b5b34SRafael Vanoni  *
209b47b5b34SRafael Vanoni  * XXX A way of querying the current idle state for a CPU is needed in addition
210b47b5b34SRafael Vanoni  *     to logic similar to that in cpufreq.c
211b47b5b34SRafael Vanoni  */
212b47b5b34SRafael Vanoni /*ARGSUSED*/
213b47b5b34SRafael Vanoni static int
214b47b5b34SRafael Vanoni pt_cpuidle_dtrace_walk(const dtrace_aggdata_t *data, void *arg)
215b47b5b34SRafael Vanoni {
216b47b5b34SRafael Vanoni 	dtrace_aggdesc_t 	*aggdesc = data->dtada_desc;
217b47b5b34SRafael Vanoni 	dtrace_recdesc_t 	*rec;
218*2d83778aSRafael Vanoni 	uint64_t 		n = 0, state;
219b47b5b34SRafael Vanoni 	int 			i;
220b47b5b34SRafael Vanoni 
221b47b5b34SRafael Vanoni 	rec = &aggdesc->dtagd_rec[1];
222*2d83778aSRafael Vanoni 
223*2d83778aSRafael Vanoni 	switch (g_bit_depth) {
224*2d83778aSRafael Vanoni 		case 32:
225b47b5b34SRafael Vanoni 			/* LINTED - alignment */
226*2d83778aSRafael Vanoni 			state = *(uint32_t *)(data->dtada_data +
227*2d83778aSRafael Vanoni 			    rec->dtrd_offset);
228*2d83778aSRafael Vanoni 			break;
229*2d83778aSRafael Vanoni 		case 64:
230*2d83778aSRafael Vanoni 			/* LINTED - alignment */
231*2d83778aSRafael Vanoni 			state = *(uint64_t *)(data->dtada_data +
232*2d83778aSRafael Vanoni 			    rec->dtrd_offset);
233*2d83778aSRafael Vanoni 			break;
234*2d83778aSRafael Vanoni 	}
235b47b5b34SRafael Vanoni 
236b47b5b34SRafael Vanoni 	if (strcmp(aggdesc->dtagd_name, "number") == 0) {
237b47b5b34SRafael Vanoni 		for (i = 0; i < g_ncpus; i++) {
238b47b5b34SRafael Vanoni 			/* LINTED - alignment */
239b47b5b34SRafael Vanoni 			n += *((uint64_t *)(data->dtada_percpu[i]));
240b47b5b34SRafael Vanoni 		}
241b47b5b34SRafael Vanoni 		g_total_events += n;
242b47b5b34SRafael Vanoni 		g_cstate_info[state].events += n;
243b47b5b34SRafael Vanoni 	}
244b47b5b34SRafael Vanoni 	else
245b47b5b34SRafael Vanoni 		if (strcmp(aggdesc->dtagd_name, "times") == 0) {
246b47b5b34SRafael Vanoni 			for (i = 0; i < g_ncpus; i++) {
247b47b5b34SRafael Vanoni 				/* LINTED - alignment */
248b47b5b34SRafael Vanoni 				n += *((uint64_t *)(data->dtada_percpu[i]));
249b47b5b34SRafael Vanoni 			}
250b47b5b34SRafael Vanoni 			g_cstate_info[state].last_time = n;
251b47b5b34SRafael Vanoni 			g_cstate_info[state].total_time += n;
252b47b5b34SRafael Vanoni 			if (g_cstate_info[0].total_time >= n)
253b47b5b34SRafael Vanoni 				g_cstate_info[0].total_time -= n;
254636423dbSRafael Vanoni 			else
255636423dbSRafael Vanoni 				g_cstate_info[0].total_time = 0;
256b47b5b34SRafael Vanoni 		}
257b47b5b34SRafael Vanoni 
258b47b5b34SRafael Vanoni 	return (DTRACE_AGGWALK_NEXT);
259b47b5b34SRafael Vanoni }
260