xref: /titanic_44/usr/src/lib/libdisasm/common/dis_i386.c (revision f7184619589931c4b827180c213074c470f08a8f)
1*f7184619SJoshua M. Clulow /*
2*f7184619SJoshua M. Clulow  * CDDL HEADER START
3*f7184619SJoshua M. Clulow  *
4*f7184619SJoshua M. Clulow  * The contents of this file are subject to the terms of the
5*f7184619SJoshua M. Clulow  * Common Development and Distribution License (the "License").
6*f7184619SJoshua M. Clulow  * You may not use this file except in compliance with the License.
7*f7184619SJoshua M. Clulow  *
8*f7184619SJoshua M. Clulow  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9*f7184619SJoshua M. Clulow  * or http://www.opensolaris.org/os/licensing.
10*f7184619SJoshua M. Clulow  * See the License for the specific language governing permissions
11*f7184619SJoshua M. Clulow  * and limitations under the License.
12*f7184619SJoshua M. Clulow  *
13*f7184619SJoshua M. Clulow  * When distributing Covered Code, include this CDDL HEADER in each
14*f7184619SJoshua M. Clulow  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15*f7184619SJoshua M. Clulow  * If applicable, add the following below this CDDL HEADER, with the
16*f7184619SJoshua M. Clulow  * fields enclosed by brackets "[]" replaced with your own identifying
17*f7184619SJoshua M. Clulow  * information: Portions Copyright [yyyy] [name of copyright owner]
18*f7184619SJoshua M. Clulow  *
19*f7184619SJoshua M. Clulow  * CDDL HEADER END
20*f7184619SJoshua M. Clulow  */
21*f7184619SJoshua M. Clulow 
22*f7184619SJoshua M. Clulow /*
23*f7184619SJoshua M. Clulow  * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
24*f7184619SJoshua M. Clulow  * Use is subject to license terms.
25*f7184619SJoshua M. Clulow  * Copyright 2012 Joshua M. Clulow <josh@sysmgr.org>
26*f7184619SJoshua M. Clulow  * Copyright 2015 Nexenta Systems, Inc.  All rights reserved.
27*f7184619SJoshua M. Clulow  */
28*f7184619SJoshua M. Clulow 
29*f7184619SJoshua M. Clulow #include <libdisasm.h>
30*f7184619SJoshua M. Clulow 
31*f7184619SJoshua M. Clulow #include "dis_tables.h"
32*f7184619SJoshua M. Clulow #include "libdisasm_impl.h"
33*f7184619SJoshua M. Clulow 
34*f7184619SJoshua M. Clulow typedef struct dis_handle_i386 {
35*f7184619SJoshua M. Clulow 	int		dhx_mode;
36*f7184619SJoshua M. Clulow 	dis86_t		dhx_dis;
37*f7184619SJoshua M. Clulow 	uint64_t	dhx_end;
38*f7184619SJoshua M. Clulow } dis_handle_i386_t;
39*f7184619SJoshua M. Clulow 
40*f7184619SJoshua M. Clulow /*
41*f7184619SJoshua M. Clulow  * Returns true if we are near the end of a function.  This is a cheap hack at
42*f7184619SJoshua M. Clulow  * detecting NULL padding between functions.  If we're within a few bytes of the
43*f7184619SJoshua M. Clulow  * next function, or past the start, then return true.
44*f7184619SJoshua M. Clulow  */
45*f7184619SJoshua M. Clulow static int
check_func(void * data)46*f7184619SJoshua M. Clulow check_func(void *data)
47*f7184619SJoshua M. Clulow {
48*f7184619SJoshua M. Clulow 	dis_handle_t *dhp = data;
49*f7184619SJoshua M. Clulow 	uint64_t start;
50*f7184619SJoshua M. Clulow 	size_t len;
51*f7184619SJoshua M. Clulow 
52*f7184619SJoshua M. Clulow 	if (dhp->dh_lookup(dhp->dh_data, dhp->dh_addr, NULL, 0, &start, &len)
53*f7184619SJoshua M. Clulow 	    != 0)
54*f7184619SJoshua M. Clulow 		return (0);
55*f7184619SJoshua M. Clulow 
56*f7184619SJoshua M. Clulow 	if (start < dhp->dh_addr)
57*f7184619SJoshua M. Clulow 		return (dhp->dh_addr > start + len - 0x10);
58*f7184619SJoshua M. Clulow 
59*f7184619SJoshua M. Clulow 	return (1);
60*f7184619SJoshua M. Clulow }
61*f7184619SJoshua M. Clulow 
62*f7184619SJoshua M. Clulow static int
get_byte(void * data)63*f7184619SJoshua M. Clulow get_byte(void *data)
64*f7184619SJoshua M. Clulow {
65*f7184619SJoshua M. Clulow 	uchar_t byte;
66*f7184619SJoshua M. Clulow 	dis_handle_t *dhp = data;
67*f7184619SJoshua M. Clulow 
68*f7184619SJoshua M. Clulow 	if (dhp->dh_read(dhp->dh_data, dhp->dh_addr, &byte, sizeof (byte)) !=
69*f7184619SJoshua M. Clulow 	    sizeof (byte))
70*f7184619SJoshua M. Clulow 		return (-1);
71*f7184619SJoshua M. Clulow 
72*f7184619SJoshua M. Clulow 	dhp->dh_addr++;
73*f7184619SJoshua M. Clulow 
74*f7184619SJoshua M. Clulow 	return ((int)byte);
75*f7184619SJoshua M. Clulow }
76*f7184619SJoshua M. Clulow 
77*f7184619SJoshua M. Clulow static int
do_lookup(void * data,uint64_t addr,char * buf,size_t buflen)78*f7184619SJoshua M. Clulow do_lookup(void *data, uint64_t addr, char *buf, size_t buflen)
79*f7184619SJoshua M. Clulow {
80*f7184619SJoshua M. Clulow 	dis_handle_t *dhp = data;
81*f7184619SJoshua M. Clulow 
82*f7184619SJoshua M. Clulow 	return (dhp->dh_lookup(dhp->dh_data, addr, buf, buflen, NULL, NULL));
83*f7184619SJoshua M. Clulow }
84*f7184619SJoshua M. Clulow 
85*f7184619SJoshua M. Clulow static void
dis_i386_handle_detach(dis_handle_t * dhp)86*f7184619SJoshua M. Clulow dis_i386_handle_detach(dis_handle_t *dhp)
87*f7184619SJoshua M. Clulow {
88*f7184619SJoshua M. Clulow 	dis_free(dhp->dh_arch_private, sizeof (dis_handle_i386_t));
89*f7184619SJoshua M. Clulow 	dhp->dh_arch_private = NULL;
90*f7184619SJoshua M. Clulow }
91*f7184619SJoshua M. Clulow 
92*f7184619SJoshua M. Clulow static int
dis_i386_handle_attach(dis_handle_t * dhp)93*f7184619SJoshua M. Clulow dis_i386_handle_attach(dis_handle_t *dhp)
94*f7184619SJoshua M. Clulow {
95*f7184619SJoshua M. Clulow 	dis_handle_i386_t *dhx;
96*f7184619SJoshua M. Clulow 
97*f7184619SJoshua M. Clulow 	/*
98*f7184619SJoshua M. Clulow 	 * Validate architecture flags
99*f7184619SJoshua M. Clulow 	 */
100*f7184619SJoshua M. Clulow 	if (dhp->dh_flags & ~(DIS_X86_SIZE16 | DIS_X86_SIZE32 | DIS_X86_SIZE64 |
101*f7184619SJoshua M. Clulow 	    DIS_OCTAL | DIS_NOIMMSYM)) {
102*f7184619SJoshua M. Clulow 		(void) dis_seterrno(E_DIS_INVALFLAG);
103*f7184619SJoshua M. Clulow 		return (-1);
104*f7184619SJoshua M. Clulow 	}
105*f7184619SJoshua M. Clulow 
106*f7184619SJoshua M. Clulow 	/*
107*f7184619SJoshua M. Clulow 	 * Create and initialize the internal structure
108*f7184619SJoshua M. Clulow 	 */
109*f7184619SJoshua M. Clulow 	if ((dhx = dis_zalloc(sizeof (dis_handle_i386_t))) == NULL) {
110*f7184619SJoshua M. Clulow 		(void) dis_seterrno(E_DIS_NOMEM);
111*f7184619SJoshua M. Clulow 		return (-1);
112*f7184619SJoshua M. Clulow 	}
113*f7184619SJoshua M. Clulow 	dhp->dh_arch_private = dhx;
114*f7184619SJoshua M. Clulow 
115*f7184619SJoshua M. Clulow 	/*
116*f7184619SJoshua M. Clulow 	 * Initialize x86-specific architecture structure
117*f7184619SJoshua M. Clulow 	 */
118*f7184619SJoshua M. Clulow 	if (dhp->dh_flags & DIS_X86_SIZE16)
119*f7184619SJoshua M. Clulow 		dhx->dhx_mode = SIZE16;
120*f7184619SJoshua M. Clulow 	else if (dhp->dh_flags & DIS_X86_SIZE64)
121*f7184619SJoshua M. Clulow 		dhx->dhx_mode = SIZE64;
122*f7184619SJoshua M. Clulow 	else
123*f7184619SJoshua M. Clulow 		dhx->dhx_mode = SIZE32;
124*f7184619SJoshua M. Clulow 
125*f7184619SJoshua M. Clulow 	if (dhp->dh_flags & DIS_OCTAL)
126*f7184619SJoshua M. Clulow 		dhx->dhx_dis.d86_flags = DIS_F_OCTAL;
127*f7184619SJoshua M. Clulow 
128*f7184619SJoshua M. Clulow 	dhx->dhx_dis.d86_sprintf_func = dis_snprintf;
129*f7184619SJoshua M. Clulow 	dhx->dhx_dis.d86_get_byte = get_byte;
130*f7184619SJoshua M. Clulow 	dhx->dhx_dis.d86_sym_lookup = do_lookup;
131*f7184619SJoshua M. Clulow 	dhx->dhx_dis.d86_check_func = check_func;
132*f7184619SJoshua M. Clulow 
133*f7184619SJoshua M. Clulow 	dhx->dhx_dis.d86_data = dhp;
134*f7184619SJoshua M. Clulow 
135*f7184619SJoshua M. Clulow 	return (0);
136*f7184619SJoshua M. Clulow }
137*f7184619SJoshua M. Clulow 
138*f7184619SJoshua M. Clulow static int
dis_i386_disassemble(dis_handle_t * dhp,uint64_t addr,char * buf,size_t buflen)139*f7184619SJoshua M. Clulow dis_i386_disassemble(dis_handle_t *dhp, uint64_t addr, char *buf,
140*f7184619SJoshua M. Clulow     size_t buflen)
141*f7184619SJoshua M. Clulow {
142*f7184619SJoshua M. Clulow 	dis_handle_i386_t *dhx = dhp->dh_arch_private;
143*f7184619SJoshua M. Clulow 	dhp->dh_addr = addr;
144*f7184619SJoshua M. Clulow 
145*f7184619SJoshua M. Clulow 	/* DIS_NOIMMSYM might not be set until now, so update */
146*f7184619SJoshua M. Clulow 	if (dhp->dh_flags & DIS_NOIMMSYM)
147*f7184619SJoshua M. Clulow 		dhx->dhx_dis.d86_flags |= DIS_F_NOIMMSYM;
148*f7184619SJoshua M. Clulow 	else
149*f7184619SJoshua M. Clulow 		dhx->dhx_dis.d86_flags &= ~DIS_F_NOIMMSYM;
150*f7184619SJoshua M. Clulow 
151*f7184619SJoshua M. Clulow 	if (dtrace_disx86(&dhx->dhx_dis, dhx->dhx_mode) != 0)
152*f7184619SJoshua M. Clulow 		return (-1);
153*f7184619SJoshua M. Clulow 
154*f7184619SJoshua M. Clulow 	if (buf != NULL)
155*f7184619SJoshua M. Clulow 		dtrace_disx86_str(&dhx->dhx_dis, dhx->dhx_mode, addr, buf,
156*f7184619SJoshua M. Clulow 		    buflen);
157*f7184619SJoshua M. Clulow 
158*f7184619SJoshua M. Clulow 	return (0);
159*f7184619SJoshua M. Clulow }
160*f7184619SJoshua M. Clulow 
161*f7184619SJoshua M. Clulow /* ARGSUSED */
162*f7184619SJoshua M. Clulow static int
dis_i386_max_instrlen(dis_handle_t * dhp)163*f7184619SJoshua M. Clulow dis_i386_max_instrlen(dis_handle_t *dhp)
164*f7184619SJoshua M. Clulow {
165*f7184619SJoshua M. Clulow 	return (15);
166*f7184619SJoshua M. Clulow }
167*f7184619SJoshua M. Clulow 
168*f7184619SJoshua M. Clulow /* ARGSUSED */
169*f7184619SJoshua M. Clulow static int
dis_i386_min_instrlen(dis_handle_t * dhp)170*f7184619SJoshua M. Clulow dis_i386_min_instrlen(dis_handle_t *dhp)
171*f7184619SJoshua M. Clulow {
172*f7184619SJoshua M. Clulow 	return (1);
173*f7184619SJoshua M. Clulow }
174*f7184619SJoshua M. Clulow 
175*f7184619SJoshua M. Clulow /*
176*f7184619SJoshua M. Clulow  * Return the previous instruction.  On x86, we have no choice except to
177*f7184619SJoshua M. Clulow  * disassemble everything from the start of the symbol, and stop when we have
178*f7184619SJoshua M. Clulow  * reached our instruction address.  If we're not in the middle of a known
179*f7184619SJoshua M. Clulow  * symbol, then we return the same address to indicate failure.
180*f7184619SJoshua M. Clulow  */
181*f7184619SJoshua M. Clulow static uint64_t
dis_i386_previnstr(dis_handle_t * dhp,uint64_t pc,int n)182*f7184619SJoshua M. Clulow dis_i386_previnstr(dis_handle_t *dhp, uint64_t pc, int n)
183*f7184619SJoshua M. Clulow {
184*f7184619SJoshua M. Clulow 	uint64_t *hist, addr, start;
185*f7184619SJoshua M. Clulow 	int cur, nseen;
186*f7184619SJoshua M. Clulow 	uint64_t res = pc;
187*f7184619SJoshua M. Clulow 
188*f7184619SJoshua M. Clulow 	if (n <= 0)
189*f7184619SJoshua M. Clulow 		return (pc);
190*f7184619SJoshua M. Clulow 
191*f7184619SJoshua M. Clulow 	if (dhp->dh_lookup(dhp->dh_data, pc, NULL, 0, &start, NULL) != 0 ||
192*f7184619SJoshua M. Clulow 	    start == pc)
193*f7184619SJoshua M. Clulow 		return (res);
194*f7184619SJoshua M. Clulow 
195*f7184619SJoshua M. Clulow 	hist = dis_zalloc(sizeof (uint64_t) * n);
196*f7184619SJoshua M. Clulow 
197*f7184619SJoshua M. Clulow 	for (cur = 0, nseen = 0, addr = start; addr < pc; addr = dhp->dh_addr) {
198*f7184619SJoshua M. Clulow 		hist[cur] = addr;
199*f7184619SJoshua M. Clulow 		cur = (cur + 1) % n;
200*f7184619SJoshua M. Clulow 		nseen++;
201*f7184619SJoshua M. Clulow 
202*f7184619SJoshua M. Clulow 		/* if we cannot make forward progress, give up */
203*f7184619SJoshua M. Clulow 		if (dis_disassemble(dhp, addr, NULL, 0) != 0)
204*f7184619SJoshua M. Clulow 			goto done;
205*f7184619SJoshua M. Clulow 	}
206*f7184619SJoshua M. Clulow 
207*f7184619SJoshua M. Clulow 	if (addr != pc) {
208*f7184619SJoshua M. Clulow 		/*
209*f7184619SJoshua M. Clulow 		 * We scanned past %pc, but didn't find an instruction that
210*f7184619SJoshua M. Clulow 		 * started at %pc.  This means that either the caller specified
211*f7184619SJoshua M. Clulow 		 * an invalid address, or we ran into something other than code
212*f7184619SJoshua M. Clulow 		 * during our scan.  Virtually any combination of bytes can be
213*f7184619SJoshua M. Clulow 		 * construed as a valid Intel instruction, so any non-code bytes
214*f7184619SJoshua M. Clulow 		 * we encounter will have thrown off the scan.
215*f7184619SJoshua M. Clulow 		 */
216*f7184619SJoshua M. Clulow 		goto done;
217*f7184619SJoshua M. Clulow 	}
218*f7184619SJoshua M. Clulow 
219*f7184619SJoshua M. Clulow 	res = hist[(cur + n - MIN(n, nseen)) % n];
220*f7184619SJoshua M. Clulow 
221*f7184619SJoshua M. Clulow done:
222*f7184619SJoshua M. Clulow 	dis_free(hist, sizeof (uint64_t) * n);
223*f7184619SJoshua M. Clulow 	return (res);
224*f7184619SJoshua M. Clulow }
225*f7184619SJoshua M. Clulow 
226*f7184619SJoshua M. Clulow static int
dis_i386_supports_flags(int flags)227*f7184619SJoshua M. Clulow dis_i386_supports_flags(int flags)
228*f7184619SJoshua M. Clulow {
229*f7184619SJoshua M. Clulow 	int archflags = flags & DIS_ARCH_MASK;
230*f7184619SJoshua M. Clulow 
231*f7184619SJoshua M. Clulow 	if (archflags == DIS_X86_SIZE16 || archflags == DIS_X86_SIZE32 ||
232*f7184619SJoshua M. Clulow 	    archflags == DIS_X86_SIZE64)
233*f7184619SJoshua M. Clulow 		return (1);
234*f7184619SJoshua M. Clulow 
235*f7184619SJoshua M. Clulow 	return (0);
236*f7184619SJoshua M. Clulow }
237*f7184619SJoshua M. Clulow 
238*f7184619SJoshua M. Clulow static int
dis_i386_instrlen(dis_handle_t * dhp,uint64_t pc)239*f7184619SJoshua M. Clulow dis_i386_instrlen(dis_handle_t *dhp, uint64_t pc)
240*f7184619SJoshua M. Clulow {
241*f7184619SJoshua M. Clulow 	if (dis_disassemble(dhp, pc, NULL, 0) != 0)
242*f7184619SJoshua M. Clulow 		return (-1);
243*f7184619SJoshua M. Clulow 
244*f7184619SJoshua M. Clulow 	return (dhp->dh_addr - pc);
245*f7184619SJoshua M. Clulow }
246*f7184619SJoshua M. Clulow 
247*f7184619SJoshua M. Clulow dis_arch_t dis_arch_i386 = {
248*f7184619SJoshua M. Clulow 	dis_i386_supports_flags,
249*f7184619SJoshua M. Clulow 	dis_i386_handle_attach,
250*f7184619SJoshua M. Clulow 	dis_i386_handle_detach,
251*f7184619SJoshua M. Clulow 	dis_i386_disassemble,
252*f7184619SJoshua M. Clulow 	dis_i386_previnstr,
253*f7184619SJoshua M. Clulow 	dis_i386_min_instrlen,
254*f7184619SJoshua M. Clulow 	dis_i386_max_instrlen,
255*f7184619SJoshua M. Clulow 	dis_i386_instrlen,
256*f7184619SJoshua M. Clulow };
257