/*
 *  mon_x86.cpp - 80x86 disassembler
 *
 *  (C) 1998-1999 Christian Bauer
 */
6 |
|
7 |
#include <stdio.h> |
8 |
#include <string.h> |
9 |
|
10 |
#include "mon.h" |
11 |
#include "mon_x86.h" |
12 |
|
13 |
|
14 |
// Memory access functions
15 |
/*
 *  Fetch an unsigned 16-bit value stored low byte first at m,
 *  then advance m past the two bytes that were read
 */

static uint16 read_uint16(uint8 *&m)
{
	const int lo = m[0];
	const int hi = m[1];
	m += 2;
	return (uint16)((hi << 8) | lo);
}
21 |
|
22 |
/*
 *  Fetch a signed 16-bit value stored low byte first at m,
 *  then advance m past the two bytes that were read
 */

static int16 read_int16(uint8 *&m)
{
	const int lo = m[0];
	const int hi = m[1];
	m += 2;
	return (int16)((hi << 8) | lo);
}
28 |
|
29 |
/*
 *  Fetch an unsigned 32-bit value stored low byte first at m,
 *  then advance m past the four bytes that were read
 *
 *  Every byte is widened to uint32 before it is shifted. Shifting the
 *  promoted (signed) int instead would move a set top bit of m[3] into
 *  the sign bit, which is not a well-defined operation.
 */

static uint32 read_uint32(uint8 *&m)
{
	uint32 val = ((uint32)m[3] << 24)
	           | ((uint32)m[2] << 16)
	           | ((uint32)m[1] << 8)
	           |  (uint32)m[0];
	m += 4;
	return val;
}
35 |
|
36 |
|
37 |
// String constants
38 |
// General purpose register names, indexed as [operand size][register number]:
// row 0 holds the 16-bit names, row 1 the 32-bit names
static const char *gp_reg[2][8] = {
	{ "ax",  "cx",  "dx",  "bx",  "sp",  "bp",  "si",  "di"  },
	{ "eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi" }
};
42 |
|
43 |
|
44 |
// Prototypes
45 |
// Decoder for instructions whose primary opcode is 0x0f; called from disass_x86
static void disass0f(
	char *&mnem,
	char *s,
	uint8 *&m,
	bool &mode32
);
46 |
|
47 |
|
48 |
/* |
49 |
* Disassemble one instruction, return number of bytes |
50 |
*/ |
51 |
|
52 |
int disass_x86(FILE *f, uint32 adr, uint8 *m) |
53 |
{ |
54 |
uint8 *orig_m = m; |
55 |
char *mnem; |
56 |
char s[256] = ""; |
57 |
bool mode32 = true; |
58 |
int32 disp; |
59 |
|
60 |
// Decode primary opcode |
61 |
next_opcode: |
62 |
uint8 opcode = *m++; |
63 |
switch (opcode) { |
64 |
case 0x04: |
65 |
mnem = "add"; |
66 |
arith_alimm: |
67 |
sprintf(s, "al,$%02x", *m++); |
68 |
break; |
69 |
case 0x05: |
70 |
mnem = "add"; |
71 |
arith_aximm: |
72 |
if (mode32) |
73 |
sprintf(s, "eax,$%08lx", read_uint32(m)); |
74 |
else |
75 |
sprintf(s, "ax,$%04x", read_uint16(m)); |
76 |
break; |
77 |
|
78 |
case 0x06: mnem = "push\tes"; break; |
79 |
case 0x07: mnem = "pop\tes"; break; |
80 |
case 0x0c: mnem = "or"; goto arith_alimm; |
81 |
case 0x0d: mnem = "or"; goto arith_aximm; |
82 |
case 0x0e: mnem = "push\tcs"; break; |
83 |
case 0x0f: disass0f(mnem, s, m, mode32); break; |
84 |
case 0x14: mnem = "adc"; goto arith_alimm; |
85 |
case 0x15: mnem = "adc"; goto arith_aximm; |
86 |
case 0x16: mnem = "push\tss"; break; |
87 |
case 0x17: mnem = "pop\tss"; break; |
88 |
case 0x1c: mnem = "sbb"; goto arith_alimm; |
89 |
case 0x1d: mnem = "sbb"; goto arith_aximm; |
90 |
case 0x1e: mnem = "push\tds"; break; |
91 |
case 0x1f: mnem = "pop\tds"; break; |
92 |
case 0x24: mnem = "and"; goto arith_alimm; |
93 |
case 0x25: mnem = "and"; goto arith_aximm; |
94 |
case 0x26: mnem = "(seg es prefix)"; break; |
95 |
case 0x27: mnem = "daa"; break; |
96 |
case 0x2c: mnem = "sub"; goto arith_alimm; |
97 |
case 0x2d: mnem = "sub"; goto arith_aximm; |
98 |
case 0x2e: mnem = "(seg cs prefix)"; break; |
99 |
case 0x2f: mnem = "das"; break; |
100 |
case 0x34: mnem = "xor"; goto arith_alimm; |
101 |
case 0x35: mnem = "xor"; goto arith_aximm; |
102 |
case 0x36: mnem = "(seg ss prefix)"; break; |
103 |
case 0x37: mnem = "aaa"; break; |
104 |
case 0x3c: mnem = "cmp"; goto arith_alimm; |
105 |
case 0x3d: mnem = "cmp"; goto arith_aximm; |
106 |
case 0x3e: mnem = "(seg ds prefix)"; break; |
107 |
case 0x3f: mnem = "aas"; break; |
108 |
|
109 |
case 0x40: case 0x41: case 0x42: case 0x43: case 0x44: case 0x45: case 0x46: case 0x47: |
110 |
mnem = "inc"; sprintf(s, "%s", gp_reg[mode32][opcode & 7]); break; |
111 |
case 0x48: case 0x49: case 0x4a: case 0x4b: case 0x4c: case 0x4d: case 0x4e: case 0x4f: |
112 |
mnem = "dec"; sprintf(s, "%s", gp_reg[mode32][opcode & 7]); break; |
113 |
case 0x50: case 0x51: case 0x52: case 0x53: case 0x54: case 0x55: case 0x56: case 0x57: |
114 |
mnem = "push"; sprintf(s, "%s", gp_reg[mode32][opcode & 7]); break; |
115 |
case 0x58: case 0x59: case 0x5a: case 0x5b: case 0x5c: case 0x5d: case 0x5e: case 0x5f: |
116 |
mnem = "pop"; sprintf(s, "%s", gp_reg[mode32][opcode & 7]); break; |
117 |
|
118 |
case 0x60: mnem = mode32 ? "pushad" : "pusha"; break; |
119 |
case 0x61: mnem = mode32 ? "popad" : "popa"; break; |
120 |
case 0x64: mnem = "(seg fs prefix)"; break; |
121 |
case 0x65: mnem = "(seg gs prefix)"; break; |
122 |
case 0x66: mode32 = !mode32; goto next_opcode; //!! error checking |
123 |
case 0x67: mnem = "(adr size prefix)"; break; |
124 |
|
125 |
case 0x70: |
126 |
mnem = "jo"; |
127 |
jcc_bdisp: |
128 |
disp = (int8)*m++; |
129 |
sprintf(s, "$%08lx", disp + adr + (m - orig_m)); |
130 |
break; |
131 |
case 0x71: mnem = "jno"; goto jcc_bdisp; |
132 |
case 0x72: mnem = "jc"; goto jcc_bdisp; |
133 |
case 0x73: mnem = "jnc"; goto jcc_bdisp; |
134 |
case 0x74: mnem = "je"; goto jcc_bdisp; |
135 |
case 0x75: mnem = "jne"; goto jcc_bdisp; |
136 |
case 0x76: mnem = "jbe"; goto jcc_bdisp; |
137 |
case 0x77: mnem = "jnbe"; goto jcc_bdisp; |
138 |
case 0x78: mnem = "js"; goto jcc_bdisp; |
139 |
case 0x79: mnem = "jns"; goto jcc_bdisp; |
140 |
case 0x7a: mnem = "jpe"; goto jcc_bdisp; |
141 |
case 0x7b: mnem = "jpo"; goto jcc_bdisp; |
142 |
case 0x7c: mnem = "jl"; goto jcc_bdisp; |
143 |
case 0x7d: mnem = "jge"; goto jcc_bdisp; |
144 |
case 0x7e: mnem = "jle"; goto jcc_bdisp; |
145 |
case 0x7f: mnem = "jg"; goto jcc_bdisp; |
146 |
|
147 |
case 0x90: mnem = "nop"; break; |
148 |
case 0x91: case 0x92: case 0x93: case 0x94: case 0x95: case 0x96: case 0x97: |
149 |
mnem = "xchg"; sprintf(s, "%s,%s", mode32 ? "eax" : "ax", gp_reg[mode32][opcode & 7]); break; |
150 |
|
151 |
case 0x98: mnem = mode32 ? "cwde" : "cbw"; break; |
152 |
case 0x99: mnem = mode32 ? "cdq" : "cwd"; break; |
153 |
case 0x9b: mnem = "wait"; break; |
154 |
case 0x9c: mnem = mode32 ? "pushfd" : "pushf"; break; |
155 |
case 0x9d: mnem = mode32 ? "popfd" : "popf"; break; |
156 |
case 0x9e: mnem = "sahf"; break; |
157 |
case 0x9f: mnem = "lahf"; break; |
158 |
case 0xa0: mnem = "mov"; sprintf(s, "al,byte ptr $%08lx", read_uint32(m)); break; |
159 |
case 0xa1: mnem = "mov"; sprintf(s, mode32 ? "eax,dword ptr $%08lx" : "ax,word ptr $%08x", read_uint32(m)); break; |
160 |
case 0xa2: mnem = "mov"; sprintf(s, "byte ptr $%08lx,al", read_uint32(m)); break; |
161 |
case 0xa3: mnem = "mov"; sprintf(s, mode32 ? "dword ptr $%08lx,eax" : "word ptr $%08x,ax", read_uint32(m)); break; |
162 |
case 0xa4: mnem = "movsb"; break; |
163 |
case 0xa5: mnem = mode32 ? "movsd" : "movsw"; break; |
164 |
case 0xa6: mnem = "cmpsb"; break; |
165 |
case 0xa7: mnem = mode32 ? "cmpsd" : "cmpsw"; break; |
166 |
case 0xa8: mnem = "test"; goto arith_alimm; |
167 |
case 0xa9: mnem = "test"; goto arith_aximm; |
168 |
case 0xaa: mnem = "stosb"; break; |
169 |
case 0xab: mnem = mode32 ? "stosd" : "stosw"; break; |
170 |
case 0xac: mnem = "lodsb"; break; |
171 |
case 0xad: mnem = mode32 ? "lodsd" : "lodsw"; break; |
172 |
case 0xae: mnem = "scasb"; break; |
173 |
case 0xaf: mnem = mode32 ? "scasd" : "scasw"; break; |
174 |
case 0xb0: mnem = "mov"; sprintf(s, "al,$%02x", *m++); break; |
175 |
case 0xb1: mnem = "mov"; sprintf(s, "cl,$%02x", *m++); break; |
176 |
case 0xb2: mnem = "mov"; sprintf(s, "dl,$%02x", *m++); break; |
177 |
case 0xb3: mnem = "mov"; sprintf(s, "bl,$%02x", *m++); break; |
178 |
case 0xb4: mnem = "mov"; sprintf(s, "ah,$%02x", *m++); break; |
179 |
case 0xb5: mnem = "mov"; sprintf(s, "ch,$%02x", *m++); break; |
180 |
case 0xb6: mnem = "mov"; sprintf(s, "dh,$%02x", *m++); break; |
181 |
case 0xb7: mnem = "mov"; sprintf(s, "bh,$%02x", *m++); break; |
182 |
|
183 |
case 0xb8: case 0xb9: case 0xba: case 0xbb: case 0xbc: case 0xbd: case 0xbe: case 0xbf: |
184 |
mnem = "mov"; |
185 |
if (mode32) |
186 |
sprintf(s, "%s,$%08lx", gp_reg[true][opcode & 7], read_uint32(m)); |
187 |
else |
188 |
sprintf(s, "%s,$%04x", gp_reg[false][opcode & 7], read_uint16(m)); |
189 |
break; |
190 |
|
191 |
case 0xc2: mnem = "ret"; sprintf(s, "near $%04x", read_uint16(m)); break; |
192 |
case 0xc3: mnem = "ret\tnear"; break; |
193 |
case 0xc9: mnem = "leave"; break; |
194 |
case 0xca: mnem = "ret"; sprintf(s, "far $%04x", read_uint16(m)); break; |
195 |
case 0xcb: mnem = "ret\tfar"; break; |
196 |
case 0xcc: mnem = "int3"; break; |
197 |
case 0xcd: mnem = "int"; sprintf(s, "$%02x", *m++); break; |
198 |
case 0xce: mnem = "into"; break; |
199 |
case 0xcf: mnem = "iret"; break; |
200 |
case 0xd4: mnem = "aam"; m++; break; |
201 |
case 0xd5: mnem = "aad"; m++; break; |
202 |
case 0xd7: mnem = "xlat"; break; |
203 |
case 0xe0: mnem = "loopnz"; goto jcc_bdisp; |
204 |
case 0xe1: mnem = "loopz"; goto jcc_bdisp; |
205 |
case 0xe2: mnem = "loop"; goto jcc_bdisp; |
206 |
case 0xe3: mnem = mode32 ? "jecxz" : "jcxz"; goto jcc_bdisp; |
207 |
case 0xe4: mnem = "in"; sprintf(s, "al,$%02x", *m++); break; |
208 |
case 0xe5: mnem = "in"; sprintf(s, "%s,$%02x", mode32 ? "eax" : "ax", *m++); break; |
209 |
case 0xe6: mnem = "out"; sprintf(s, "$%02x,al", *m++); break; |
210 |
case 0xe7: mnem = "out"; sprintf(s, "$%02x,%s", *m++, mode32 ? "eax" : "ax"); break; |
211 |
|
212 |
case 0xe8: |
213 |
mnem = "call"; |
214 |
jump_near: |
215 |
disp = read_uint32(m); |
216 |
sprintf(s, "near $%08lx", disp + adr + (m - orig_m)); |
217 |
break; |
218 |
case 0xe9: mnem = "jmp"; goto jump_near; |
219 |
case 0xeb: |
220 |
mnem = "jmp"; |
221 |
disp = (int8)*m++; |
222 |
sprintf(s, "near $%08lx", disp + adr + (m - orig_m)); |
223 |
break; |
224 |
|
225 |
case 0xec: mnem = "in\tal,dx"; break; |
226 |
case 0xed: mnem = mode32 ? "in\teax,dx" : "in\tax,dx"; break; |
227 |
case 0xee: mnem = "out\tdx,al"; break; |
228 |
case 0xef: mnem = mode32 ? "out\tdx,eax" : "out\tdx,ax"; break; |
229 |
case 0xf0: mnem = "lock"; break; |
230 |
case 0xf2: mnem = "repne"; break; |
231 |
case 0xf3: mnem = "rep"; break; |
232 |
case 0xf4: mnem = "hlt"; break; |
233 |
case 0xf5: mnem = "cmc"; break; |
234 |
case 0xf8: mnem = "clc"; break; |
235 |
case 0xf9: mnem = "stc"; break; |
236 |
case 0xfa: mnem = "cli"; break; |
237 |
case 0xfb: mnem = "sti"; break; |
238 |
case 0xfc: mnem = "cld"; break; |
239 |
case 0xfd: mnem = "std"; break; |
240 |
|
241 |
default: |
242 |
mnem = "?"; |
243 |
break; |
244 |
} |
245 |
|
246 |
// Print opcodes and mnemonics |
247 |
int size = m - orig_m; |
248 |
for (int i=0; i<7; i++) |
249 |
if (i < size) |
250 |
fprintf(f, "%02x ", orig_m[i]); |
251 |
else |
252 |
fprintf(f, " "); |
253 |
fprintf(f, "%s\t%s\n", mnem, s); |
254 |
return size; |
255 |
} |
256 |
|
257 |
|
258 |
/* |
259 |
* Disassemble instruction with primary opcode 0x0f |
260 |
*/ |
261 |
|
262 |
static void disass0f(char *&mnem, char *s, uint8 *&m, bool &mode32) |
263 |
{ |
264 |
// Decode secondary opcode |
265 |
uint8 opcode = *m++; |
266 |
switch (opcode) { |
267 |
case 0x06: mnem = "clts"; break; |
268 |
case 0x08: mnem = "invd"; break; |
269 |
case 0x09: mnem = "wbinvd"; break; |
270 |
case 0x0b: mnem = "ud2"; break; |
271 |
case 0x30: mnem = "wrmsr"; break; |
272 |
case 0x31: mnem = "rdtsc"; break; |
273 |
case 0x32: mnem = "rdmsr"; break; |
274 |
case 0x33: mnem = "rdpmc"; break; |
275 |
case 0xa0: mnem = "push\tfs"; break; |
276 |
case 0xa1: mnem = "pop\tfs"; break; |
277 |
case 0xa2: mnem = "cpuid"; break; |
278 |
case 0xa8: mnem = "push\tgs"; break; |
279 |
case 0xa9: mnem = "pop\tgs"; break; |
280 |
case 0xaa: mnem = "rsm"; break; |
281 |
|
282 |
case 0xc8: case 0xc9: case 0xca: case 0xcb: case 0xcc: case 0xcd: case 0xce: case 0xcf: |
283 |
mnem = "bswap"; sprintf(s, "%s", gp_reg[true][opcode & 7]); break; |
284 |
|
285 |
default: |
286 |
mnem = "?"; |
287 |
break; |
288 |
} |
289 |
} |