blob: 724d0bf6832658b24e9531907cd53c21d5ed9c73 [file] [log] [blame]
H. Peter Anvinea6e34d2002-04-30 20:51:32 +00001/* disasm.c where all the _work_ gets done in the Netwide Disassembler
2 *
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the licence given in the file "Licence"
6 * distributed in the NASM archive.
7 *
8 * initial version 27/iii/95 by Simon Tatham
9 */
10
11#include <stdio.h>
12#include <string.h>
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +000013#include <limits.h>
Keith Kaniosb7a89542007-04-12 02:40:54 +000014#include <inttypes.h>
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000015
16#include "nasm.h"
17#include "disasm.h"
18#include "sync.h"
19#include "insns.h"
20
21#include "names.c"
22
/*
 * Bit flags stored in the `segment' field of the operands of an
 * `insn' structure while an instruction is being disassembled.
 */
#define SEG_RELATIVE 0x001      /* offset is relative (jump/call target, RIP-relative EA) */
#define SEG_32BIT    0x002      /* initial value when disassembling 32-bit code */
#define SEG_RMREG    0x004      /* operand is a register; basereg holds its number */
#define SEG_DISP8    0x008      /* effective address carries an 8-bit displacement */
#define SEG_DISP16   0x010      /* effective address carries a 16-bit displacement */
#define SEG_DISP32   0x020      /* effective address carries a 32-bit displacement */
#define SEG_NODISP   0x040      /* effective address has no displacement */
#define SEG_SIGNED   0x080      /* offset was read as a signed byte immediate */
#define SEG_64BIT    0x100      /* initial value when disassembling 64-bit code */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000036
H. Peter Anvin232badb2002-06-06 02:41:20 +000037#include "regdis.c"
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000038
/*
 * Summary of the prefix bytes found in front of an instruction.
 *
 * The two size fields hold a width in bits; every other field holds
 * the raw prefix byte that was seen, or 0 when that kind of prefix
 * was absent.
 */
struct prefix_info {
    /* Effective sizes, in bits, after applying any size overrides */
    uint8_t osize;              /* operand size */
    uint8_t asize;              /* address size */

    /* Raw prefix bytes (0 = not present) */
    uint8_t osp;                /* operand size override prefix */
    uint8_t asp;                /* address size override prefix */
    uint8_t rep;                /* REP/REPNE prefix */
    uint8_t seg;                /* segment override prefix */
    uint8_t lock;               /* LOCK prefix */
    uint8_t rex;                /* REX prefix */
};
52
/*
 * Little-endian fetch helpers: read an 8/16/32/64-bit value from the
 * instruction byte stream at the given pointer.
 */
#define getu8(x) (*(uint8_t *)(x))

#if defined(__i386__) || defined(__x86_64__)

/* Little-endian CPU which can handle unaligned references: load directly */
#define getu16(x) (*(uint16_t *)(x))
#define getu32(x) (*(uint32_t *)(x))
#define getu64(x) (*(uint64_t *)(x))

#else

/* Everything else: assemble the value from smaller pieces, low part first */
static uint16_t getu16(uint8_t *data)
{
    uint16_t low = data[0];
    uint16_t high = data[1];

    return (uint16_t)(low | (high << 8));
}

static uint32_t getu32(uint8_t *data)
{
    uint32_t low = getu16(data);
    uint32_t high = getu16(data + 2);

    return low | (high << 16);
}

static uint64_t getu64(uint8_t *data)
{
    uint64_t low = getu32(data);
    uint64_t high = getu32(data + 4);

    return low | (high << 32);
}

#endif

/* Signed variants: the same bits reinterpreted as a signed integer */
#define gets8(x) ((int8_t)getu8(x))
#define gets16(x) ((int16_t)getu16(x))
#define gets32(x) ((int32_t)getu32(x))
#define gets64(x) ((int64_t)getu64(x))
78
79/* Important: regval must already have been adjusted for rex extensions */
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +000080static enum reg_enum whichreg(int32_t regflags, int regval, int rex)
H. Peter Anvin0ee01422007-04-16 01:18:30 +000081{
H. Peter Anvin0da6b582007-09-12 20:32:39 -070082 if (!(regflags & (REGISTER|REGMEM)))
83 return 0; /* Registers not permissible?! */
84
85 regflags |= REGISTER;
86
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000087 if (!(REG_AL & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000088 return R_AL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000089 if (!(REG_AX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000090 return R_AX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000091 if (!(REG_EAX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000092 return R_EAX;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +000093 if (!(REG_RAX & ~regflags))
94 return R_RAX;
H. Peter Anvin10101f22003-02-24 23:22:45 +000095 if (!(REG_DL & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000096 return R_DL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000097 if (!(REG_DX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000098 return R_DX;
H. Peter Anvin10101f22003-02-24 23:22:45 +000099 if (!(REG_EDX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000100 return R_EDX;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000101 if (!(REG_RDX & ~regflags))
102 return R_RDX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000103 if (!(REG_CL & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000104 return R_CL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000105 if (!(REG_CX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000106 return R_CX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000107 if (!(REG_ECX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000108 return R_ECX;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000109 if (!(REG_RCX & ~regflags))
110 return R_RCX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000111 if (!(FPU0 & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000112 return R_ST0;
H. Peter Anvind7ed89e2002-04-30 20:52:08 +0000113 if (!(REG_CS & ~regflags))
H. Peter Anvin232badb2002-06-06 02:41:20 +0000114 return (regval == 1) ? R_CS : 0;
H. Peter Anvin76690a12002-04-30 20:52:49 +0000115 if (!(REG_DESS & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000116 return (regval == 0 || regval == 2
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000117 || regval == 3 ? rd_sreg[regval] : 0);
H. Peter Anvin76690a12002-04-30 20:52:49 +0000118 if (!(REG_FSGS & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000119 return (regval == 4 || regval == 5 ? rd_sreg[regval] : 0);
H. Peter Anvin232badb2002-06-06 02:41:20 +0000120 if (!(REG_SEG67 & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000121 return (regval == 6 || regval == 7 ? rd_sreg[regval] : 0);
H. Peter Anvin232badb2002-06-06 02:41:20 +0000122
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000123 /* All the entries below look up regval in an 16-entry array */
124 if (regval < 0 || regval > 15)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000125 return 0;
H. Peter Anvin232badb2002-06-06 02:41:20 +0000126
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700127 if (!(REG8 & ~regflags)) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000128 if (rex & REX_P)
129 return rd_reg8_rex[regval];
130 else
131 return rd_reg8[regval];
132 }
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700133 if (!(REG16 & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000134 return rd_reg16[regval];
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700135 if (!(REG32 & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000136 return rd_reg32[regval];
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700137 if (!(REG64 & ~regflags))
H. Peter Anvinb061d592007-04-16 02:02:06 +0000138 return rd_reg64[regval];
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000139 if (!(REG_SREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000140 return rd_sreg[regval & 7]; /* Ignore REX */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000141 if (!(REG_CREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000142 return rd_creg[regval];
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000143 if (!(REG_DREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000144 return rd_dreg[regval];
145 if (!(REG_TREG & ~regflags)) {
146 if (rex & REX_P)
147 return 0; /* TR registers are ill-defined with rex */
148 return rd_treg[regval];
149 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000150 if (!(FPUREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000151 return rd_fpureg[regval & 7]; /* Ignore REX */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000152 if (!(MMXREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000153 return rd_mmxreg[regval & 7]; /* Ignore REX */
H. Peter Anvin4836e332002-04-30 20:56:43 +0000154 if (!(XMMREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000155 return rd_xmmreg[regval];
H. Peter Anvin232badb2002-06-06 02:41:20 +0000156
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000157 return 0;
158}
159
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000160static const char *whichcond(int condval)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000161{
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000162 static int conds[] = {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000163 C_O, C_NO, C_C, C_NC, C_Z, C_NZ, C_NA, C_A,
164 C_S, C_NS, C_PE, C_PO, C_L, C_NL, C_NG, C_G
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000165 };
166 return conditions[conds[condval]];
167}
168
169/*
H. Peter Anvin7786c362007-09-17 18:45:44 -0700170 * Process a DREX suffix
171 */
172static uint8_t *do_drex(uint8_t *data, insn *ins)
173{
174 uint8_t drex = *data++;
175 operand *dst = &ins->oprs[ins->drexdst];
176
177 if ((drex & 8) != ((ins->rex & REX_OC) ? 8 : 0))
178 return NULL; /* OC0 mismatch */
179 ins->rex = (ins->rex & ~7) | (drex & 7);
180
181 dst->segment = SEG_RMREG;
182 dst->basereg = drex >> 4;
183 return data;
184}
185
186
187/*
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000188 * Process an effective address (ModRM) specification.
189 */
Keith Kaniosb7a89542007-04-12 02:40:54 +0000190static uint8_t *do_ea(uint8_t *data, int modrm, int asize,
H. Peter Anvin7786c362007-09-17 18:45:44 -0700191 int segsize, operand * op, insn *ins)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000192{
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000193 int mod, rm, scale, index, base;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700194 int rex;
195 uint8_t sib = 0;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000196
197 mod = (modrm >> 6) & 03;
198 rm = modrm & 07;
199
H. Peter Anvin7786c362007-09-17 18:45:44 -0700200 if (mod != 3 && rm == 4 && asize != 16)
201 sib = *data++;
202
203 if (ins->rex & REX_D) {
204 data = do_drex(data, ins);
205 if (!data)
206 return NULL;
207 }
208 rex = ins->rex;
209
H. Peter Anvine2c80182005-01-15 22:15:51 +0000210 if (mod == 3) { /* pure register version */
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000211 op->basereg = rm+(rex & REX_B ? 8 : 0);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000212 op->segment |= SEG_RMREG;
213 return data;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000214 }
215
216 op->addr_size = 0;
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000217 op->eaflags = 0;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000218
219 if (asize == 16) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000220 /*
221 * <mod> specifies the displacement size (none, byte or
222 * word), and <rm> specifies the register combination.
223 * Exception: mod=0,rm=6 does not specify [BP] as one might
224 * expect, but instead specifies [disp16].
225 */
226 op->indexreg = op->basereg = -1;
227 op->scale = 1; /* always, in 16 bits */
228 switch (rm) {
229 case 0:
230 op->basereg = R_BX;
231 op->indexreg = R_SI;
232 break;
233 case 1:
234 op->basereg = R_BX;
235 op->indexreg = R_DI;
236 break;
237 case 2:
238 op->basereg = R_BP;
239 op->indexreg = R_SI;
240 break;
241 case 3:
242 op->basereg = R_BP;
243 op->indexreg = R_DI;
244 break;
245 case 4:
246 op->basereg = R_SI;
247 break;
248 case 5:
249 op->basereg = R_DI;
250 break;
251 case 6:
252 op->basereg = R_BP;
253 break;
254 case 7:
255 op->basereg = R_BX;
256 break;
257 }
258 if (rm == 6 && mod == 0) { /* special case */
259 op->basereg = -1;
260 if (segsize != 16)
261 op->addr_size = 16;
262 mod = 2; /* fake disp16 */
263 }
264 switch (mod) {
265 case 0:
266 op->segment |= SEG_NODISP;
267 break;
268 case 1:
269 op->segment |= SEG_DISP8;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000270 op->offset = (int8_t)*data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000271 break;
272 case 2:
273 op->segment |= SEG_DISP16;
274 op->offset = *data++;
275 op->offset |= ((unsigned)*data++) << 8;
276 break;
277 }
278 return data;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000279 } else {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000280 /*
281 * Once again, <mod> specifies displacement size (this time
282 * none, byte or *dword*), while <rm> specifies the base
283 * register. Again, [EBP] is missing, replaced by a pure
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000284 * disp32 (this time that's mod=0,rm=*5*) in 32-bit mode,
285 * and RIP-relative addressing in 64-bit mode.
286 *
287 * However, rm=4
H. Peter Anvine2c80182005-01-15 22:15:51 +0000288 * indicates not a single base register, but instead the
289 * presence of a SIB byte...
290 */
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000291 int a64 = asize == 64;
292
H. Peter Anvine2c80182005-01-15 22:15:51 +0000293 op->indexreg = -1;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000294
295 if (a64)
296 op->basereg = rd_reg64[rm | ((rex & REX_B) ? 8 : 0)];
297 else
298 op->basereg = rd_reg32[rm | ((rex & REX_B) ? 8 : 0)];
299
H. Peter Anvine2c80182005-01-15 22:15:51 +0000300 if (rm == 5 && mod == 0) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000301 if (segsize == 64) {
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000302 op->eaflags |= EAF_REL;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000303 op->segment |= SEG_RELATIVE;
304 mod = 2; /* fake disp32 */
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000305 }
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000306
307 if (asize != 64)
308 op->addr_size = asize;
309
310 op->basereg = -1;
311 mod = 2; /* fake disp32 */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000312 }
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000313
H. Peter Anvine2c80182005-01-15 22:15:51 +0000314 if (rm == 4) { /* process SIB */
H. Peter Anvin7786c362007-09-17 18:45:44 -0700315 scale = (sib >> 6) & 03;
316 index = (sib >> 3) & 07;
317 base = sib & 07;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000318
H. Peter Anvine2c80182005-01-15 22:15:51 +0000319 op->scale = 1 << scale;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000320
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000321 if (index == 4)
322 op->indexreg = -1; /* ESP/RSP/R12 cannot be an index */
323 else if (a64)
324 op->indexreg = rd_reg64[index | ((rex & REX_X) ? 8 : 0)];
325 else
326 op->indexreg = rd_reg64[index | ((rex & REX_X) ? 8 : 0)];
327
328 if (base == 5 && mod == 0) {
329 op->basereg = -1;
330 mod = 2; /* Fake disp32 */
331 } else if (a64)
332 op->basereg = rd_reg64[base | ((rex & REX_B) ? 8 : 0)];
333 else
334 op->basereg = rd_reg32[base | ((rex & REX_B) ? 8 : 0)];
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000335
336 if (segsize != 32)
337 op->addr_size = 32;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000338 }
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000339
H. Peter Anvine2c80182005-01-15 22:15:51 +0000340 switch (mod) {
341 case 0:
342 op->segment |= SEG_NODISP;
343 break;
344 case 1:
345 op->segment |= SEG_DISP8;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000346 op->offset = gets8(data);
347 data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000348 break;
349 case 2:
350 op->segment |= SEG_DISP32;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000351 op->offset = getu32(data);
352 data += 4;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000353 break;
354 }
355 return data;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000356 }
357}
358
359/*
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000360 * Determine whether the instruction template in t corresponds to the data
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000361 * stream in data. Return the number of bytes matched if so.
362 */
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000363static int matches(const struct itemplate *t, uint8_t *data,
364 const struct prefix_info *prefix, int segsize, insn *ins)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000365{
Keith Kaniosb7a89542007-04-12 02:40:54 +0000366 uint8_t *r = (uint8_t *)(t->code);
367 uint8_t *origdata = data;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000368 int a_used = FALSE, o_used = FALSE;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000369 enum prefixes drep = 0;
370 uint8_t lock = prefix->lock;
371 int osize = prefix->osize;
372 int asize = prefix->asize;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700373 int i;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000374
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700375 for (i = 0; i < MAX_OPERANDS; i++) {
376 ins->oprs[i].segment = ins->oprs[i].addr_size =
377 (segsize == 64 ? SEG_64BIT : segsize == 32 ? SEG_32BIT : 0);
378 }
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000379 ins->condition = -1;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000380 ins->rex = prefix->rex;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000381
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000382 if (t->flags & (segsize == 64 ? IF_NOLONG : IF_LONG))
383 return FALSE;
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000384
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000385 if (prefix->rep == 0xF2)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000386 drep = P_REPNE;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000387 else if (prefix->rep == 0xF3)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000388 drep = P_REP;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000389
H. Peter Anvine2c80182005-01-15 22:15:51 +0000390 while (*r) {
391 int c = *r++;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000392
393 /* FIX: change this into a switch */
394 if (c >= 01 && c <= 03) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000395 while (c--)
396 if (*r++ != *data++)
397 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000398 } else if (c == 04) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000399 switch (*data++) {
400 case 0x07:
401 ins->oprs[0].basereg = 0;
402 break;
403 case 0x17:
404 ins->oprs[0].basereg = 2;
405 break;
406 case 0x1F:
407 ins->oprs[0].basereg = 3;
408 break;
409 default:
410 return FALSE;
411 }
H. Peter Anvinb061d592007-04-16 02:02:06 +0000412 } else if (c == 05) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000413 switch (*data++) {
414 case 0xA1:
415 ins->oprs[0].basereg = 4;
416 break;
417 case 0xA9:
418 ins->oprs[0].basereg = 5;
419 break;
420 default:
421 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000422 }
423 } else if (c == 06) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000424 switch (*data++) {
425 case 0x06:
426 ins->oprs[0].basereg = 0;
427 break;
428 case 0x0E:
429 ins->oprs[0].basereg = 1;
430 break;
431 case 0x16:
432 ins->oprs[0].basereg = 2;
433 break;
434 case 0x1E:
435 ins->oprs[0].basereg = 3;
436 break;
437 default:
438 return FALSE;
439 }
H. Peter Anvinb061d592007-04-16 02:02:06 +0000440 } else if (c == 07) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000441 switch (*data++) {
442 case 0xA0:
443 ins->oprs[0].basereg = 4;
444 break;
445 case 0xA8:
446 ins->oprs[0].basereg = 5;
447 break;
448 default:
449 return FALSE;
450 }
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700451 } else if (c >= 010 && c <= 013) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000452 int t = *r++, d = *data++;
453 if (d < t || d > t + 7)
454 return FALSE;
455 else {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000456 ins->oprs[c - 010].basereg = (d-t)+
457 (ins->rex & REX_B ? 8 : 0);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000458 ins->oprs[c - 010].segment |= SEG_RMREG;
459 }
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700460 } else if (c >= 014 && c <= 017) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000461 ins->oprs[c - 014].offset = (int8_t)*data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000462 ins->oprs[c - 014].segment |= SEG_SIGNED;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700463 } else if (c >= 020 && c <= 023) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000464 ins->oprs[c - 020].offset = *data++;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700465 } else if (c >= 024 && c <= 027) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000466 ins->oprs[c - 024].offset = *data++;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700467 } else if (c >= 030 && c <= 033) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000468 ins->oprs[c - 030].offset = getu16(data);
469 data += 2;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700470 } else if (c >= 034 && c <= 037) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000471 if (osize == 32) {
472 ins->oprs[c - 034].offset = getu32(data);
473 data += 4;
474 } else {
475 ins->oprs[c - 034].offset = getu16(data);
476 data += 2;
477 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000478 if (segsize != asize)
479 ins->oprs[c - 034].addr_size = asize;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700480 } else if (c >= 040 && c <= 043) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000481 ins->oprs[c - 040].offset = getu32(data);
482 data += 4;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700483 } else if (c >= 044 && c <= 047) {
H. Peter Anvinb061d592007-04-16 02:02:06 +0000484 switch (asize) {
485 case 16:
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000486 ins->oprs[c - 044].offset = getu16(data);
487 data += 2;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000488 break;
489 case 32:
490 ins->oprs[c - 044].offset = getu32(data);
491 data += 4;
492 break;
493 case 64:
494 ins->oprs[c - 044].offset = getu64(data);
495 data += 8;
496 break;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000497 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000498 if (segsize != asize)
499 ins->oprs[c - 044].addr_size = asize;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700500 } else if (c >= 050 && c <= 053) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000501 ins->oprs[c - 050].offset = gets8(data++);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000502 ins->oprs[c - 050].segment |= SEG_RELATIVE;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700503 } else if (c >= 054 && c <= 057) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000504 ins->oprs[c - 054].offset = getu64(data);
505 data += 8;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700506 } else if (c >= 060 && c <= 063) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000507 ins->oprs[c - 060].offset = gets16(data);
508 data += 2;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000509 ins->oprs[c - 060].segment |= SEG_RELATIVE;
510 ins->oprs[c - 060].segment &= ~SEG_32BIT;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700511 } else if (c >= 064 && c <= 067) {
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000512 if (osize == 16) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000513 ins->oprs[c - 064].offset = getu16(data);
514 data += 2;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000515 ins->oprs[c - 064].segment &= ~(SEG_32BIT|SEG_64BIT);
516 } else if (osize == 32) {
517 ins->oprs[c - 064].offset = getu32(data);
518 data += 4;
519 ins->oprs[c - 064].segment &= ~SEG_64BIT;
520 ins->oprs[c - 064].segment |= SEG_32BIT;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000521 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000522 if (segsize != osize) {
523 ins->oprs[c - 064].type =
H. Peter Anvin5a640e12007-05-29 23:57:12 +0000524 (ins->oprs[c - 064].type & ~SIZE_MASK)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000525 | ((osize == 16) ? BITS16 : BITS32);
526 }
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700527 } else if (c >= 070 && c <= 073) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000528 ins->oprs[c - 070].offset = getu32(data);
529 data += 4;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000530 ins->oprs[c - 070].segment |= SEG_32BIT | SEG_RELATIVE;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700531 } else if (c >= 0100 && c < 0140) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000532 int modrm = *data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000533 ins->oprs[c & 07].segment |= SEG_RMREG;
534 data = do_ea(data, modrm, asize, segsize,
H. Peter Anvin7786c362007-09-17 18:45:44 -0700535 &ins->oprs[(c >> 3) & 07], ins);
536 if (!data)
537 return FALSE;
538 ins->oprs[c & 07].basereg = ((modrm >> 3)&7)+
539 (ins->rex & REX_R ? 8 : 0);
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700540 } else if (c >= 0140 && c <= 0143) {
541 ins->oprs[c - 0140].offset = getu16(data);
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000542 data += 2;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700543 } else if (c >= 0150 && c <= 0153) {
544 ins->oprs[c - 0150].offset = getu32(data);
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000545 data += 4;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700546 } else if (c >= 0160 && c <= 0167) {
547 ins->rex |= (c & 4) ? REX_D|REX_OC : REX_D;
548 ins->drexdst = c & 3;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700549 } else if (c == 0170) {
550 if (*data++)
551 return FALSE;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700552 } else if (c == 0171) {
553 data = do_drex(data, ins);
554 if (!data)
555 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000556 } else if (c >= 0200 && c <= 0277) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000557 int modrm = *data++;
558 if (((modrm >> 3) & 07) != (c & 07))
559 return FALSE; /* spare field doesn't match up */
560 data = do_ea(data, modrm, asize, segsize,
H. Peter Anvin7786c362007-09-17 18:45:44 -0700561 &ins->oprs[(c >> 3) & 07], ins);
562 if (!data)
563 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000564 } else if (c == 0310) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000565 if (asize != 16)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000566 return FALSE;
567 else
568 a_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000569 } else if (c == 0311) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000570 if (asize == 16)
571 return FALSE;
572 else
573 a_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000574 } else if (c == 0312) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000575 if (asize != segsize)
576 return FALSE;
577 else
578 a_used = TRUE;
H. Peter Anvince2b3972007-05-30 22:21:11 +0000579 } else if (c == 0313) {
580 if (asize != 64)
581 return FALSE;
582 else
583 a_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000584 } else if (c == 0320) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000585 if (osize != 16)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000586 return FALSE;
587 else
588 o_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000589 } else if (c == 0321) {
590 if (osize != 32)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000591 return FALSE;
592 else
593 o_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000594 } else if (c == 0322) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000595 if (osize != (segsize == 16) ? 16 : 32)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000596 return FALSE;
597 else
598 o_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000599 } else if (c == 0323) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000600 ins->rex |= REX_W; /* 64-bit only instruction */
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000601 osize = 64;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000602 } else if (c == 0324) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000603 if (!(ins->rex & (REX_P|REX_W)) || osize != 64)
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000604 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000605 } else if (c == 0330) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000606 int t = *r++, d = *data++;
607 if (d < t || d > t + 15)
608 return FALSE;
609 else
610 ins->condition = d - t;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000611 } else if (c == 0331) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000612 if (prefix->rep)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000613 return FALSE;
H. Peter Anvincb9b6902007-09-12 21:58:51 -0700614 } else if (c == 0332) {
615 if (prefix->rep != 0xF2)
616 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000617 } else if (c == 0333) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000618 if (prefix->rep != 0xF3)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000619 return FALSE;
620 drep = 0;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000621 } else if (c == 0334) {
622 if (lock) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000623 ins->rex |= REX_R;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000624 lock = 0;
625 }
H. Peter Anvincb9b6902007-09-12 21:58:51 -0700626 } else if (c == 0335) {
627 if (drep == P_REP)
628 drep = P_REPE;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000629 } else if (c == 0364) {
630 if (prefix->osp)
631 return FALSE;
632 } else if (c == 0365) {
633 if (prefix->asp)
634 return FALSE;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000635 } else if (c == 0366) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000636 if (!prefix->osp)
637 return FALSE;
638 o_used = TRUE;
639 } else if (c == 0367) {
640 if (!prefix->asp)
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000641 return FALSE;
642 o_used = TRUE;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000643 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000644 }
645
H. Peter Anvin7786c362007-09-17 18:45:44 -0700646 /* REX cannot be combined with DREX */
647 if ((ins->rex & REX_D) && (prefix->rex))
648 return FALSE;
649
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000650 /*
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000651 * Check for unused rep or a/o prefixes.
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000652 */
H. Peter Anvinc5b9ce02007-09-22 21:49:51 -0700653 for (i = 0; i < t->operands; i++) {
654 if (ins->oprs[i].segment != SEG_RMREG)
655 a_used = TRUE;
656 }
657
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000658 ins->nprefix = 0;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000659 if (lock)
660 ins->prefixes[ins->nprefix++] = P_LOCK;
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000661 if (drep)
662 ins->prefixes[ins->nprefix++] = drep;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000663 if (!a_used && asize != segsize)
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000664 ins->prefixes[ins->nprefix++] = asize == 16 ? P_A16 : P_A32;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000665 if (!o_used && osize == ((segsize == 16) ? 32 : 16))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000666 ins->prefixes[ins->nprefix++] = osize == 16 ? P_O16 : P_O32;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000667
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000668 /* Fix: check for redundant REX prefixes */
669
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000670 return data - origdata;
671}
672
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000673int32_t disasm(uint8_t *data, char *output, int outbufsize, int segsize,
Keith Kaniosb7a89542007-04-12 02:40:54 +0000674 int32_t offset, int autosync, uint32_t prefer)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000675{
H. Peter Anvin3360d792007-09-11 04:16:57 +0000676 const struct itemplate * const *p, * const *best_p;
H. Peter Anvin19e20102007-09-18 15:08:20 -0700677 const struct disasm_index *ix;
678 uint8_t *dp;
H. Peter Anvin4836e332002-04-30 20:56:43 +0000679 int length, best_length = 0;
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000680 char *segover;
H. Peter Anvin19e20102007-09-18 15:08:20 -0700681 int i, slen, colon, n;
Keith Kaniosb7a89542007-04-12 02:40:54 +0000682 uint8_t *origdata;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000683 int works;
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000684 insn tmp_ins, ins;
Keith Kaniosb7a89542007-04-12 02:40:54 +0000685 uint32_t goodness, best;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000686 int best_pref;
687 struct prefix_info prefix;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000688
H. Peter Anvinbfb888c2007-09-11 04:26:44 +0000689 memset(&ins, 0, sizeof ins);
690
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000691 /*
692 * Scan for prefixes.
693 */
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000694 memset(&prefix, 0, sizeof prefix);
695 prefix.asize = segsize;
696 prefix.osize = (segsize == 64) ? 32 : segsize;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000697 segover = NULL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000698 origdata = data;
699 for (;;) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000700 if (*data == 0xF3 || *data == 0xF2)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000701 prefix.rep = *data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000702 else if (*data == 0xF0)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000703 prefix.lock = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000704 else if (*data == 0x2E)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000705 segover = "cs", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000706 else if (*data == 0x36)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000707 segover = "ss", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000708 else if (*data == 0x3E)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000709 segover = "ds", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000710 else if (*data == 0x26)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000711 segover = "es", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000712 else if (*data == 0x64)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000713 segover = "fs", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000714 else if (*data == 0x65)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000715 segover = "gs", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000716 else if (*data == 0x66) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000717 prefix.osize = (segsize == 16) ? 32 : 16;
718 prefix.osp = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000719 } else if (*data == 0x67) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000720 prefix.asize = (segsize == 32) ? 16 : 32;
721 prefix.asp = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000722 } else if (segsize == 64 && (*data & 0xf0) == REX_P) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000723 prefix.rex = *data++;
724 if (prefix.rex & REX_W)
725 prefix.osize = 64;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000726 break; /* REX is always the last prefix */
727 } else {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000728 break;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000729 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000730 }
731
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000732 best = -1; /* Worst possible */
H. Peter Anvin4836e332002-04-30 20:56:43 +0000733 best_p = NULL;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000734 best_pref = INT_MAX;
735
H. Peter Anvin19e20102007-09-18 15:08:20 -0700736 dp = data;
737 ix = itable + *dp++;
738 while (ix->n == (size_t)-1) {
739 ix = (const struct disasm_index *)ix->p + *dp++;
740 }
741
742 p = (const struct itemplate * const *)ix->p;
743 for (n = ix->n; n; n--, p++) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000744 if ((length = matches(*p, data, &prefix, segsize, &tmp_ins))) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000745 works = TRUE;
746 /*
747 * Final check to make sure the types of r/m match up.
H. Peter Anvindbf130e2007-05-30 00:18:26 +0000748 * XXX: Need to make sure this is actually correct.
H. Peter Anvine2c80182005-01-15 22:15:51 +0000749 */
750 for (i = 0; i < (*p)->operands; i++) {
H. Peter Anvin7786c362007-09-17 18:45:44 -0700751 if (!((*p)->opd[i] & SAME_AS) &&
752 (
753 /* If it's a mem-only EA but we have a register, die. */
754 ((tmp_ins.oprs[i].segment & SEG_RMREG) &&
755 !(MEMORY & ~(*p)->opd[i])) ||
756 /* If it's a reg-only EA but we have a memory ref, die. */
757 (!(tmp_ins.oprs[i].segment & SEG_RMREG) &&
758 !(REG_EA & ~(*p)->opd[i]) &&
759 !((*p)->opd[i] & REG_SMASK)) ||
760 /* Register type mismatch (eg FS vs REG_DESS): die. */
761 ((((*p)->opd[i] & (REGISTER | FPUREG)) ||
762 (tmp_ins.oprs[i].segment & SEG_RMREG)) &&
763 !whichreg((*p)->opd[i],
764 tmp_ins.oprs[i].basereg, tmp_ins.rex))
765 )) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000766 works = FALSE;
767 break;
768 }
769 }
770
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000771 /*
772 * Note: we always prefer instructions which incorporate
773 * prefixes in the instructions themselves. This is to allow
774 * e.g. PAUSE to be preferred to REP NOP, and deal with
775 * MMX/SSE instructions where prefixes are used to select
776 * between MMX and SSE register sets or outright opcode
777 * selection.
778 */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000779 if (works) {
780 goodness = ((*p)->flags & IF_PFMASK) ^ prefer;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000781 if (tmp_ins.nprefix < best_pref ||
782 (tmp_ins.nprefix == best_pref && goodness < best)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000783 /* This is the best one found so far */
784 best = goodness;
785 best_p = p;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000786 best_pref = tmp_ins.nprefix;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000787 best_length = length;
788 ins = tmp_ins;
789 }
790 }
791 }
H. Peter Anvin4836e332002-04-30 20:56:43 +0000792 }
H. Peter Anvineba20a72002-04-30 20:53:55 +0000793
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000794 if (!best_p)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000795 return 0; /* no instruction was matched */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000796
H. Peter Anvin4836e332002-04-30 20:56:43 +0000797 /* Pick the best match */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000798 p = best_p;
H. Peter Anvin4836e332002-04-30 20:56:43 +0000799 length = best_length;
800
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000801 slen = 0;
802
Ed Beroset64ab5192004-12-15 23:32:57 +0000803 /* TODO: snprintf returns the value that the string would have if
H. Peter Anvine2c80182005-01-15 22:15:51 +0000804 * the buffer were long enough, and not the actual length of
805 * the returned string, so each instance of using the return
806 * value of snprintf should actually be checked to assure that
807 * the return value is "sane." Maybe a macro wrapper could
808 * be used for that purpose.
809 */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000810 for (i = 0; i < ins.nprefix; i++)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000811 switch (ins.prefixes[i]) {
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000812 case P_LOCK:
813 slen += snprintf(output + slen, outbufsize - slen, "lock ");
814 break;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000815 case P_REP:
816 slen += snprintf(output + slen, outbufsize - slen, "rep ");
817 break;
818 case P_REPE:
819 slen += snprintf(output + slen, outbufsize - slen, "repe ");
820 break;
821 case P_REPNE:
822 slen += snprintf(output + slen, outbufsize - slen, "repne ");
823 break;
824 case P_A16:
825 slen += snprintf(output + slen, outbufsize - slen, "a16 ");
826 break;
827 case P_A32:
828 slen += snprintf(output + slen, outbufsize - slen, "a32 ");
829 break;
830 case P_O16:
831 slen += snprintf(output + slen, outbufsize - slen, "o16 ");
832 break;
833 case P_O32:
834 slen += snprintf(output + slen, outbufsize - slen, "o32 ");
835 break;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000836 default:
837 break;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000838 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000839
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000840 for (i = 0; i < (int)elements(ico); i++)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000841 if ((*p)->opcode == ico[i]) {
842 slen +=
843 snprintf(output + slen, outbufsize - slen, "%s%s", icn[i],
844 whichcond(ins.condition));
845 break;
846 }
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000847 if (i >= (int)elements(ico))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000848 slen +=
849 snprintf(output + slen, outbufsize - slen, "%s",
850 insn_names[(*p)->opcode]);
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000851 colon = FALSE;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000852 length += data - origdata; /* fix up for prefixes */
853 for (i = 0; i < (*p)->operands; i++) {
H. Peter Anvin7786c362007-09-17 18:45:44 -0700854 opflags_t t = (*p)->opd[i];
855 const operand *o = &ins.oprs[i];
856 int64_t offs;
857
858 if (t & SAME_AS) {
859 o = &ins.oprs[t & ~SAME_AS];
860 t = (*p)->opd[t & ~SAME_AS];
861 }
862
H. Peter Anvine2c80182005-01-15 22:15:51 +0000863 output[slen++] = (colon ? ':' : i == 0 ? ' ' : ',');
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000864
H. Peter Anvin7786c362007-09-17 18:45:44 -0700865 offs = o->offset;
866 if (o->segment & SEG_RELATIVE) {
867 offs += offset + length;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000868 /*
869 * sort out wraparound
870 */
H. Peter Anvin7786c362007-09-17 18:45:44 -0700871 if (!(o->segment & (SEG_32BIT|SEG_64BIT)))
872 offs &= 0xffff;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000873 /*
874 * add sync marker, if autosync is on
875 */
876 if (autosync)
H. Peter Anvin7786c362007-09-17 18:45:44 -0700877 add_sync(offs, 0L);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000878 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000879
H. Peter Anvin7786c362007-09-17 18:45:44 -0700880 if (t & COLON)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000881 colon = TRUE;
882 else
883 colon = FALSE;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000884
H. Peter Anvin7786c362007-09-17 18:45:44 -0700885 if ((t & (REGISTER | FPUREG)) ||
886 (o->segment & SEG_RMREG)) {
887 enum reg_enum reg;
888 reg = whichreg(t, o->basereg, ins.rex);
889 if (t & TO)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000890 slen += snprintf(output + slen, outbufsize - slen, "to ");
891 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700892 reg_names[reg - EXPR_REG_START]);
893 } else if (!(UNITY & ~t)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000894 output[slen++] = '1';
H. Peter Anvin7786c362007-09-17 18:45:44 -0700895 } else if (t & IMMEDIATE) {
896 if (t & BITS8) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000897 slen +=
898 snprintf(output + slen, outbufsize - slen, "byte ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700899 if (o->segment & SEG_SIGNED) {
900 if (offs < 0) {
901 offs *= -1;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000902 output[slen++] = '-';
903 } else
904 output[slen++] = '+';
905 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700906 } else if (t & BITS16) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000907 slen +=
908 snprintf(output + slen, outbufsize - slen, "word ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700909 } else if (t & BITS32) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000910 slen +=
911 snprintf(output + slen, outbufsize - slen, "dword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700912 } else if (t & BITS64) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000913 slen +=
914 snprintf(output + slen, outbufsize - slen, "qword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700915 } else if (t & NEAR) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000916 slen +=
917 snprintf(output + slen, outbufsize - slen, "near ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700918 } else if (t & SHORT) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000919 slen +=
920 snprintf(output + slen, outbufsize - slen, "short ");
921 }
922 slen +=
Keith Kanios93f2e9a2007-04-14 00:10:59 +0000923 snprintf(output + slen, outbufsize - slen, "0x%"PRIx64"",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700924 offs);
925 } else if (!(MEM_OFFS & ~t)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000926 slen +=
Keith Kanios93f2e9a2007-04-14 00:10:59 +0000927 snprintf(output + slen, outbufsize - slen, "[%s%s%s0x%"PRIx64"]",
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000928 (segover ? segover : ""),
929 (segover ? ":" : ""),
H. Peter Anvin7786c362007-09-17 18:45:44 -0700930 (o->addr_size ==
931 32 ? "dword " : o->addr_size ==
932 16 ? "word " : ""), offs);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000933 segover = NULL;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700934 } else if (!(REGMEM & ~t)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000935 int started = FALSE;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700936 if (t & BITS8)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000937 slen +=
938 snprintf(output + slen, outbufsize - slen, "byte ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700939 if (t & BITS16)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000940 slen +=
941 snprintf(output + slen, outbufsize - slen, "word ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700942 if (t & BITS32)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000943 slen +=
944 snprintf(output + slen, outbufsize - slen, "dword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700945 if (t & BITS64)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000946 slen +=
947 snprintf(output + slen, outbufsize - slen, "qword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700948 if (t & BITS80)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000949 slen +=
950 snprintf(output + slen, outbufsize - slen, "tword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700951 if (t & FAR)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000952 slen += snprintf(output + slen, outbufsize - slen, "far ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700953 if (t & NEAR)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000954 slen +=
955 snprintf(output + slen, outbufsize - slen, "near ");
956 output[slen++] = '[';
H. Peter Anvin7786c362007-09-17 18:45:44 -0700957 if (o->addr_size)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000958 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700959 (o->addr_size == 64 ? "qword " :
960 o->addr_size == 32 ? "dword " :
961 o->addr_size == 16 ? "word " :
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000962 ""));
H. Peter Anvin7786c362007-09-17 18:45:44 -0700963 if (o->eaflags & EAF_REL)
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000964 slen += snprintf(output + slen, outbufsize - slen, "rel ");
H. Peter Anvine2c80182005-01-15 22:15:51 +0000965 if (segover) {
966 slen +=
967 snprintf(output + slen, outbufsize - slen, "%s:",
968 segover);
969 segover = NULL;
970 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700971 if (o->basereg != -1) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000972 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700973 reg_names[(o->basereg -
H. Peter Anvine2c80182005-01-15 22:15:51 +0000974 EXPR_REG_START)]);
975 started = TRUE;
976 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700977 if (o->indexreg != -1) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000978 if (started)
979 output[slen++] = '+';
980 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700981 reg_names[(o->indexreg -
H. Peter Anvine2c80182005-01-15 22:15:51 +0000982 EXPR_REG_START)]);
H. Peter Anvin7786c362007-09-17 18:45:44 -0700983 if (o->scale > 1)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000984 slen +=
985 snprintf(output + slen, outbufsize - slen, "*%d",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700986 o->scale);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000987 started = TRUE;
988 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700989 if (o->segment & SEG_DISP8) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000990 int minus = 0;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700991 int8_t offset = offs;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000992 if (offset < 0) {
993 minus = 1;
994 offset = -offset;
995 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000996 slen +=
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000997 snprintf(output + slen, outbufsize - slen, "%s0x%"PRIx8"",
998 minus ? "-" : "+", offset);
H. Peter Anvin7786c362007-09-17 18:45:44 -0700999 } else if (o->segment & SEG_DISP16) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001000 int minus = 0;
H. Peter Anvin7786c362007-09-17 18:45:44 -07001001 int16_t offset = offs;
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001002 if (offset < 0) {
1003 minus = 1;
1004 offset = -offset;
1005 }
H. Peter Anvine2c80182005-01-15 22:15:51 +00001006 slen +=
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001007 snprintf(output + slen, outbufsize - slen, "%s0x%"PRIx16"",
1008 minus ? "-" : started ? "+" : "", offset);
H. Peter Anvin7786c362007-09-17 18:45:44 -07001009 } else if (o->segment & SEG_DISP32) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001010 char *prefix = "";
H. Peter Anvin7786c362007-09-17 18:45:44 -07001011 int32_t offset = offs;
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +00001012 if (offset < 0) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001013 offset = -offset;
1014 prefix = "-";
1015 } else {
1016 prefix = started ? "+" : "";
1017 }
1018 slen +=
1019 snprintf(output + slen, outbufsize - slen,
1020 "%s0x%"PRIx32"", prefix, offset);
H. Peter Anvine2c80182005-01-15 22:15:51 +00001021 }
1022 output[slen++] = ']';
1023 } else {
1024 slen +=
1025 snprintf(output + slen, outbufsize - slen, "<operand%d>",
1026 i);
1027 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +00001028 }
1029 output[slen] = '\0';
H. Peter Anvine2c80182005-01-15 22:15:51 +00001030 if (segover) { /* unused segment override */
Keith Kaniosa6dfa782007-04-13 16:47:53 +00001031 char *p = output;
H. Peter Anvine2c80182005-01-15 22:15:51 +00001032 int count = slen + 1;
1033 while (count--)
1034 p[count + 3] = p[count];
1035 strncpy(output, segover, 2);
1036 output[2] = ' ';
H. Peter Anvinea6e34d2002-04-30 20:51:32 +00001037 }
1038 return length;
1039}
1040
/*
 * Render the single byte at `data' as a `db' directive of the form
 * "db 0xNN" (two upper-case hex digits) into `output'.
 *
 * At most `outbufsize' bytes are written, including the terminating
 * NUL; longer text is truncated by snprintf().  If `outbufsize' is
 * zero or negative nothing is written at all.
 *
 * Always returns 1 (exactly one input byte is read).
 */
int32_t eatbyte(uint8_t *data, char *output, int outbufsize)
{
    /*
     * snprintf() takes a size_t: a negative int would be converted to
     * an enormous bound, so only format when the size is positive.
     */
    if (outbufsize > 0)
        snprintf(output, (size_t)outbufsize, "db 0x%02X",
                 (unsigned int)*data);  /* %X expects unsigned int */
    return 1;
}