/* disasm.c   where all the _work_ gets done in the Netwide Disassembler
 *
 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
 * Julian Hall. All rights reserved. The software is
 * redistributable under the licence given in the file "Licence"
 * distributed in the NASM archive.
 *
 * initial version 27/iii/95 by Simon Tatham
 */
10
11#include <stdio.h>
12#include <string.h>
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +000013#include <limits.h>
Keith Kaniosb7a89542007-04-12 02:40:54 +000014#include <inttypes.h>
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000015
16#include "nasm.h"
17#include "disasm.h"
18#include "sync.h"
19#include "insns.h"
20
21#include "names.c"
22
/*
 * Flags that go into the `segment' field of `insn' structures
 * during disassembly.  Each flag is a distinct bit so they can be
 * OR'ed together.
 */
#define SEG_RELATIVE      1     /* offset is relative (jump/call, RIP-rel) */
#define SEG_32BIT         2     /* set for every operand when segsize == 32 */
#define SEG_RMREG         4     /* operand is a register given by number */
#define SEG_DISP8         8     /* effective address carries a disp8 */
#define SEG_DISP16       16     /* effective address carries a disp16 */
#define SEG_DISP32       32     /* effective address carries a disp32 */
#define SEG_NODISP       64     /* effective address has no displacement */
#define SEG_SIGNED      128     /* immediate was read as a signed byte */
#define SEG_64BIT       256     /* set for every operand when segsize == 64 */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000036
H. Peter Anvin232badb2002-06-06 02:41:20 +000037#include "regdis.c"
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000038
/*
 * Prefix information
 *
 * Filled in by the prefix scan at the top of disasm() and consulted
 * (read-only) by matches().  The "present" fields hold the actual prefix
 * byte that was seen, or 0 if no such prefix was found.
 */
struct prefix_info {
    uint8_t osize;              /* Operand size, in bits */
    uint8_t asize;              /* Address size, in bits */
    uint8_t osp;                /* Operand size prefix present (0x66) */
    uint8_t asp;                /* Address size prefix present (0x67) */
    uint8_t rep;                /* Rep prefix present (0xF2 or 0xF3) */
    uint8_t seg;                /* Segment override prefix present */
    uint8_t lock;               /* Lock prefix present (0xF0) */
    uint8_t rex;                /* Rex prefix present */
};
52
/*
 * Fetch little-endian values from the instruction byte stream.
 *
 * The multi-byte fetches are assembled one byte at a time on every
 * target: the stream has no alignment guarantee, and reading it through
 * a casted uint16_t/uint32_t/uint64_t pointer would be both an unaligned
 * access and a strict-aliasing violation.
 */
#define getu8(x) (*(uint8_t *)(x))

/* Read an unsigned 16-bit little-endian value starting at data[0]. */
static uint16_t getu16(const uint8_t *data)
{
    return (uint16_t)((uint16_t)data[0] | ((uint16_t)data[1] << 8));
}

/* Read an unsigned 32-bit little-endian value starting at data[0]. */
static uint32_t getu32(const uint8_t *data)
{
    return (uint32_t)getu16(data) | ((uint32_t)getu16(data + 2) << 16);
}

/* Read an unsigned 64-bit little-endian value starting at data[0]. */
static uint64_t getu64(const uint8_t *data)
{
    return (uint64_t)getu32(data) | ((uint64_t)getu32(data + 4) << 32);
}

/* Signed variants: same bytes, reinterpreted as two's complement. */
#define gets8(x) ((int8_t)getu8(x))
#define gets16(x) ((int16_t)getu16(x))
#define gets32(x) ((int32_t)getu32(x))
#define gets64(x) ((int64_t)getu64(x))
78
79/* Important: regval must already have been adjusted for rex extensions */
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +000080static enum reg_enum whichreg(int32_t regflags, int regval, int rex)
H. Peter Anvin0ee01422007-04-16 01:18:30 +000081{
H. Peter Anvin0da6b582007-09-12 20:32:39 -070082 if (!(regflags & (REGISTER|REGMEM)))
83 return 0; /* Registers not permissible?! */
84
85 regflags |= REGISTER;
86
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000087 if (!(REG_AL & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000088 return R_AL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000089 if (!(REG_AX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000090 return R_AX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000091 if (!(REG_EAX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000092 return R_EAX;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +000093 if (!(REG_RAX & ~regflags))
94 return R_RAX;
H. Peter Anvin10101f22003-02-24 23:22:45 +000095 if (!(REG_DL & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000096 return R_DL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000097 if (!(REG_DX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +000098 return R_DX;
H. Peter Anvin10101f22003-02-24 23:22:45 +000099 if (!(REG_EDX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000100 return R_EDX;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000101 if (!(REG_RDX & ~regflags))
102 return R_RDX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000103 if (!(REG_CL & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000104 return R_CL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000105 if (!(REG_CX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000106 return R_CX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000107 if (!(REG_ECX & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000108 return R_ECX;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000109 if (!(REG_RCX & ~regflags))
110 return R_RCX;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000111 if (!(FPU0 & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000112 return R_ST0;
H. Peter Anvind7ed89e2002-04-30 20:52:08 +0000113 if (!(REG_CS & ~regflags))
H. Peter Anvin232badb2002-06-06 02:41:20 +0000114 return (regval == 1) ? R_CS : 0;
H. Peter Anvin76690a12002-04-30 20:52:49 +0000115 if (!(REG_DESS & ~regflags))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000116 return (regval == 0 || regval == 2
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000117 || regval == 3 ? rd_sreg[regval] : 0);
H. Peter Anvin76690a12002-04-30 20:52:49 +0000118 if (!(REG_FSGS & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000119 return (regval == 4 || regval == 5 ? rd_sreg[regval] : 0);
H. Peter Anvin232badb2002-06-06 02:41:20 +0000120 if (!(REG_SEG67 & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000121 return (regval == 6 || regval == 7 ? rd_sreg[regval] : 0);
H. Peter Anvin232badb2002-06-06 02:41:20 +0000122
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000123 /* All the entries below look up regval in an 16-entry array */
124 if (regval < 0 || regval > 15)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000125 return 0;
H. Peter Anvin232badb2002-06-06 02:41:20 +0000126
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700127 if (!(REG8 & ~regflags)) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000128 if (rex & REX_P)
129 return rd_reg8_rex[regval];
130 else
131 return rd_reg8[regval];
132 }
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700133 if (!(REG16 & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000134 return rd_reg16[regval];
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700135 if (!(REG32 & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000136 return rd_reg32[regval];
H. Peter Anvin0da6b582007-09-12 20:32:39 -0700137 if (!(REG64 & ~regflags))
H. Peter Anvinb061d592007-04-16 02:02:06 +0000138 return rd_reg64[regval];
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000139 if (!(REG_SREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000140 return rd_sreg[regval & 7]; /* Ignore REX */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000141 if (!(REG_CREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000142 return rd_creg[regval];
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000143 if (!(REG_DREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000144 return rd_dreg[regval];
145 if (!(REG_TREG & ~regflags)) {
146 if (rex & REX_P)
147 return 0; /* TR registers are ill-defined with rex */
148 return rd_treg[regval];
149 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000150 if (!(FPUREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000151 return rd_fpureg[regval & 7]; /* Ignore REX */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000152 if (!(MMXREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000153 return rd_mmxreg[regval & 7]; /* Ignore REX */
H. Peter Anvin4836e332002-04-30 20:56:43 +0000154 if (!(XMMREG & ~regflags))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000155 return rd_xmmreg[regval];
H. Peter Anvin232badb2002-06-06 02:41:20 +0000156
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000157 return 0;
158}
159
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000160static const char *whichcond(int condval)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000161{
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000162 static int conds[] = {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000163 C_O, C_NO, C_C, C_NC, C_Z, C_NZ, C_NA, C_A,
164 C_S, C_NS, C_PE, C_PO, C_L, C_NL, C_NG, C_G
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000165 };
166 return conditions[conds[condval]];
167}
168
169/*
H. Peter Anvin7786c362007-09-17 18:45:44 -0700170 * Process a DREX suffix
171 */
172static uint8_t *do_drex(uint8_t *data, insn *ins)
173{
174 uint8_t drex = *data++;
175 operand *dst = &ins->oprs[ins->drexdst];
176
177 if ((drex & 8) != ((ins->rex & REX_OC) ? 8 : 0))
178 return NULL; /* OC0 mismatch */
179 ins->rex = (ins->rex & ~7) | (drex & 7);
180
181 dst->segment = SEG_RMREG;
182 dst->basereg = drex >> 4;
183 return data;
184}
185
186
187/*
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000188 * Process an effective address (ModRM) specification.
189 */
Keith Kaniosb7a89542007-04-12 02:40:54 +0000190static uint8_t *do_ea(uint8_t *data, int modrm, int asize,
H. Peter Anvin7786c362007-09-17 18:45:44 -0700191 int segsize, operand * op, insn *ins)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000192{
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000193 int mod, rm, scale, index, base;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700194 int rex;
195 uint8_t sib = 0;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000196
197 mod = (modrm >> 6) & 03;
198 rm = modrm & 07;
199
H. Peter Anvin7786c362007-09-17 18:45:44 -0700200 if (mod != 3 && rm == 4 && asize != 16)
201 sib = *data++;
202
203 if (ins->rex & REX_D) {
204 data = do_drex(data, ins);
205 if (!data)
206 return NULL;
207 }
208 rex = ins->rex;
209
H. Peter Anvine2c80182005-01-15 22:15:51 +0000210 if (mod == 3) { /* pure register version */
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000211 op->basereg = rm+(rex & REX_B ? 8 : 0);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000212 op->segment |= SEG_RMREG;
213 return data;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000214 }
215
216 op->addr_size = 0;
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000217 op->eaflags = 0;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000218
219 if (asize == 16) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000220 /*
221 * <mod> specifies the displacement size (none, byte or
222 * word), and <rm> specifies the register combination.
223 * Exception: mod=0,rm=6 does not specify [BP] as one might
224 * expect, but instead specifies [disp16].
225 */
226 op->indexreg = op->basereg = -1;
227 op->scale = 1; /* always, in 16 bits */
228 switch (rm) {
229 case 0:
230 op->basereg = R_BX;
231 op->indexreg = R_SI;
232 break;
233 case 1:
234 op->basereg = R_BX;
235 op->indexreg = R_DI;
236 break;
237 case 2:
238 op->basereg = R_BP;
239 op->indexreg = R_SI;
240 break;
241 case 3:
242 op->basereg = R_BP;
243 op->indexreg = R_DI;
244 break;
245 case 4:
246 op->basereg = R_SI;
247 break;
248 case 5:
249 op->basereg = R_DI;
250 break;
251 case 6:
252 op->basereg = R_BP;
253 break;
254 case 7:
255 op->basereg = R_BX;
256 break;
257 }
258 if (rm == 6 && mod == 0) { /* special case */
259 op->basereg = -1;
260 if (segsize != 16)
261 op->addr_size = 16;
262 mod = 2; /* fake disp16 */
263 }
264 switch (mod) {
265 case 0:
266 op->segment |= SEG_NODISP;
267 break;
268 case 1:
269 op->segment |= SEG_DISP8;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000270 op->offset = (int8_t)*data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000271 break;
272 case 2:
273 op->segment |= SEG_DISP16;
274 op->offset = *data++;
275 op->offset |= ((unsigned)*data++) << 8;
276 break;
277 }
278 return data;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000279 } else {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000280 /*
281 * Once again, <mod> specifies displacement size (this time
282 * none, byte or *dword*), while <rm> specifies the base
283 * register. Again, [EBP] is missing, replaced by a pure
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000284 * disp32 (this time that's mod=0,rm=*5*) in 32-bit mode,
285 * and RIP-relative addressing in 64-bit mode.
286 *
287 * However, rm=4
H. Peter Anvine2c80182005-01-15 22:15:51 +0000288 * indicates not a single base register, but instead the
289 * presence of a SIB byte...
290 */
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000291 int a64 = asize == 64;
292
H. Peter Anvine2c80182005-01-15 22:15:51 +0000293 op->indexreg = -1;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000294
295 if (a64)
296 op->basereg = rd_reg64[rm | ((rex & REX_B) ? 8 : 0)];
297 else
298 op->basereg = rd_reg32[rm | ((rex & REX_B) ? 8 : 0)];
299
H. Peter Anvine2c80182005-01-15 22:15:51 +0000300 if (rm == 5 && mod == 0) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000301 if (segsize == 64) {
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000302 op->eaflags |= EAF_REL;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000303 op->segment |= SEG_RELATIVE;
304 mod = 2; /* fake disp32 */
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000305 }
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000306
307 if (asize != 64)
308 op->addr_size = asize;
309
310 op->basereg = -1;
311 mod = 2; /* fake disp32 */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000312 }
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000313
H. Peter Anvine2c80182005-01-15 22:15:51 +0000314 if (rm == 4) { /* process SIB */
H. Peter Anvin7786c362007-09-17 18:45:44 -0700315 scale = (sib >> 6) & 03;
316 index = (sib >> 3) & 07;
317 base = sib & 07;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000318
H. Peter Anvine2c80182005-01-15 22:15:51 +0000319 op->scale = 1 << scale;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000320
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000321 if (index == 4)
322 op->indexreg = -1; /* ESP/RSP/R12 cannot be an index */
323 else if (a64)
324 op->indexreg = rd_reg64[index | ((rex & REX_X) ? 8 : 0)];
325 else
326 op->indexreg = rd_reg64[index | ((rex & REX_X) ? 8 : 0)];
327
328 if (base == 5 && mod == 0) {
329 op->basereg = -1;
330 mod = 2; /* Fake disp32 */
331 } else if (a64)
332 op->basereg = rd_reg64[base | ((rex & REX_B) ? 8 : 0)];
333 else
334 op->basereg = rd_reg32[base | ((rex & REX_B) ? 8 : 0)];
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000335
336 if (segsize != 32)
337 op->addr_size = 32;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000338 }
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000339
H. Peter Anvine2c80182005-01-15 22:15:51 +0000340 switch (mod) {
341 case 0:
342 op->segment |= SEG_NODISP;
343 break;
344 case 1:
345 op->segment |= SEG_DISP8;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000346 op->offset = gets8(data);
347 data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000348 break;
349 case 2:
350 op->segment |= SEG_DISP32;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000351 op->offset = getu32(data);
352 data += 4;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000353 break;
354 }
355 return data;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000356 }
357}
358
359/*
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000360 * Determine whether the instruction template in t corresponds to the data
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000361 * stream in data. Return the number of bytes matched if so.
362 */
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000363static int matches(const struct itemplate *t, uint8_t *data,
364 const struct prefix_info *prefix, int segsize, insn *ins)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000365{
Keith Kaniosb7a89542007-04-12 02:40:54 +0000366 uint8_t *r = (uint8_t *)(t->code);
367 uint8_t *origdata = data;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000368 int a_used = FALSE, o_used = FALSE;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000369 enum prefixes drep = 0;
370 uint8_t lock = prefix->lock;
371 int osize = prefix->osize;
372 int asize = prefix->asize;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700373 int i;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000374
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700375 for (i = 0; i < MAX_OPERANDS; i++) {
376 ins->oprs[i].segment = ins->oprs[i].addr_size =
377 (segsize == 64 ? SEG_64BIT : segsize == 32 ? SEG_32BIT : 0);
378 }
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000379 ins->condition = -1;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000380 ins->rex = prefix->rex;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000381
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000382 if (t->flags & (segsize == 64 ? IF_NOLONG : IF_LONG))
383 return FALSE;
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000384
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000385 if (prefix->rep == 0xF2)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000386 drep = P_REPNE;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000387 else if (prefix->rep == 0xF3)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000388 drep = P_REP;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000389
H. Peter Anvine2c80182005-01-15 22:15:51 +0000390 while (*r) {
391 int c = *r++;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000392
393 /* FIX: change this into a switch */
394 if (c >= 01 && c <= 03) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000395 while (c--)
396 if (*r++ != *data++)
397 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000398 } else if (c == 04) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000399 switch (*data++) {
400 case 0x07:
401 ins->oprs[0].basereg = 0;
402 break;
403 case 0x17:
404 ins->oprs[0].basereg = 2;
405 break;
406 case 0x1F:
407 ins->oprs[0].basereg = 3;
408 break;
409 default:
410 return FALSE;
411 }
H. Peter Anvinb061d592007-04-16 02:02:06 +0000412 } else if (c == 05) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000413 switch (*data++) {
414 case 0xA1:
415 ins->oprs[0].basereg = 4;
416 break;
417 case 0xA9:
418 ins->oprs[0].basereg = 5;
419 break;
420 default:
421 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000422 }
423 } else if (c == 06) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000424 switch (*data++) {
425 case 0x06:
426 ins->oprs[0].basereg = 0;
427 break;
428 case 0x0E:
429 ins->oprs[0].basereg = 1;
430 break;
431 case 0x16:
432 ins->oprs[0].basereg = 2;
433 break;
434 case 0x1E:
435 ins->oprs[0].basereg = 3;
436 break;
437 default:
438 return FALSE;
439 }
H. Peter Anvinb061d592007-04-16 02:02:06 +0000440 } else if (c == 07) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000441 switch (*data++) {
442 case 0xA0:
443 ins->oprs[0].basereg = 4;
444 break;
445 case 0xA8:
446 ins->oprs[0].basereg = 5;
447 break;
448 default:
449 return FALSE;
450 }
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700451 } else if (c >= 010 && c <= 013) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000452 int t = *r++, d = *data++;
453 if (d < t || d > t + 7)
454 return FALSE;
455 else {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000456 ins->oprs[c - 010].basereg = (d-t)+
457 (ins->rex & REX_B ? 8 : 0);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000458 ins->oprs[c - 010].segment |= SEG_RMREG;
459 }
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700460 } else if (c >= 014 && c <= 017) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000461 ins->oprs[c - 014].offset = (int8_t)*data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000462 ins->oprs[c - 014].segment |= SEG_SIGNED;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700463 } else if (c >= 020 && c <= 023) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000464 ins->oprs[c - 020].offset = *data++;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700465 } else if (c >= 024 && c <= 027) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000466 ins->oprs[c - 024].offset = *data++;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700467 } else if (c >= 030 && c <= 033) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000468 ins->oprs[c - 030].offset = getu16(data);
469 data += 2;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700470 } else if (c >= 034 && c <= 037) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000471 if (osize == 32) {
472 ins->oprs[c - 034].offset = getu32(data);
473 data += 4;
474 } else {
475 ins->oprs[c - 034].offset = getu16(data);
476 data += 2;
477 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000478 if (segsize != asize)
479 ins->oprs[c - 034].addr_size = asize;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700480 } else if (c >= 040 && c <= 043) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000481 ins->oprs[c - 040].offset = getu32(data);
482 data += 4;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700483 } else if (c >= 044 && c <= 047) {
H. Peter Anvinb061d592007-04-16 02:02:06 +0000484 switch (asize) {
485 case 16:
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000486 ins->oprs[c - 044].offset = getu16(data);
487 data += 2;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000488 break;
489 case 32:
490 ins->oprs[c - 044].offset = getu32(data);
491 data += 4;
492 break;
493 case 64:
494 ins->oprs[c - 044].offset = getu64(data);
495 data += 8;
496 break;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000497 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000498 if (segsize != asize)
499 ins->oprs[c - 044].addr_size = asize;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700500 } else if (c >= 050 && c <= 053) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000501 ins->oprs[c - 050].offset = gets8(data++);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000502 ins->oprs[c - 050].segment |= SEG_RELATIVE;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700503 } else if (c >= 054 && c <= 057) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000504 ins->oprs[c - 054].offset = getu64(data);
505 data += 8;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700506 } else if (c >= 060 && c <= 063) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000507 ins->oprs[c - 060].offset = gets16(data);
508 data += 2;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000509 ins->oprs[c - 060].segment |= SEG_RELATIVE;
510 ins->oprs[c - 060].segment &= ~SEG_32BIT;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700511 } else if (c >= 064 && c <= 067) {
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000512 if (osize == 16) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000513 ins->oprs[c - 064].offset = getu16(data);
514 data += 2;
H. Peter Anvin7cf03af2007-04-16 02:39:56 +0000515 ins->oprs[c - 064].segment &= ~(SEG_32BIT|SEG_64BIT);
516 } else if (osize == 32) {
517 ins->oprs[c - 064].offset = getu32(data);
518 data += 4;
519 ins->oprs[c - 064].segment &= ~SEG_64BIT;
520 ins->oprs[c - 064].segment |= SEG_32BIT;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000521 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000522 if (segsize != osize) {
523 ins->oprs[c - 064].type =
H. Peter Anvin5a640e12007-05-29 23:57:12 +0000524 (ins->oprs[c - 064].type & ~SIZE_MASK)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000525 | ((osize == 16) ? BITS16 : BITS32);
526 }
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700527 } else if (c >= 070 && c <= 073) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000528 ins->oprs[c - 070].offset = getu32(data);
529 data += 4;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000530 ins->oprs[c - 070].segment |= SEG_32BIT | SEG_RELATIVE;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700531 } else if (c >= 0100 && c < 0140) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000532 int modrm = *data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000533 ins->oprs[c & 07].segment |= SEG_RMREG;
534 data = do_ea(data, modrm, asize, segsize,
H. Peter Anvin7786c362007-09-17 18:45:44 -0700535 &ins->oprs[(c >> 3) & 07], ins);
536 if (!data)
537 return FALSE;
538 ins->oprs[c & 07].basereg = ((modrm >> 3)&7)+
539 (ins->rex & REX_R ? 8 : 0);
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700540 } else if (c >= 0140 && c <= 0143) {
541 ins->oprs[c - 0140].offset = getu16(data);
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000542 data += 2;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700543 } else if (c >= 0150 && c <= 0153) {
544 ins->oprs[c - 0150].offset = getu32(data);
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000545 data += 4;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700546 } else if (c >= 0160 && c <= 0167) {
547 ins->rex |= (c & 4) ? REX_D|REX_OC : REX_D;
548 ins->drexdst = c & 3;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700549 } else if (c == 0170) {
550 if (*data++)
551 return FALSE;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700552 } else if (c == 0171) {
553 data = do_drex(data, ins);
554 if (!data)
555 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000556 } else if (c >= 0200 && c <= 0277) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000557 int modrm = *data++;
558 if (((modrm >> 3) & 07) != (c & 07))
559 return FALSE; /* spare field doesn't match up */
560 data = do_ea(data, modrm, asize, segsize,
H. Peter Anvin7786c362007-09-17 18:45:44 -0700561 &ins->oprs[(c >> 3) & 07], ins);
562 if (!data)
563 return FALSE;
H. Peter Anvin7eb4a382007-09-17 15:49:30 -0700564 } else if (c >= 0300 && c <= 0303) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000565 a_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000566 } else if (c == 0310) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000567 if (asize != 16)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000568 return FALSE;
569 else
570 a_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000571 } else if (c == 0311) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000572 if (asize == 16)
573 return FALSE;
574 else
575 a_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000576 } else if (c == 0312) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000577 if (asize != segsize)
578 return FALSE;
579 else
580 a_used = TRUE;
H. Peter Anvince2b3972007-05-30 22:21:11 +0000581 } else if (c == 0313) {
582 if (asize != 64)
583 return FALSE;
584 else
585 a_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000586 } else if (c == 0320) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000587 if (osize != 16)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000588 return FALSE;
589 else
590 o_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000591 } else if (c == 0321) {
592 if (osize != 32)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000593 return FALSE;
594 else
595 o_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000596 } else if (c == 0322) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000597 if (osize != (segsize == 16) ? 16 : 32)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000598 return FALSE;
599 else
600 o_used = TRUE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000601 } else if (c == 0323) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000602 ins->rex |= REX_W; /* 64-bit only instruction */
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000603 osize = 64;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000604 } else if (c == 0324) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000605 if (!(ins->rex & (REX_P|REX_W)) || osize != 64)
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000606 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000607 } else if (c == 0330) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000608 int t = *r++, d = *data++;
609 if (d < t || d > t + 15)
610 return FALSE;
611 else
612 ins->condition = d - t;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000613 } else if (c == 0331) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000614 if (prefix->rep)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000615 return FALSE;
H. Peter Anvincb9b6902007-09-12 21:58:51 -0700616 } else if (c == 0332) {
617 if (prefix->rep != 0xF2)
618 return FALSE;
H. Peter Anvinb061d592007-04-16 02:02:06 +0000619 } else if (c == 0333) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000620 if (prefix->rep != 0xF3)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000621 return FALSE;
622 drep = 0;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000623 } else if (c == 0334) {
624 if (lock) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000625 ins->rex |= REX_R;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000626 lock = 0;
627 }
H. Peter Anvincb9b6902007-09-12 21:58:51 -0700628 } else if (c == 0335) {
629 if (drep == P_REP)
630 drep = P_REPE;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000631 } else if (c == 0364) {
632 if (prefix->osp)
633 return FALSE;
634 } else if (c == 0365) {
635 if (prefix->asp)
636 return FALSE;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000637 } else if (c == 0366) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000638 if (!prefix->osp)
639 return FALSE;
640 o_used = TRUE;
641 } else if (c == 0367) {
642 if (!prefix->asp)
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000643 return FALSE;
644 o_used = TRUE;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000645 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000646 }
647
H. Peter Anvin7786c362007-09-17 18:45:44 -0700648 /* REX cannot be combined with DREX */
649 if ((ins->rex & REX_D) && (prefix->rex))
650 return FALSE;
651
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000652 /*
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000653 * Check for unused rep or a/o prefixes.
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000654 */
655 ins->nprefix = 0;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000656 if (lock)
657 ins->prefixes[ins->nprefix++] = P_LOCK;
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000658 if (drep)
659 ins->prefixes[ins->nprefix++] = drep;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000660 if (!a_used && asize != segsize)
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000661 ins->prefixes[ins->nprefix++] = asize == 16 ? P_A16 : P_A32;
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000662 if (!o_used && osize == ((segsize == 16) ? 32 : 16))
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000663 ins->prefixes[ins->nprefix++] = osize == 16 ? P_O16 : P_O32;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000664
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000665 /* Fix: check for redundant REX prefixes */
666
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000667 return data - origdata;
668}
669
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000670int32_t disasm(uint8_t *data, char *output, int outbufsize, int segsize,
Keith Kaniosb7a89542007-04-12 02:40:54 +0000671 int32_t offset, int autosync, uint32_t prefer)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000672{
H. Peter Anvin3360d792007-09-11 04:16:57 +0000673 const struct itemplate * const *p, * const *best_p;
H. Peter Anvin19e20102007-09-18 15:08:20 -0700674 const struct disasm_index *ix;
675 uint8_t *dp;
H. Peter Anvin4836e332002-04-30 20:56:43 +0000676 int length, best_length = 0;
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000677 char *segover;
H. Peter Anvin19e20102007-09-18 15:08:20 -0700678 int i, slen, colon, n;
Keith Kaniosb7a89542007-04-12 02:40:54 +0000679 uint8_t *origdata;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000680 int works;
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000681 insn tmp_ins, ins;
Keith Kaniosb7a89542007-04-12 02:40:54 +0000682 uint32_t goodness, best;
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000683 int best_pref;
684 struct prefix_info prefix;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000685
H. Peter Anvinbfb888c2007-09-11 04:26:44 +0000686 memset(&ins, 0, sizeof ins);
687
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000688 /*
689 * Scan for prefixes.
690 */
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000691 memset(&prefix, 0, sizeof prefix);
692 prefix.asize = segsize;
693 prefix.osize = (segsize == 64) ? 32 : segsize;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000694 segover = NULL;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000695 origdata = data;
696 for (;;) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000697 if (*data == 0xF3 || *data == 0xF2)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000698 prefix.rep = *data++;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000699 else if (*data == 0xF0)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000700 prefix.lock = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000701 else if (*data == 0x2E)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000702 segover = "cs", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000703 else if (*data == 0x36)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000704 segover = "ss", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000705 else if (*data == 0x3E)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000706 segover = "ds", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000707 else if (*data == 0x26)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000708 segover = "es", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000709 else if (*data == 0x64)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000710 segover = "fs", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000711 else if (*data == 0x65)
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000712 segover = "gs", prefix.seg = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000713 else if (*data == 0x66) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000714 prefix.osize = (segsize == 16) ? 32 : 16;
715 prefix.osp = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000716 } else if (*data == 0x67) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000717 prefix.asize = (segsize == 32) ? 16 : 32;
718 prefix.asp = *data++;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000719 } else if (segsize == 64 && (*data & 0xf0) == REX_P) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000720 prefix.rex = *data++;
721 if (prefix.rex & REX_W)
722 prefix.osize = 64;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000723 break; /* REX is always the last prefix */
724 } else {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000725 break;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000726 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000727 }
728
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000729 best = -1; /* Worst possible */
H. Peter Anvin4836e332002-04-30 20:56:43 +0000730 best_p = NULL;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000731 best_pref = INT_MAX;
732
H. Peter Anvin19e20102007-09-18 15:08:20 -0700733 dp = data;
734 ix = itable + *dp++;
735 while (ix->n == (size_t)-1) {
736 ix = (const struct disasm_index *)ix->p + *dp++;
737 }
738
739 p = (const struct itemplate * const *)ix->p;
740 for (n = ix->n; n; n--, p++) {
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000741 if ((length = matches(*p, data, &prefix, segsize, &tmp_ins))) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000742 works = TRUE;
743 /*
744 * Final check to make sure the types of r/m match up.
H. Peter Anvindbf130e2007-05-30 00:18:26 +0000745 * XXX: Need to make sure this is actually correct.
H. Peter Anvine2c80182005-01-15 22:15:51 +0000746 */
747 for (i = 0; i < (*p)->operands; i++) {
H. Peter Anvin7786c362007-09-17 18:45:44 -0700748 if (!((*p)->opd[i] & SAME_AS) &&
749 (
750 /* If it's a mem-only EA but we have a register, die. */
751 ((tmp_ins.oprs[i].segment & SEG_RMREG) &&
752 !(MEMORY & ~(*p)->opd[i])) ||
753 /* If it's a reg-only EA but we have a memory ref, die. */
754 (!(tmp_ins.oprs[i].segment & SEG_RMREG) &&
755 !(REG_EA & ~(*p)->opd[i]) &&
756 !((*p)->opd[i] & REG_SMASK)) ||
757 /* Register type mismatch (eg FS vs REG_DESS): die. */
758 ((((*p)->opd[i] & (REGISTER | FPUREG)) ||
759 (tmp_ins.oprs[i].segment & SEG_RMREG)) &&
760 !whichreg((*p)->opd[i],
761 tmp_ins.oprs[i].basereg, tmp_ins.rex))
762 )) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000763 works = FALSE;
764 break;
765 }
766 }
767
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000768 /*
769 * Note: we always prefer instructions which incorporate
770 * prefixes in the instructions themselves. This is to allow
771 * e.g. PAUSE to be preferred to REP NOP, and deal with
772 * MMX/SSE instructions where prefixes are used to select
773 * between MMX and SSE register sets or outright opcode
774 * selection.
775 */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000776 if (works) {
777 goodness = ((*p)->flags & IF_PFMASK) ^ prefer;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000778 if (tmp_ins.nprefix < best_pref ||
779 (tmp_ins.nprefix == best_pref && goodness < best)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000780 /* This is the best one found so far */
781 best = goodness;
782 best_p = p;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000783 best_pref = tmp_ins.nprefix;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000784 best_length = length;
785 ins = tmp_ins;
786 }
787 }
788 }
H. Peter Anvin4836e332002-04-30 20:56:43 +0000789 }
H. Peter Anvineba20a72002-04-30 20:53:55 +0000790
H. Peter Anvinef7468f2002-04-30 20:57:59 +0000791 if (!best_p)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000792 return 0; /* no instruction was matched */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000793
H. Peter Anvin4836e332002-04-30 20:56:43 +0000794 /* Pick the best match */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000795 p = best_p;
H. Peter Anvin4836e332002-04-30 20:56:43 +0000796 length = best_length;
797
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000798 slen = 0;
799
Ed Beroset64ab5192004-12-15 23:32:57 +0000800 /* TODO: snprintf returns the value that the string would have if
H. Peter Anvine2c80182005-01-15 22:15:51 +0000801 * the buffer were long enough, and not the actual length of
802 * the returned string, so each instance of using the return
803 * value of snprintf should actually be checked to assure that
804 * the return value is "sane." Maybe a macro wrapper could
805 * be used for that purpose.
806 */
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000807 for (i = 0; i < ins.nprefix; i++)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000808 switch (ins.prefixes[i]) {
H. Peter Anvin0db11e22007-04-17 20:23:11 +0000809 case P_LOCK:
810 slen += snprintf(output + slen, outbufsize - slen, "lock ");
811 break;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000812 case P_REP:
813 slen += snprintf(output + slen, outbufsize - slen, "rep ");
814 break;
815 case P_REPE:
816 slen += snprintf(output + slen, outbufsize - slen, "repe ");
817 break;
818 case P_REPNE:
819 slen += snprintf(output + slen, outbufsize - slen, "repne ");
820 break;
821 case P_A16:
822 slen += snprintf(output + slen, outbufsize - slen, "a16 ");
823 break;
824 case P_A32:
825 slen += snprintf(output + slen, outbufsize - slen, "a32 ");
826 break;
827 case P_O16:
828 slen += snprintf(output + slen, outbufsize - slen, "o16 ");
829 break;
830 case P_O32:
831 slen += snprintf(output + slen, outbufsize - slen, "o32 ");
832 break;
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000833 default:
834 break;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000835 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000836
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000837 for (i = 0; i < (int)elements(ico); i++)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000838 if ((*p)->opcode == ico[i]) {
839 slen +=
840 snprintf(output + slen, outbufsize - slen, "%s%s", icn[i],
841 whichcond(ins.condition));
842 break;
843 }
H. Peter Anvin2ba7ed72007-09-11 22:13:17 +0000844 if (i >= (int)elements(ico))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000845 slen +=
846 snprintf(output + slen, outbufsize - slen, "%s",
847 insn_names[(*p)->opcode]);
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000848 colon = FALSE;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000849 length += data - origdata; /* fix up for prefixes */
850 for (i = 0; i < (*p)->operands; i++) {
H. Peter Anvin7786c362007-09-17 18:45:44 -0700851 opflags_t t = (*p)->opd[i];
852 const operand *o = &ins.oprs[i];
853 int64_t offs;
854
855 if (t & SAME_AS) {
856 o = &ins.oprs[t & ~SAME_AS];
857 t = (*p)->opd[t & ~SAME_AS];
858 }
859
H. Peter Anvine2c80182005-01-15 22:15:51 +0000860 output[slen++] = (colon ? ':' : i == 0 ? ' ' : ',');
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000861
H. Peter Anvin7786c362007-09-17 18:45:44 -0700862 offs = o->offset;
863 if (o->segment & SEG_RELATIVE) {
864 offs += offset + length;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000865 /*
866 * sort out wraparound
867 */
H. Peter Anvin7786c362007-09-17 18:45:44 -0700868 if (!(o->segment & (SEG_32BIT|SEG_64BIT)))
869 offs &= 0xffff;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000870 /*
871 * add sync marker, if autosync is on
872 */
873 if (autosync)
H. Peter Anvin7786c362007-09-17 18:45:44 -0700874 add_sync(offs, 0L);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000875 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000876
H. Peter Anvin7786c362007-09-17 18:45:44 -0700877 if (t & COLON)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000878 colon = TRUE;
879 else
880 colon = FALSE;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000881
H. Peter Anvin7786c362007-09-17 18:45:44 -0700882 if ((t & (REGISTER | FPUREG)) ||
883 (o->segment & SEG_RMREG)) {
884 enum reg_enum reg;
885 reg = whichreg(t, o->basereg, ins.rex);
886 if (t & TO)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000887 slen += snprintf(output + slen, outbufsize - slen, "to ");
888 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700889 reg_names[reg - EXPR_REG_START]);
890 } else if (!(UNITY & ~t)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000891 output[slen++] = '1';
H. Peter Anvin7786c362007-09-17 18:45:44 -0700892 } else if (t & IMMEDIATE) {
893 if (t & BITS8) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000894 slen +=
895 snprintf(output + slen, outbufsize - slen, "byte ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700896 if (o->segment & SEG_SIGNED) {
897 if (offs < 0) {
898 offs *= -1;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000899 output[slen++] = '-';
900 } else
901 output[slen++] = '+';
902 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700903 } else if (t & BITS16) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000904 slen +=
905 snprintf(output + slen, outbufsize - slen, "word ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700906 } else if (t & BITS32) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000907 slen +=
908 snprintf(output + slen, outbufsize - slen, "dword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700909 } else if (t & BITS64) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000910 slen +=
911 snprintf(output + slen, outbufsize - slen, "qword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700912 } else if (t & NEAR) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000913 slen +=
914 snprintf(output + slen, outbufsize - slen, "near ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700915 } else if (t & SHORT) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000916 slen +=
917 snprintf(output + slen, outbufsize - slen, "short ");
918 }
919 slen +=
Keith Kanios93f2e9a2007-04-14 00:10:59 +0000920 snprintf(output + slen, outbufsize - slen, "0x%"PRIx64"",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700921 offs);
922 } else if (!(MEM_OFFS & ~t)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000923 slen +=
Keith Kanios93f2e9a2007-04-14 00:10:59 +0000924 snprintf(output + slen, outbufsize - slen, "[%s%s%s0x%"PRIx64"]",
H. Peter Anvin62cb6062007-09-11 22:44:03 +0000925 (segover ? segover : ""),
926 (segover ? ":" : ""),
H. Peter Anvin7786c362007-09-17 18:45:44 -0700927 (o->addr_size ==
928 32 ? "dword " : o->addr_size ==
929 16 ? "word " : ""), offs);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000930 segover = NULL;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700931 } else if (!(REGMEM & ~t)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000932 int started = FALSE;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700933 if (t & BITS8)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000934 slen +=
935 snprintf(output + slen, outbufsize - slen, "byte ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700936 if (t & BITS16)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000937 slen +=
938 snprintf(output + slen, outbufsize - slen, "word ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700939 if (t & BITS32)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000940 slen +=
941 snprintf(output + slen, outbufsize - slen, "dword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700942 if (t & BITS64)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000943 slen +=
944 snprintf(output + slen, outbufsize - slen, "qword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700945 if (t & BITS80)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000946 slen +=
947 snprintf(output + slen, outbufsize - slen, "tword ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700948 if (t & FAR)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000949 slen += snprintf(output + slen, outbufsize - slen, "far ");
H. Peter Anvin7786c362007-09-17 18:45:44 -0700950 if (t & NEAR)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000951 slen +=
952 snprintf(output + slen, outbufsize - slen, "near ");
953 output[slen++] = '[';
H. Peter Anvin7786c362007-09-17 18:45:44 -0700954 if (o->addr_size)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000955 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700956 (o->addr_size == 64 ? "qword " :
957 o->addr_size == 32 ? "dword " :
958 o->addr_size == 16 ? "word " :
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000959 ""));
H. Peter Anvin7786c362007-09-17 18:45:44 -0700960 if (o->eaflags & EAF_REL)
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +0000961 slen += snprintf(output + slen, outbufsize - slen, "rel ");
H. Peter Anvine2c80182005-01-15 22:15:51 +0000962 if (segover) {
963 slen +=
964 snprintf(output + slen, outbufsize - slen, "%s:",
965 segover);
966 segover = NULL;
967 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700968 if (o->basereg != -1) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000969 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700970 reg_names[(o->basereg -
H. Peter Anvine2c80182005-01-15 22:15:51 +0000971 EXPR_REG_START)]);
972 started = TRUE;
973 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700974 if (o->indexreg != -1) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000975 if (started)
976 output[slen++] = '+';
977 slen += snprintf(output + slen, outbufsize - slen, "%s",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700978 reg_names[(o->indexreg -
H. Peter Anvine2c80182005-01-15 22:15:51 +0000979 EXPR_REG_START)]);
H. Peter Anvin7786c362007-09-17 18:45:44 -0700980 if (o->scale > 1)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000981 slen +=
982 snprintf(output + slen, outbufsize - slen, "*%d",
H. Peter Anvin7786c362007-09-17 18:45:44 -0700983 o->scale);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000984 started = TRUE;
985 }
H. Peter Anvin7786c362007-09-17 18:45:44 -0700986 if (o->segment & SEG_DISP8) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000987 int minus = 0;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700988 int8_t offset = offs;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000989 if (offset < 0) {
990 minus = 1;
991 offset = -offset;
992 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000993 slen +=
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000994 snprintf(output + slen, outbufsize - slen, "%s0x%"PRIx8"",
995 minus ? "-" : "+", offset);
H. Peter Anvin7786c362007-09-17 18:45:44 -0700996 } else if (o->segment & SEG_DISP16) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000997 int minus = 0;
H. Peter Anvin7786c362007-09-17 18:45:44 -0700998 int16_t offset = offs;
H. Peter Anvin0ee01422007-04-16 01:18:30 +0000999 if (offset < 0) {
1000 minus = 1;
1001 offset = -offset;
1002 }
H. Peter Anvine2c80182005-01-15 22:15:51 +00001003 slen +=
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001004 snprintf(output + slen, outbufsize - slen, "%s0x%"PRIx16"",
1005 minus ? "-" : started ? "+" : "", offset);
H. Peter Anvin7786c362007-09-17 18:45:44 -07001006 } else if (o->segment & SEG_DISP32) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001007 char *prefix = "";
H. Peter Anvin7786c362007-09-17 18:45:44 -07001008 int32_t offset = offs;
H. Peter Anvin99c4ecd2007-08-28 23:06:00 +00001009 if (offset < 0) {
H. Peter Anvin0ee01422007-04-16 01:18:30 +00001010 offset = -offset;
1011 prefix = "-";
1012 } else {
1013 prefix = started ? "+" : "";
1014 }
1015 slen +=
1016 snprintf(output + slen, outbufsize - slen,
1017 "%s0x%"PRIx32"", prefix, offset);
H. Peter Anvine2c80182005-01-15 22:15:51 +00001018 }
1019 output[slen++] = ']';
1020 } else {
1021 slen +=
1022 snprintf(output + slen, outbufsize - slen, "<operand%d>",
1023 i);
1024 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +00001025 }
1026 output[slen] = '\0';
H. Peter Anvine2c80182005-01-15 22:15:51 +00001027 if (segover) { /* unused segment override */
Keith Kaniosa6dfa782007-04-13 16:47:53 +00001028 char *p = output;
H. Peter Anvine2c80182005-01-15 22:15:51 +00001029 int count = slen + 1;
1030 while (count--)
1031 p[count + 3] = p[count];
1032 strncpy(output, segover, 2);
1033 output[2] = ' ';
H. Peter Anvinea6e34d2002-04-30 20:51:32 +00001034 }
1035 return length;
1036}
1037
/*
 * Fallback for a byte that could not be disassembled: render it as a
 * `db' pseudo-instruction of the form "db 0xNN" (two upper-case hex
 * digits).
 *
 * data       - points at the byte to emit; only *data is read
 * output     - buffer that receives the NUL-terminated text
 * outbufsize - capacity of `output' in bytes; text is truncated to fit
 *
 * Always returns 1, the number of input bytes consumed.
 */
int32_t eatbyte(uint8_t *data, char *output, int outbufsize)
{
    /*
     * snprintf takes a size_t bound; a negative int would convert to a
     * huge unsigned value and defeat the limit, so write nothing when
     * the caller supplies a non-positive size.
     */
    if (outbufsize > 0)
        snprintf(output, (size_t)outbufsize, "db 0x%02X", *data);
    return 1;
}