blob: 31f02a2d371414ffbed77e3c052332e12b80dde9 [file] [log] [blame]
H. Peter Anvin9e6747c2009-06-28 17:13:04 -07001/* ----------------------------------------------------------------------- *
H. Peter Anvina73ccfe2019-08-28 19:02:47 -07002 *
H. Peter Anvin9e6747c2009-06-28 17:13:04 -07003 * Copyright 1996-2009 The NASM Authors - All Rights Reserved
4 * See the file AUTHORS included with the NASM distribution for
5 * the specific copyright holders.
H. Peter Anvinea6e34d2002-04-30 20:51:32 +00006 *
H. Peter Anvin9e6747c2009-06-28 17:13:04 -07007 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following
9 * conditions are met:
10 *
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above
14 * copyright notice, this list of conditions and the following
15 * disclaimer in the documentation and/or other materials provided
16 * with the distribution.
H. Peter Anvina73ccfe2019-08-28 19:02:47 -070017 *
H. Peter Anvin9e6747c2009-06-28 17:13:04 -070018 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
19 * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
20 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
21 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
22 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
23 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
25 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
26 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
29 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
30 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
31 *
32 * ----------------------------------------------------------------------- */
33
34/*
35 * ndisasm.c the Netwide Disassembler main module
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000036 */
37
H. Peter Anvinfe501952007-10-02 21:53:51 -070038#include "compiler.h"
39
H. Peter Anvinc2f3f262018-12-27 12:37:25 -080040#include "nctype.h"
H. Peter Anvin76690a12002-04-30 20:52:49 +000041#include <errno.h>
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000042
H. Peter Anvin4836e332002-04-30 20:56:43 +000043#include "insns.h"
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000044#include "nasm.h"
45#include "nasmlib.h"
H. Peter Anvinb20bc732017-03-07 19:23:03 -080046#include "error.h"
H. Peter Anvin2bc0ab32016-03-08 02:17:36 -080047#include "ver.h"
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000048#include "sync.h"
49#include "disasm.h"
50
/* Number of instruction bytes printed on each line of the hex dump. */
#define BPL 8
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000052
/*
 * Usage summary written to stderr for -h and when no input file is named.
 * The text contains no printf conversion specifications.
 */
static const char help[] =
    "usage: ndisasm [-a] [-i] [-h] [-r] [-u] [-b bits] [-o origin] [-s sync...]\n"
    " [-e bytes] [-k start,bytes] [-p vendor] file\n"
    " -a or -i activates auto (intelligent) sync\n"
    " -u same as -b 32\n"
    " -b 16, -b 32 or -b 64 sets the processor mode\n"
    " -h displays this text\n"
    " -r or -v displays the version number\n"
    " -e skips <bytes> bytes of header\n"
    " -k avoids disassembling <bytes> bytes from position <start>\n"
    " -p selects the preferred vendor instruction set (intel, amd, cyrix, idt)\n";
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000064
/* Forward declarations of the file-local helpers defined after main(). */
static void output_ins(uint64_t offset, uint8_t *data, int datalen,
                       char *insn);
static void skip(uint32_t dist, FILE *fp);
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000067
H. Peter Anvina73ccfe2019-08-28 19:02:47 -070068void nasm_verror(errflags severity, const char *fmt, va_list val)
H. Peter Anvin87f252a2007-09-19 21:40:37 -070069{
H. Peter Anvina73ccfe2019-08-28 19:02:47 -070070 severity &= ERR_MASK;
H. Peter Anvin87f252a2007-09-19 21:40:37 -070071
H. Peter Anvin6a4353c2019-08-28 18:32:46 -070072 vfprintf(stderr, fmt, val);
H. Peter Anvina73ccfe2019-08-28 19:02:47 -070073 if (severity >= ERR_FATAL)
74 exit(severity - ERR_FATAL + 1);
H. Peter Anvin6a4353c2019-08-28 18:32:46 -070075}
H. Peter Anvin87f252a2007-09-19 21:40:37 -070076
H. Peter Anvina73ccfe2019-08-28 19:02:47 -070077fatal_func nasm_verror_critical(errflags severity, const char *fmt, va_list val)
H. Peter Anvin6a4353c2019-08-28 18:32:46 -070078{
H. Peter Anvina73ccfe2019-08-28 19:02:47 -070079 nasm_verror(severity, fmt, val);
80 abort();
H. Peter Anvin87f252a2007-09-19 21:40:37 -070081}
82
H. Peter Anvin038d8612007-04-12 16:54:50 +000083int main(int argc, char **argv)
H. Peter Anvineba20a72002-04-30 20:53:55 +000084{
H. Peter Anvin99f309c2007-04-15 23:12:17 +000085 char buffer[INSN_MAX * 2], *p, *ep, *q;
Keith Kaniosa6dfa782007-04-13 16:47:53 +000086 char outbuf[256];
87 char *pname = *argv;
88 char *filename = NULL;
Keith Kaniosb7a89542007-04-12 02:40:54 +000089 uint32_t nextsync, synclen, initskip = 0L;
H. Peter Anvin4cf17482002-04-30 21:01:38 +000090 int lenread;
Keith Kaniosb7a89542007-04-12 02:40:54 +000091 int32_t lendis;
H. Peter Anvin6867acc2007-10-10 14:58:45 -070092 bool autosync = false;
H. Peter Anvin99f309c2007-04-15 23:12:17 +000093 int bits = 16, b;
H. Peter Anvin6867acc2007-10-10 14:58:45 -070094 bool eof = false;
Cyrill Gorcunov08359152013-11-09 22:16:11 +040095 iflag_t prefer;
H. Peter Anvin70055962007-10-11 00:05:31 -070096 bool rn_error;
Ruslan Kabatsayev3ebed502017-02-12 19:31:19 +030097 int64_t offset;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +000098 FILE *fp;
99
H. Peter Anvin13506202018-11-28 14:55:58 -0800100 nasm_ctype_init();
Cyrill Gorcunov08359152013-11-09 22:16:11 +0400101 iflag_clear_all(&prefer);
H. Peter Anvin87f252a2007-09-19 21:40:37 -0700102
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000103 offset = 0;
104 init_sync();
105
106 while (--argc) {
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000107 char *v, *vv, *p = *++argv;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000108 if (*p == '-' && p[1]) {
109 p++;
110 while (*p)
H. Peter Anvinac8f8fc2008-06-11 15:49:41 -0700111 switch (nasm_tolower(*p)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000112 case 'a': /* auto or intelligent sync */
113 case 'i':
H. Peter Anvin6867acc2007-10-10 14:58:45 -0700114 autosync = true;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000115 p++;
116 break;
117 case 'h':
Victor van den Elzen0dd450c2009-08-13 15:07:59 +0200118 fputs(help, stderr);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000119 return 0;
120 case 'r':
121 case 'v':
122 fprintf(stderr,
Dale Curtis10760492018-10-31 13:03:37 -0700123 "NDISASM version %s\n",
124 nasm_version);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000125 return 0;
H. Peter Anvin99f309c2007-04-15 23:12:17 +0000126 case 'u': /* -u for -b 32, -uu for -b 64 */
127 if (bits < 64)
128 bits <<= 1;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000129 p++;
130 break;
131 case 'b': /* bits */
132 v = p[1] ? p + 1 : --argc ? *++argv : NULL;
133 if (!v) {
134 fprintf(stderr, "%s: `-b' requires an argument\n",
135 pname);
136 return 1;
137 }
H. Peter Anvin99f309c2007-04-15 23:12:17 +0000138 b = strtoul(v, &ep, 10);
139 if (*ep || !(bits == 16 || bits == 32 || bits == 64)) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000140 fprintf(stderr, "%s: argument to `-b' should"
H. Peter Anvin99f309c2007-04-15 23:12:17 +0000141 " be 16, 32 or 64\n", pname);
142 } else {
143 bits = b;
144 }
H. Peter Anvine2c80182005-01-15 22:15:51 +0000145 p = ""; /* force to next argument */
146 break;
147 case 'o': /* origin */
148 v = p[1] ? p + 1 : --argc ? *++argv : NULL;
149 if (!v) {
150 fprintf(stderr, "%s: `-o' requires an argument\n",
151 pname);
152 return 1;
153 }
154 offset = readnum(v, &rn_error);
155 if (rn_error) {
156 fprintf(stderr,
157 "%s: `-o' requires a numeric argument\n",
158 pname);
159 return 1;
160 }
161 p = ""; /* force to next argument */
162 break;
163 case 's': /* sync point */
164 v = p[1] ? p + 1 : --argc ? *++argv : NULL;
165 if (!v) {
166 fprintf(stderr, "%s: `-s' requires an argument\n",
167 pname);
168 return 1;
169 }
170 add_sync(readnum(v, &rn_error), 0L);
171 if (rn_error) {
172 fprintf(stderr,
173 "%s: `-s' requires a numeric argument\n",
174 pname);
175 return 1;
176 }
177 p = ""; /* force to next argument */
178 break;
179 case 'e': /* skip a header */
180 v = p[1] ? p + 1 : --argc ? *++argv : NULL;
181 if (!v) {
182 fprintf(stderr, "%s: `-e' requires an argument\n",
183 pname);
184 return 1;
185 }
186 initskip = readnum(v, &rn_error);
187 if (rn_error) {
188 fprintf(stderr,
189 "%s: `-e' requires a numeric argument\n",
190 pname);
191 return 1;
192 }
193 p = ""; /* force to next argument */
194 break;
195 case 'k': /* skip a region */
196 v = p[1] ? p + 1 : --argc ? *++argv : NULL;
197 if (!v) {
198 fprintf(stderr, "%s: `-k' requires an argument\n",
199 pname);
200 return 1;
201 }
202 vv = strchr(v, ',');
203 if (!vv) {
204 fprintf(stderr,
205 "%s: `-k' requires two numbers separated"
206 " by a comma\n", pname);
207 return 1;
208 }
209 *vv++ = '\0';
210 nextsync = readnum(v, &rn_error);
211 if (rn_error) {
212 fprintf(stderr,
213 "%s: `-k' requires numeric arguments\n",
214 pname);
215 return 1;
216 }
217 synclen = readnum(vv, &rn_error);
218 if (rn_error) {
219 fprintf(stderr,
220 "%s: `-k' requires numeric arguments\n",
221 pname);
222 return 1;
223 }
224 add_sync(nextsync, synclen);
225 p = ""; /* force to next argument */
226 break;
227 case 'p': /* preferred vendor */
228 v = p[1] ? p + 1 : --argc ? *++argv : NULL;
229 if (!v) {
230 fprintf(stderr, "%s: `-p' requires an argument\n",
231 pname);
232 return 1;
233 }
234 if (!strcmp(v, "intel")) {
Cyrill Gorcunov08359152013-11-09 22:16:11 +0400235 iflag_clear_all(&prefer); /* default */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000236 } else if (!strcmp(v, "amd")) {
Cyrill Gorcunov08359152013-11-09 22:16:11 +0400237 iflag_clear_all(&prefer);
238 iflag_set(&prefer, IF_AMD);
239 iflag_set(&prefer, IF_3DNOW);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000240 } else if (!strcmp(v, "cyrix")) {
Cyrill Gorcunov08359152013-11-09 22:16:11 +0400241 iflag_clear_all(&prefer);
242 iflag_set(&prefer, IF_CYRIX);
243 iflag_set(&prefer, IF_3DNOW);
244 } else if (!strcmp(v, "idt") ||
245 !strcmp(v, "centaur") ||
246 !strcmp(v, "winchip")) {
247 iflag_clear_all(&prefer);
248 iflag_set(&prefer, IF_3DNOW);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000249 } else {
250 fprintf(stderr,
251 "%s: unknown vendor `%s' specified with `-p'\n",
252 pname, v);
253 return 1;
254 }
255 p = ""; /* force to next argument */
256 break;
257 default: /*bf */
258 fprintf(stderr, "%s: unrecognised option `-%c'\n",
259 pname, *p);
260 return 1;
261 }
262 } else if (!filename) {
263 filename = p;
264 } else {
265 fprintf(stderr, "%s: more than one filename specified\n",
266 pname);
267 return 1;
268 }
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000269 }
270
271 if (!filename) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000272 fprintf(stderr, help, pname);
273 return 0;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000274 }
275
H. Peter Anvineba20a72002-04-30 20:53:55 +0000276 if (strcmp(filename, "-")) {
H. Peter Anvin0c0fdaa2016-05-25 04:47:02 -0700277 fp = fopen(filename, "rb");
H. Peter Anvine2c80182005-01-15 22:15:51 +0000278 if (!fp) {
279 fprintf(stderr, "%s: unable to open `%s': %s\n",
280 pname, filename, strerror(errno));
281 return 1;
282 }
Chang S. Baebd1055b2020-03-24 14:24:43 -0700283 } else {
284 nasm_set_binary_mode(stdin);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000285 fp = stdin;
Chang S. Baebd1055b2020-03-24 14:24:43 -0700286 }
H. Peter Anvineba20a72002-04-30 20:53:55 +0000287
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000288 if (initskip > 0)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000289 skip(initskip, fp);
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000290
291 /*
292 * This main loop is really horrible, and wants rewriting with
293 * an axe. It'll stay the way it is for a while though, until I
294 * find the energy...
295 */
296
297 p = q = buffer;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000298 nextsync = next_sync(offset, &synclen);
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000299 do {
Keith Kaniosb7a89542007-04-12 02:40:54 +0000300 uint32_t to_read = buffer + sizeof(buffer) - p;
H. Peter Anvin914fdf92007-12-20 12:24:17 -0800301 if ((nextsync || synclen) &&
302 to_read > nextsync - offset - (p - q))
H. Peter Anvine2c80182005-01-15 22:15:51 +0000303 to_read = nextsync - offset - (p - q);
304 if (to_read) {
305 lenread = fread(p, 1, to_read, fp);
306 if (lenread == 0)
H. Peter Anvin6867acc2007-10-10 14:58:45 -0700307 eof = true; /* help along systems with bad feof */
H. Peter Anvine2c80182005-01-15 22:15:51 +0000308 } else
309 lenread = 0;
310 p += lenread;
H. Peter Anvin914fdf92007-12-20 12:24:17 -0800311 if ((nextsync || synclen) &&
312 (uint32_t)offset == nextsync) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000313 if (synclen) {
Ruslan Kabatsayev3ebed502017-02-12 19:31:19 +0300314 fprintf(stdout, "%08"PRIX64" skipping 0x%"PRIX32" bytes\n",
H. Peter Anvined37aa82009-03-18 23:10:19 -0700315 offset, synclen);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000316 offset += synclen;
317 skip(synclen, fp);
318 }
319 p = q = buffer;
320 nextsync = next_sync(offset, &synclen);
321 }
322 while (p > q && (p - q >= INSN_MAX || lenread == 0)) {
Cyrill Gorcunov55d09bb2018-08-15 01:12:19 +0300323 lendis = disasm((uint8_t *)q, INSN_MAX, outbuf, sizeof(outbuf),
324 bits, offset, autosync, &prefer);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000325 if (!lendis || lendis > (p - q)
H. Peter Anvin914fdf92007-12-20 12:24:17 -0800326 || ((nextsync || synclen) &&
327 (uint32_t)lendis > nextsync - offset))
H. Peter Anvined37aa82009-03-18 23:10:19 -0700328 lendis = eatbyte((uint8_t *) q, outbuf, sizeof(outbuf), bits);
Charles Crayne46b31b02007-10-18 21:17:20 -0700329 output_ins(offset, (uint8_t *) q, lendis, outbuf);
H. Peter Anvine2c80182005-01-15 22:15:51 +0000330 q += lendis;
331 offset += lendis;
332 }
333 if (q >= buffer + INSN_MAX) {
Charles Crayne46b31b02007-10-18 21:17:20 -0700334 uint8_t *r = (uint8_t *) buffer, *s = (uint8_t *) q;
H. Peter Anvine2c80182005-01-15 22:15:51 +0000335 int count = p - q;
336 while (count--)
337 *r++ = *s++;
338 p -= (q - buffer);
339 q = buffer;
340 }
H. Peter Anvin87bc6192002-04-30 20:53:16 +0000341 } while (lenread > 0 || !(eof || feof(fp)));
H. Peter Anvineba20a72002-04-30 20:53:55 +0000342
343 if (fp != stdin)
H. Peter Anvine2c80182005-01-15 22:15:51 +0000344 fclose(fp);
H. Peter Anvineba20a72002-04-30 20:53:55 +0000345
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000346 return 0;
347}
348
Ruslan Kabatsayev3ebed502017-02-12 19:31:19 +0300349static void output_ins(uint64_t offset, uint8_t *data,
Keith Kaniosa6dfa782007-04-13 16:47:53 +0000350 int datalen, char *insn)
H. Peter Anvineba20a72002-04-30 20:53:55 +0000351{
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000352 int bytes;
Ruslan Kabatsayev3ebed502017-02-12 19:31:19 +0300353 fprintf(stdout, "%08"PRIX64" ", offset);
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000354
355 bytes = 0;
356 while (datalen > 0 && bytes < BPL) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000357 fprintf(stdout, "%02X", *data++);
358 bytes++;
359 datalen--;
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000360 }
361
H. Peter Anvine2c80182005-01-15 22:15:51 +0000362 fprintf(stdout, "%*s%s\n", (BPL + 1 - bytes) * 2, "", insn);
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000363
364 while (datalen > 0) {
H. Peter Anvine2c80182005-01-15 22:15:51 +0000365 fprintf(stdout, " -");
366 bytes = 0;
367 while (datalen > 0 && bytes < BPL) {
368 fprintf(stdout, "%02X", *data++);
369 bytes++;
370 datalen--;
371 }
372 fprintf(stdout, "\n");
H. Peter Anvinea6e34d2002-04-30 20:51:32 +0000373 }
374}
375
/*
 * Advance the stream by dist bytes: seek when the stream allows it,
 * otherwise read the bytes and throw them away. A short read in the
 * fallback path reports "fread" via perror() and exits with status 1.
 */
static void skip(uint32_t dist, FILE * fp)
{
    char scratch[256];          /* should fit on most stacks :-) */
    uint32_t chunk;

    /*
     * Got to be careful with fseek: at least one fseek I've tried
     * doesn't approve of SEEK_CUR. So I'll use SEEK_SET and
     * ftell... horrible but apparently necessary.
     */
    if (fseek(fp, dist + ftell(fp), SEEK_SET) == 0)
        return;

    /* Seeking failed: consume the data in scratch-sized pieces. */
    for (; dist > 0; dist -= chunk) {
        chunk = (dist < sizeof(scratch) ? dist : sizeof(scratch));
        if (fread(scratch, 1, chunk, fp) < chunk) {
            perror("fread");
            exit(1);
        }
    }
}