H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 1 | /* ndisasm.c the Netwide Disassembler main module |
| 2 | * |
| 3 | * The Netwide Assembler is copyright (C) 1996 Simon Tatham and |
| 4 | * Julian Hall. All rights reserved. The software is |
| 5 | * redistributable under the licence given in the file "Licence" |
| 6 | * distributed in the NASM archive. |
| 7 | */ |
| 8 | |
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <errno.h>
#include <inttypes.h>
#include <limits.h>

#include "insns.h"
#include "nasm.h"
#include "nasmlib.h"
#include "sync.h"
#include "disasm.h"
| 21 | |
/* Number of data bytes printed on each line of the hex dump. */
#define BPL 8

/* Usage text, printed for `-h' and when no input file is named. */
static const char *help =
    "usage: ndisasm [-a] [-i] [-h] [-r] [-u] [-b bits] [-o origin] [-s sync...]\n"
    " [-e bytes] [-k start,bytes] [-p vendor] file\n"
    " -a or -i activates auto (intelligent) sync\n"
    " -u sets USE32 (32-bit mode)\n"
    " -b 16 or -b 32 sets number of bits too\n"
    " -h displays this text\n"
    " -r or -v displays the version number\n"
    " -e skips <bytes> bytes of header\n"
    " -k avoids disassembling <bytes> bytes from position <start>\n"
    " -p selects the preferred vendor instruction set (intel, amd, cyrix, idt)\n";

/* Forward declarations of the file-local helpers defined after main(). */
static void output_ins(uint32_t offset, uint8_t *data, int datalen,
                       char *insn);
static void skip(uint32_t dist, FILE *fp);
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 38 | |
H. Peter Anvin | 038d861 | 2007-04-12 16:54:50 +0000 | [diff] [blame] | 39 | int main(int argc, char **argv) |
H. Peter Anvin | eba20a7 | 2002-04-30 20:53:55 +0000 | [diff] [blame] | 40 | { |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 41 | uint8_t buffer[INSN_MAX * 2], *p, *q; |
Keith Kanios | a6dfa78 | 2007-04-13 16:47:53 +0000 | [diff] [blame^] | 42 | char outbuf[256]; |
| 43 | char *pname = *argv; |
| 44 | char *filename = NULL; |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 45 | uint32_t nextsync, synclen, initskip = 0L; |
H. Peter Anvin | 4cf1748 | 2002-04-30 21:01:38 +0000 | [diff] [blame] | 46 | int lenread; |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 47 | int32_t lendis; |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 48 | int autosync = FALSE; |
| 49 | int bits = 16; |
H. Peter Anvin | 87bc619 | 2002-04-30 20:53:16 +0000 | [diff] [blame] | 50 | int eof = FALSE; |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 51 | uint32_t prefer = 0; |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 52 | int rn_error; |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 53 | int32_t offset; |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 54 | FILE *fp; |
| 55 | |
| 56 | offset = 0; |
| 57 | init_sync(); |
| 58 | |
| 59 | while (--argc) { |
Keith Kanios | a6dfa78 | 2007-04-13 16:47:53 +0000 | [diff] [blame^] | 60 | char *v, *vv, *p = *++argv; |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 61 | if (*p == '-' && p[1]) { |
| 62 | p++; |
| 63 | while (*p) |
| 64 | switch (tolower(*p)) { |
| 65 | case 'a': /* auto or intelligent sync */ |
| 66 | case 'i': |
| 67 | autosync = TRUE; |
| 68 | p++; |
| 69 | break; |
| 70 | case 'h': |
| 71 | fprintf(stderr, help); |
| 72 | return 0; |
| 73 | case 'r': |
| 74 | case 'v': |
| 75 | fprintf(stderr, |
| 76 | "NDISASM version %s compiled " __DATE__ "\n", |
| 77 | NASM_VER); |
| 78 | return 0; |
| 79 | case 'u': /* USE32 */ |
| 80 | bits = 32; |
| 81 | p++; |
| 82 | break; |
| 83 | case 'b': /* bits */ |
| 84 | v = p[1] ? p + 1 : --argc ? *++argv : NULL; |
| 85 | if (!v) { |
| 86 | fprintf(stderr, "%s: `-b' requires an argument\n", |
| 87 | pname); |
| 88 | return 1; |
| 89 | } |
| 90 | if (!strcmp(v, "16")) |
| 91 | bits = 16; |
| 92 | else if (!strcmp(v, "32")) |
| 93 | bits = 32; |
| 94 | else { |
| 95 | fprintf(stderr, "%s: argument to `-b' should" |
| 96 | " be `16' or `32'\n", pname); |
| 97 | } |
| 98 | p = ""; /* force to next argument */ |
| 99 | break; |
| 100 | case 'o': /* origin */ |
| 101 | v = p[1] ? p + 1 : --argc ? *++argv : NULL; |
| 102 | if (!v) { |
| 103 | fprintf(stderr, "%s: `-o' requires an argument\n", |
| 104 | pname); |
| 105 | return 1; |
| 106 | } |
| 107 | offset = readnum(v, &rn_error); |
| 108 | if (rn_error) { |
| 109 | fprintf(stderr, |
| 110 | "%s: `-o' requires a numeric argument\n", |
| 111 | pname); |
| 112 | return 1; |
| 113 | } |
| 114 | p = ""; /* force to next argument */ |
| 115 | break; |
| 116 | case 's': /* sync point */ |
| 117 | v = p[1] ? p + 1 : --argc ? *++argv : NULL; |
| 118 | if (!v) { |
| 119 | fprintf(stderr, "%s: `-s' requires an argument\n", |
| 120 | pname); |
| 121 | return 1; |
| 122 | } |
| 123 | add_sync(readnum(v, &rn_error), 0L); |
| 124 | if (rn_error) { |
| 125 | fprintf(stderr, |
| 126 | "%s: `-s' requires a numeric argument\n", |
| 127 | pname); |
| 128 | return 1; |
| 129 | } |
| 130 | p = ""; /* force to next argument */ |
| 131 | break; |
| 132 | case 'e': /* skip a header */ |
| 133 | v = p[1] ? p + 1 : --argc ? *++argv : NULL; |
| 134 | if (!v) { |
| 135 | fprintf(stderr, "%s: `-e' requires an argument\n", |
| 136 | pname); |
| 137 | return 1; |
| 138 | } |
| 139 | initskip = readnum(v, &rn_error); |
| 140 | if (rn_error) { |
| 141 | fprintf(stderr, |
| 142 | "%s: `-e' requires a numeric argument\n", |
| 143 | pname); |
| 144 | return 1; |
| 145 | } |
| 146 | p = ""; /* force to next argument */ |
| 147 | break; |
| 148 | case 'k': /* skip a region */ |
| 149 | v = p[1] ? p + 1 : --argc ? *++argv : NULL; |
| 150 | if (!v) { |
| 151 | fprintf(stderr, "%s: `-k' requires an argument\n", |
| 152 | pname); |
| 153 | return 1; |
| 154 | } |
| 155 | vv = strchr(v, ','); |
| 156 | if (!vv) { |
| 157 | fprintf(stderr, |
| 158 | "%s: `-k' requires two numbers separated" |
| 159 | " by a comma\n", pname); |
| 160 | return 1; |
| 161 | } |
| 162 | *vv++ = '\0'; |
| 163 | nextsync = readnum(v, &rn_error); |
| 164 | if (rn_error) { |
| 165 | fprintf(stderr, |
| 166 | "%s: `-k' requires numeric arguments\n", |
| 167 | pname); |
| 168 | return 1; |
| 169 | } |
| 170 | synclen = readnum(vv, &rn_error); |
| 171 | if (rn_error) { |
| 172 | fprintf(stderr, |
| 173 | "%s: `-k' requires numeric arguments\n", |
| 174 | pname); |
| 175 | return 1; |
| 176 | } |
| 177 | add_sync(nextsync, synclen); |
| 178 | p = ""; /* force to next argument */ |
| 179 | break; |
| 180 | case 'p': /* preferred vendor */ |
| 181 | v = p[1] ? p + 1 : --argc ? *++argv : NULL; |
| 182 | if (!v) { |
| 183 | fprintf(stderr, "%s: `-p' requires an argument\n", |
| 184 | pname); |
| 185 | return 1; |
| 186 | } |
| 187 | if (!strcmp(v, "intel")) { |
| 188 | prefer = 0; /* Default */ |
| 189 | } else if (!strcmp(v, "amd")) { |
| 190 | prefer = IF_AMD | IF_3DNOW; |
| 191 | } else if (!strcmp(v, "cyrix")) { |
| 192 | prefer = IF_CYRIX | IF_3DNOW; |
| 193 | } else if (!strcmp(v, "idt") || !strcmp(v, "centaur") |
| 194 | || !strcmp(v, "winchip")) { |
| 195 | prefer = IF_3DNOW; |
| 196 | } else { |
| 197 | fprintf(stderr, |
| 198 | "%s: unknown vendor `%s' specified with `-p'\n", |
| 199 | pname, v); |
| 200 | return 1; |
| 201 | } |
| 202 | p = ""; /* force to next argument */ |
| 203 | break; |
| 204 | default: /*bf */ |
| 205 | fprintf(stderr, "%s: unrecognised option `-%c'\n", |
| 206 | pname, *p); |
| 207 | return 1; |
| 208 | } |
| 209 | } else if (!filename) { |
| 210 | filename = p; |
| 211 | } else { |
| 212 | fprintf(stderr, "%s: more than one filename specified\n", |
| 213 | pname); |
| 214 | return 1; |
| 215 | } |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 216 | } |
| 217 | |
| 218 | if (!filename) { |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 219 | fprintf(stderr, help, pname); |
| 220 | return 0; |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 221 | } |
| 222 | |
H. Peter Anvin | eba20a7 | 2002-04-30 20:53:55 +0000 | [diff] [blame] | 223 | if (strcmp(filename, "-")) { |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 224 | fp = fopen(filename, "rb"); |
| 225 | if (!fp) { |
| 226 | fprintf(stderr, "%s: unable to open `%s': %s\n", |
| 227 | pname, filename, strerror(errno)); |
| 228 | return 1; |
| 229 | } |
H. Peter Anvin | eba20a7 | 2002-04-30 20:53:55 +0000 | [diff] [blame] | 230 | } else |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 231 | fp = stdin; |
H. Peter Anvin | eba20a7 | 2002-04-30 20:53:55 +0000 | [diff] [blame] | 232 | |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 233 | if (initskip > 0) |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 234 | skip(initskip, fp); |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 235 | |
| 236 | /* |
| 237 | * This main loop is really horrible, and wants rewriting with |
| 238 | * an axe. It'll stay the way it is for a while though, until I |
| 239 | * find the energy... |
| 240 | */ |
| 241 | |
| 242 | p = q = buffer; |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 243 | nextsync = next_sync(offset, &synclen); |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 244 | do { |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 245 | uint32_t to_read = buffer + sizeof(buffer) - p; |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 246 | if (to_read > nextsync - offset - (p - q)) |
| 247 | to_read = nextsync - offset - (p - q); |
| 248 | if (to_read) { |
| 249 | lenread = fread(p, 1, to_read, fp); |
| 250 | if (lenread == 0) |
| 251 | eof = TRUE; /* help along systems with bad feof */ |
| 252 | } else |
| 253 | lenread = 0; |
| 254 | p += lenread; |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 255 | if ((uint32_t)offset == nextsync) { |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 256 | if (synclen) { |
| 257 | fprintf(stdout, "%08lX skipping 0x%lX bytes\n", offset, |
| 258 | synclen); |
| 259 | offset += synclen; |
| 260 | skip(synclen, fp); |
| 261 | } |
| 262 | p = q = buffer; |
| 263 | nextsync = next_sync(offset, &synclen); |
| 264 | } |
| 265 | while (p > q && (p - q >= INSN_MAX || lenread == 0)) { |
| 266 | lendis = |
| 267 | disasm(q, outbuf, sizeof(outbuf), bits, offset, autosync, |
| 268 | prefer); |
| 269 | if (!lendis || lendis > (p - q) |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 270 | || (uint32_t)lendis > nextsync - offset) |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 271 | lendis = eatbyte(q, outbuf, sizeof(outbuf)); |
| 272 | output_ins(offset, q, lendis, outbuf); |
| 273 | q += lendis; |
| 274 | offset += lendis; |
| 275 | } |
| 276 | if (q >= buffer + INSN_MAX) { |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 277 | uint8_t *r = buffer, *s = q; |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 278 | int count = p - q; |
| 279 | while (count--) |
| 280 | *r++ = *s++; |
| 281 | p -= (q - buffer); |
| 282 | q = buffer; |
| 283 | } |
H. Peter Anvin | 87bc619 | 2002-04-30 20:53:16 +0000 | [diff] [blame] | 284 | } while (lenread > 0 || !(eof || feof(fp))); |
H. Peter Anvin | eba20a7 | 2002-04-30 20:53:55 +0000 | [diff] [blame] | 285 | |
| 286 | if (fp != stdin) |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 287 | fclose(fp); |
H. Peter Anvin | eba20a7 | 2002-04-30 20:53:55 +0000 | [diff] [blame] | 288 | |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 289 | return 0; |
| 290 | } |
| 291 | |
Keith Kanios | b7a8954 | 2007-04-12 02:40:54 +0000 | [diff] [blame] | 292 | static void output_ins(uint32_t offset, uint8_t *data, |
Keith Kanios | a6dfa78 | 2007-04-13 16:47:53 +0000 | [diff] [blame^] | 293 | int datalen, char *insn) |
H. Peter Anvin | eba20a7 | 2002-04-30 20:53:55 +0000 | [diff] [blame] | 294 | { |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 295 | int bytes; |
H. Peter Anvin | 090a218 | 2002-04-30 21:04:18 +0000 | [diff] [blame] | 296 | fprintf(stdout, "%08lX ", offset); |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 297 | |
| 298 | bytes = 0; |
| 299 | while (datalen > 0 && bytes < BPL) { |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 300 | fprintf(stdout, "%02X", *data++); |
| 301 | bytes++; |
| 302 | datalen--; |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 303 | } |
| 304 | |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 305 | fprintf(stdout, "%*s%s\n", (BPL + 1 - bytes) * 2, "", insn); |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 306 | |
| 307 | while (datalen > 0) { |
H. Peter Anvin | e2c8018 | 2005-01-15 22:15:51 +0000 | [diff] [blame] | 308 | fprintf(stdout, " -"); |
| 309 | bytes = 0; |
| 310 | while (datalen > 0 && bytes < BPL) { |
| 311 | fprintf(stdout, "%02X", *data++); |
| 312 | bytes++; |
| 313 | datalen--; |
| 314 | } |
| 315 | fprintf(stdout, "\n"); |
H. Peter Anvin | ea6e34d | 2002-04-30 20:51:32 +0000 | [diff] [blame] | 316 | } |
| 317 | } |
| 318 | |
/*
 * Skip `dist' bytes of data in the file `fp', either by seeking if
 * possible, or if that fails then by reading and discarding.
 *
 * If the data cannot be read in full, a message is printed to stderr
 * and the program exits with status 1.
 */
static void skip(uint32_t dist, FILE * fp)
{
    char buffer[256];           /* should fit on most stacks :-) */
    long pos;

    /*
     * Got to be careful with fseek: at least one fseek I've tried
     * doesn't approve of SEEK_CUR. So I'll use SEEK_SET and
     * ftell... horrible but apparently necessary.
     *
     * Only try the seek when ftell() succeeded and the target
     * position fits in a long; otherwise fall through to reading.
     */
    pos = ftell(fp);
    if (pos >= 0 && dist <= (unsigned long)(LONG_MAX - pos)
        && fseek(fp, pos + (long)dist, SEEK_SET) == 0)
        return;

    while (dist > 0) {
        size_t len = dist < sizeof(buffer) ? dist : sizeof(buffer);
        if (fread(buffer, 1, len, fp) < len) {
            /* errno is only meaningful here if the stream reports an error */
            if (ferror(fp))
                perror("fread");
            else
                fprintf(stderr, "fread: unexpected end of file\n");
            exit(1);
        }
        dist -= (uint32_t)len;
    }
}