| 1 | /* |
| 2 | * ia32rtools |
| 3 | * (C) notaz, 2013-2015 |
| 4 | * |
| 5 | * This work is licensed under the terms of 3-clause BSD license. |
| 6 | * See COPYING file in the top-level directory. |
| 7 | */ |
| 8 | |
| 9 | #define _GNU_SOURCE |
| 10 | #include <stdio.h> |
| 11 | #include <stdlib.h> |
| 12 | #include <string.h> |
| 13 | #include <stdint.h> |
| 14 | #include <inttypes.h> |
| 15 | |
| 16 | #include "my_assert.h" |
| 17 | #include "my_str.h" |
| 18 | #include "common.h" |
| 19 | |
| 20 | #include "protoparse.h" |
| 21 | |
// position in the .asm input; used as the prefix of anote/awarn/aerr messages
static const char *asmfn;
static int asmln;

// prototype of the label that started the current function pointer table;
// set and consulted by check_var(), reset by main()
static const struct parsed_proto *g_func_sym_pp;

// text appended as a trailing comment to the output line being generated
static char g_comment[256];

// number of warnings issued so far (awarn() gives up at the 10th)
static int g_warn_cnt;

// command line switches: -i (skip calling convention validation), -a (ARM)
static int g_cconv_novalidate;
static int g_arm_mode;
| 30 | |
// Data declaration kinds (db/dw/dd/dq/dt).
// note: must be in ascending order of operand size, code compares them
// with relational operators (e.g. 'type >= DXT_DWORD')
enum dx_type {
  DXT_UNSPEC = 0, // not a recognized data directive
  DXT_BYTE   = 1, // db
  DXT_WORD   = 2, // dw
  DXT_DWORD  = 3, // dd
  DXT_QUAD   = 4, // dq
  DXT_TEN    = 5, // dt
};
| 40 | |
// "<asm file>:<line>: <level>: " prefix shared by the diagnostics below
#define AMSG_PREFIX_(level) "%s:%d: " level ": "

// informational message, processing continues
#define anote(fmt, ...) \
  printf(AMSG_PREFIX_("note") fmt, asmfn, asmln, ##__VA_ARGS__)

// warning; the 10th warning closes all streams and terminates the program
#define awarn(fmt, ...) do { \
  printf(AMSG_PREFIX_("warning") fmt, asmfn, asmln, ##__VA_ARGS__); \
  g_warn_cnt++; \
  if (g_warn_cnt == 10) { \
    fcloseall(); \
    exit(1); \
  } \
} while (0)

// fatal error: report, close all streams and terminate with status 1
#define aerr(fmt, ...) do { \
  printf(AMSG_PREFIX_("error") fmt, asmfn, asmln, ##__VA_ARGS__); \
  fcloseall(); \
  exit(1); \
} while (0)
| 55 | |
| 56 | #include "masm_tools.h" |
| 57 | |
/*
 * Extract the next word of 's' into 'w', treating single-quoted text as
 * part of the word.
 *
 * Leading whitespace is skipped with sskip(). The word ends at the NUL
 * terminator, or at a blank or ',' that is not inside single quotes.
 * At most wsize - 1 characters are stored and 'w' is always NUL terminated
 * (unless wsize is 0, in which case nothing is stored or consumed).
 * A warning is printed when the word did not fit.
 *
 * Returns a pointer to the first character of 's' that was not consumed.
 */
static char *next_word_s(char *w, size_t wsize, char *s)
{
  int quote = 0;
  size_t i;

  s = sskip(s);

  // no room even for the terminator; also keeps 'wsize - 1' from wrapping
  if (wsize == 0)
    return s;

  for (i = 0; i < wsize - 1; i++) {
    if (s[i] == '\'')
      quote ^= 1;
    if (s[i] == 0 || (!quote && (my_isblank(s[i]) || s[i] == ',')))
      break;
    w[i] = s[i];
  }
  w[i] = 0;

  // A blank or ',' only ends the word outside of quotes, so when the
  // buffer ran out in the middle of a quoted string the word is truncated
  // no matter what the next character is.
  if (s[i] != 0 && (quote || (!my_isblank(s[i]) && s[i] != ',')))
    printf("warning: '%s' truncated\n", w);

  return s + i;
}
| 79 | |
| 80 | static void next_section(FILE *fasm, char *name) |
| 81 | { |
| 82 | char words[2][256]; |
| 83 | char line[256]; |
| 84 | int wordc; |
| 85 | char *p; |
| 86 | |
| 87 | name[0] = 0; |
| 88 | |
| 89 | while (my_fgets(line, sizeof(line), fasm)) |
| 90 | { |
| 91 | wordc = 0; |
| 92 | asmln++; |
| 93 | |
| 94 | p = sskip(line); |
| 95 | if (*p == 0) |
| 96 | continue; |
| 97 | |
| 98 | if (*p == ';') |
| 99 | continue; |
| 100 | |
| 101 | for (wordc = 0; wordc < ARRAY_SIZE(words); wordc++) { |
| 102 | p = sskip(next_word(words[wordc], sizeof(words[0]), p)); |
| 103 | if (*p == 0 || *p == ';') { |
| 104 | wordc++; |
| 105 | break; |
| 106 | } |
| 107 | } |
| 108 | |
| 109 | if (wordc < 2) |
| 110 | continue; |
| 111 | |
| 112 | if (!IS(words[1], "segment")) |
| 113 | continue; |
| 114 | |
| 115 | strcpy(name, words[0]); |
| 116 | break; |
| 117 | } |
| 118 | } |
| 119 | |
| 120 | static enum dx_type parse_dx_directive(const char *name) |
| 121 | { |
| 122 | if (IS(name, "dd")) |
| 123 | return DXT_DWORD; |
| 124 | if (IS(name, "dw")) |
| 125 | return DXT_WORD; |
| 126 | if (IS(name, "db")) |
| 127 | return DXT_BYTE; |
| 128 | if (IS(name, "dq")) |
| 129 | return DXT_QUAD; |
| 130 | if (IS(name, "dt")) |
| 131 | return DXT_TEN; |
| 132 | |
| 133 | return DXT_UNSPEC; |
| 134 | } |
| 135 | |
| 136 | static const char *type_name(enum dx_type type) |
| 137 | { |
| 138 | switch (type) { |
| 139 | case DXT_BYTE: |
| 140 | return ".byte"; |
| 141 | case DXT_WORD: |
| 142 | return ".hword"; |
| 143 | case DXT_DWORD: |
| 144 | return ".long"; |
| 145 | case DXT_QUAD: |
| 146 | return ".quad"; |
| 147 | case DXT_TEN: |
| 148 | return ".tfloat"; |
| 149 | case DXT_UNSPEC: |
| 150 | break; |
| 151 | } |
| 152 | return "<bad>"; |
| 153 | } |
| 154 | |
| 155 | static const char *type_name_float(enum dx_type type) |
| 156 | { |
| 157 | switch (type) { |
| 158 | case DXT_DWORD: |
| 159 | return ".float"; |
| 160 | case DXT_QUAD: |
| 161 | return ".double"; |
| 162 | case DXT_TEN: |
| 163 | return ".tfloat"; |
| 164 | default: |
| 165 | break; |
| 166 | } |
| 167 | return "<bad_float>"; |
| 168 | } |
| 169 | |
| 170 | static int type_size(enum dx_type type) |
| 171 | { |
| 172 | switch (type) { |
| 173 | case DXT_BYTE: |
| 174 | return 1; |
| 175 | case DXT_WORD: |
| 176 | return 2; |
| 177 | case DXT_DWORD: |
| 178 | return 4; |
| 179 | case DXT_QUAD: |
| 180 | return 8; |
| 181 | case DXT_TEN: |
| 182 | return 10; |
| 183 | case DXT_UNSPEC: |
| 184 | break; |
| 185 | } |
| 186 | return -1; |
| 187 | } |
| 188 | |
/*
 * Return a copy of 's' in which every '"' and '\' is preceded by a
 * backslash, so the text can be placed inside a double-quoted string.
 *
 * The result lives in a static buffer that is overwritten by the next
 * call; 's' itself is not modified. The buffer holds the worst case
 * (every character escaped) of a string that fits a 256 byte word buffer.
 * Longer results are reported with aerr(), which terminates the program,
 * before anything is written out of bounds.
 */
static char *escape_string(char *s)
{
  static char buf[2 * 256];
  size_t n = 0;

  for (; *s != 0; s++) {
    int need_escape = (*s == '"' || *s == '\\');

    // room for the optional backslash, the character and the final NUL
    if (n + need_escape + 2 > sizeof(buf))
      aerr("string is too long\n");

    if (need_escape)
      buf[n++] = '\\';
    buf[n++] = *s;
  }
  buf[n] = 0;

  return buf;
}
| 212 | |
| 213 | static void sprint_pp_short(const struct parsed_proto *pp, char *buf, |
| 214 | size_t buf_size) |
| 215 | { |
| 216 | char *p = buf; |
| 217 | size_t l; |
| 218 | int i; |
| 219 | |
| 220 | if (pp->ret_type.is_ptr) |
| 221 | *p++ = 'p'; |
| 222 | else if (IS(pp->ret_type.name, "void")) |
| 223 | *p++ = 'v'; |
| 224 | else |
| 225 | *p++ = 'i'; |
| 226 | *p++ = '('; |
| 227 | l = 2; |
| 228 | |
| 229 | for (i = 0; i < pp->argc; i++) { |
| 230 | if (pp->arg[i].reg != NULL) |
| 231 | snprintf(buf + l, buf_size - l, "%s%s", |
| 232 | i == 0 ? "" : ",", pp->arg[i].reg); |
| 233 | else |
| 234 | snprintf(buf + l, buf_size - l, "%sa%d", |
| 235 | i == 0 ? "" : ",", i + 1); |
| 236 | l = strlen(buf); |
| 237 | } |
| 238 | snprintf(buf + l, buf_size - l, ")"); |
| 239 | } |
| 240 | |
| 241 | static const struct parsed_proto *check_var(FILE *fhdr, |
| 242 | const char *sym, const char *varname, int is_export) |
| 243 | { |
| 244 | const struct parsed_proto *pp, *pp_sym; |
| 245 | char fp_sym[256], fp_var[256], *p; |
| 246 | int i; |
| 247 | |
| 248 | pp = proto_parse(fhdr, varname, 1); |
| 249 | if (pp == NULL) { |
| 250 | if (IS_START(varname, "sub_")) |
| 251 | awarn("sub_ sym missing proto: '%s'\n", varname); |
| 252 | return NULL; |
| 253 | } |
| 254 | |
| 255 | if (is_export) |
| 256 | return NULL; |
| 257 | if (!pp->is_func && !pp->is_fptr) |
| 258 | return NULL; |
| 259 | |
| 260 | pp_print(fp_var, sizeof(fp_var), pp); |
| 261 | |
| 262 | if (pp->argc_reg == 0) |
| 263 | goto check_sym; |
| 264 | if (pp->argc_reg == 1 && pp->argc_stack == 0 |
| 265 | && IS(pp->arg[0].reg, "ecx")) |
| 266 | { |
| 267 | goto check_sym; |
| 268 | } |
| 269 | if (!g_cconv_novalidate |
| 270 | && (pp->argc_reg != 2 |
| 271 | || !IS(pp->arg[0].reg, "ecx") |
| 272 | || !IS(pp->arg[1].reg, "edx"))) |
| 273 | { |
| 274 | awarn("unhandled reg call: %s\n", fp_var); |
| 275 | } |
| 276 | |
| 277 | check_sym: |
| 278 | // fptrs must use 32bit args, callsite might have no information and |
| 279 | // lack a cast to smaller types, which results in incorrectly masked |
| 280 | // args passed (callee may assume masked args, it does on ARM) |
| 281 | for (i = 0; i < pp->argc; i++) { |
| 282 | if (pp->arg[i].type.is_ptr) |
| 283 | continue; |
| 284 | p = pp->arg[i].type.name; |
| 285 | if (strstr(p, "int8") || strstr(p, "int16") |
| 286 | || strstr(p, "char") || strstr(p, "short")) |
| 287 | { |
| 288 | awarn("reference to %s with arg%d '%s'\n", pp->name, i + 1, p); |
| 289 | } |
| 290 | } |
| 291 | |
| 292 | sprint_pp_short(pp, g_comment, sizeof(g_comment)); |
| 293 | |
| 294 | if (sym != NULL) { |
| 295 | g_func_sym_pp = NULL; |
| 296 | pp_sym = proto_parse(fhdr, sym, 1); |
| 297 | if (pp_sym == NULL) |
| 298 | return pp; |
| 299 | if (!pp_sym->is_fptr) |
| 300 | aerr("func ptr data, but label '%s' !is_fptr\n", pp_sym->name); |
| 301 | g_func_sym_pp = pp_sym; |
| 302 | } |
| 303 | else { |
| 304 | pp_sym = g_func_sym_pp; |
| 305 | if (pp_sym == NULL) |
| 306 | return pp; |
| 307 | } |
| 308 | |
| 309 | if (!pp_compatible_func(pp_sym, pp)) { |
| 310 | pp_print(fp_sym, sizeof(fp_sym), pp_sym); |
| 311 | anote("entry: %s\n", fp_var); |
| 312 | anote("label: %s\n", fp_sym); |
| 313 | awarn("^ mismatch\n"); |
| 314 | } |
| 315 | |
| 316 | return pp; |
| 317 | } |
| 318 | |
| 319 | static void output_decorated_pp(FILE *fout, |
| 320 | const struct parsed_proto *pp) |
| 321 | { |
| 322 | if (pp->name[0] != '_') |
| 323 | fprintf(fout, pp->is_fastcall ? "@" : "_"); |
| 324 | fprintf(fout, "%s", pp->name); |
| 325 | if (pp->is_stdcall && pp->argc > 0) |
| 326 | fprintf(fout, "@%d", pp->argc * 4); |
| 327 | } |
| 328 | |
| 329 | static int align_value(int src_val) |
| 330 | { |
| 331 | if (src_val <= 0) { |
| 332 | awarn("bad align: %d\n", src_val); |
| 333 | src_val = 1; |
| 334 | } |
| 335 | if (!g_arm_mode) |
| 336 | return src_val; |
| 337 | |
| 338 | return __builtin_ffs(src_val) - 1; |
| 339 | } |
| 340 | |
/*
 * qsort()/bsearch() comparator for arrays of C string pointers:
 * both arguments point to a 'char *' and the strings are ordered
 * by strcmp().
 */
static int cmpstringp(const void *p1, const void *p2)
{
  const char * const *lhs = p1;
  const char * const *rhs = p2;

  return strcmp(*lhs, *rhs);
}
| 345 | |
/*
 * Labels of strings that should not end up in the output: main() replaces
 * the data of a matching quoted byte string with a ".skip" of the same
 * length. The table is not sorted here; main() runs qsort() on it before
 * is_unwanted_sym() does its binary search.
 *
 * XXX: maybe move to external file?
 */
static const char *unwanted_syms[] = {
  "aRuntimeError", "aTlossError", "aSingError", "aDomainError",
  "aR6029ThisAppli", "aR6028UnableToI", "aR6027NotEnough",
  "aR6026NotEnough", "aR6025PureVirtu", "aR6024NotEnough",
  "aR6019UnableToO", "aR6018Unexpecte", "aR6017Unexpecte",
  "aR6016NotEnough",
  "aAbnormalProgra",
  "aR6009NotEnough", "aR6008NotEnough", "aR6002FloatingP",
  "aMicrosoftVisua", "aRuntimeErrorPr", "aThisApplicatio",
  "aMicrosoftFindF", "aMicrosoftOffic",
};
| 372 | |
| 373 | static int is_unwanted_sym(const char *sym) |
| 374 | { |
| 375 | return bsearch(&sym, unwanted_syms, ARRAY_SIZE(unwanted_syms), |
| 376 | sizeof(unwanted_syms[0]), cmpstringp) != NULL; |
| 377 | } |
| 378 | |
| 379 | int main(int argc, char *argv[]) |
| 380 | { |
| 381 | FILE *fout, *fasm, *fhdr = NULL, *frlist; |
| 382 | const struct parsed_proto *pp; |
| 383 | int no_decorations = 0; |
| 384 | int header_mode = 0; |
| 385 | int maybe_func_table; |
| 386 | int in_export_table; |
| 387 | int rm_labels_lines; |
| 388 | int is_zero_val; |
| 389 | char comment_char = '#'; |
| 390 | char words[20][256]; |
| 391 | char word[256]; |
| 392 | char line[256]; |
| 393 | char last_sym[32]; |
| 394 | unsigned long val; |
| 395 | unsigned long cnt; |
| 396 | uint64_t val64; |
| 397 | const char *sym; |
| 398 | enum dx_type type; |
| 399 | char **pub_syms; |
| 400 | int pub_sym_cnt = 0; |
| 401 | int pub_sym_alloc; |
| 402 | char **rlist; |
| 403 | int rlist_cnt = 0; |
| 404 | int rlist_alloc; |
| 405 | int is_ro = 0; |
| 406 | int is_label; |
| 407 | int is_bss; |
| 408 | int wordc; |
| 409 | int first; |
| 410 | int arg_out; |
| 411 | int arg = 1; |
| 412 | int len; |
| 413 | int w, i; |
| 414 | char *p; |
| 415 | char *p2; |
| 416 | |
| 417 | if (argc < 4) { |
| 418 | // -nd: no symbol decorations |
| 419 | printf("usage:\n%s [-nd] [-i] [-a] <.s> <.asm> <hdrf> [rlist]*\n" |
| 420 | "%s -hdr <.h> <.asm>\n", |
| 421 | argv[0], argv[0]); |
| 422 | return 1; |
| 423 | } |
| 424 | |
| 425 | for (arg = 1; arg < argc; arg++) { |
| 426 | if (IS(argv[arg], "-nd")) |
| 427 | no_decorations = 1; |
| 428 | else if (IS(argv[arg], "-i")) |
| 429 | g_cconv_novalidate = 1; |
| 430 | else if (IS(argv[arg], "-a")) { |
| 431 | comment_char = '@'; |
| 432 | g_arm_mode = 1; |
| 433 | } |
| 434 | else if (IS(argv[arg], "-hdr")) |
| 435 | header_mode = 1; |
| 436 | else |
| 437 | break; |
| 438 | } |
| 439 | |
| 440 | arg_out = arg++; |
| 441 | |
| 442 | asmfn = argv[arg++]; |
| 443 | fasm = fopen(asmfn, "r"); |
| 444 | my_assert_not(fasm, NULL); |
| 445 | |
| 446 | if (!header_mode) { |
| 447 | hdrfn = argv[arg++]; |
| 448 | fhdr = fopen(hdrfn, "r"); |
| 449 | my_assert_not(fhdr, NULL); |
| 450 | } |
| 451 | |
| 452 | fout = fopen(argv[arg_out], "w"); |
| 453 | my_assert_not(fout, NULL); |
| 454 | |
| 455 | pub_sym_alloc = 64; |
| 456 | pub_syms = malloc(pub_sym_alloc * sizeof(pub_syms[0])); |
| 457 | my_assert_not(pub_syms, NULL); |
| 458 | |
| 459 | rlist_alloc = 64; |
| 460 | rlist = malloc(rlist_alloc * sizeof(rlist[0])); |
| 461 | my_assert_not(rlist, NULL); |
| 462 | |
| 463 | for (; arg < argc; arg++) { |
| 464 | frlist = fopen(argv[arg], "r"); |
| 465 | my_assert_not(frlist, NULL); |
| 466 | |
| 467 | while (my_fgets(line, sizeof(line), frlist)) { |
| 468 | p = sskip(line); |
| 469 | if (*p == 0 || *p == ';' || *p == '#') |
| 470 | continue; |
| 471 | |
| 472 | p = next_word(words[0], sizeof(words[0]), p); |
| 473 | if (words[0][0] == 0) |
| 474 | continue; |
| 475 | |
| 476 | if (rlist_cnt >= rlist_alloc) { |
| 477 | rlist_alloc = rlist_alloc * 2 + 64; |
| 478 | rlist = realloc(rlist, rlist_alloc * sizeof(rlist[0])); |
| 479 | my_assert_not(rlist, NULL); |
| 480 | } |
| 481 | rlist[rlist_cnt++] = strdup(words[0]); |
| 482 | } |
| 483 | |
| 484 | fclose(frlist); |
| 485 | frlist = NULL; |
| 486 | } |
| 487 | |
| 488 | if (rlist_cnt > 0) |
| 489 | qsort(rlist, rlist_cnt, sizeof(rlist[0]), cmpstringp); |
| 490 | |
| 491 | qsort(unwanted_syms, ARRAY_SIZE(unwanted_syms), |
| 492 | sizeof(unwanted_syms[0]), cmpstringp); |
| 493 | |
| 494 | while (1) { |
| 495 | last_sym[0] = 0; |
| 496 | g_func_sym_pp = NULL; |
| 497 | maybe_func_table = 0; |
| 498 | in_export_table = 0; |
| 499 | rm_labels_lines = 0; |
| 500 | |
| 501 | next_section(fasm, line); |
| 502 | if (feof(fasm)) |
| 503 | break; |
| 504 | if (IS(line + 1, "text")) |
| 505 | continue; |
| 506 | |
| 507 | if (IS(line + 1, "rdata")) { |
| 508 | is_ro = 1; |
| 509 | if (!header_mode) |
| 510 | fprintf(fout, "\n.section .rodata\n"); |
| 511 | } |
| 512 | else if (IS(line + 1, "data")) { |
| 513 | is_ro = 0; |
| 514 | if (!header_mode) |
| 515 | fprintf(fout, "\n.data\n"); |
| 516 | } |
| 517 | else |
| 518 | aerr("unhandled section: '%s'\n", line); |
| 519 | |
| 520 | if (!header_mode) |
| 521 | fprintf(fout, ".align %d\n", align_value(4)); |
| 522 | |
| 523 | while (my_fgets(line, sizeof(line), fasm)) |
| 524 | { |
| 525 | is_zero_val = 0; |
| 526 | sym = NULL; |
| 527 | asmln++; |
| 528 | |
| 529 | p = sskip(line); |
| 530 | if (*p == 0) |
| 531 | continue; |
| 532 | |
| 533 | if (*p == ';') { |
| 534 | if (IS_START(p, ";org") && sscanf(p + 5, "%Xh", &i) == 1) { |
| 535 | // ;org is only seen at section start, so assume . addr 0 |
| 536 | i &= 0xfff; |
| 537 | if (i != 0 && !header_mode) |
| 538 | fprintf(fout, "\t\t .skip 0x%x\n", i); |
| 539 | } |
| 540 | else if (IS_START(p, "; Export Address")) |
| 541 | in_export_table = 1; |
| 542 | else if (IS_START(p, "; Export")) |
| 543 | in_export_table = 0; |
| 544 | continue; |
| 545 | } |
| 546 | |
| 547 | for (wordc = 0; wordc < ARRAY_SIZE(words); wordc++) { |
| 548 | p = sskip(next_word_s(words[wordc], sizeof(words[0]), p)); |
| 549 | if (*p == 0 || *p == ';') { |
| 550 | wordc++; |
| 551 | break; |
| 552 | } |
| 553 | if (*p == ',') { |
| 554 | p = sskip(p + 1); |
| 555 | } |
| 556 | } |
| 557 | |
| 558 | if (*p == ';') { |
| 559 | p = sskip(p + 1); |
| 560 | if (IS_START(p, "sctclrtype")) { |
| 561 | maybe_func_table = 0; |
| 562 | g_func_sym_pp = NULL; |
| 563 | } |
| 564 | } |
| 565 | |
| 566 | if (wordc == 2 && IS(words[1], "ends")) |
| 567 | break; |
| 568 | if (wordc <= 2 && IS(words[0], "end")) |
| 569 | break; |
| 570 | if (wordc < 2) |
| 571 | aerr("unhandled: '%s'\n", words[0]); |
| 572 | |
| 573 | // don't cares |
| 574 | if (IS(words[0], "assume")) |
| 575 | continue; |
| 576 | |
| 577 | if (IS(words[0], "align")) { |
| 578 | if (header_mode) |
| 579 | continue; |
| 580 | |
| 581 | val = parse_number(words[1], 0); |
| 582 | fprintf(fout, "\t\t .align %d", align_value(val)); |
| 583 | goto fin; |
| 584 | } |
| 585 | |
| 586 | if (IS(words[0], "public")) { |
| 587 | // skip, sym should appear in header anyway |
| 588 | continue; |
| 589 | } |
| 590 | |
| 591 | w = 1; |
| 592 | type = parse_dx_directive(words[0]); |
| 593 | if (type == DXT_UNSPEC) { |
| 594 | type = parse_dx_directive(words[1]); |
| 595 | sym = words[0]; |
| 596 | w = 2; |
| 597 | } |
| 598 | if (type == DXT_UNSPEC) |
| 599 | aerr("unhandled decl: '%s %s'\n", words[0], words[1]); |
| 600 | |
| 601 | if (sym != NULL) |
| 602 | { |
| 603 | if (header_mode) { |
| 604 | int is_str = 0; |
| 605 | |
| 606 | fprintf(fout, "extern "); |
| 607 | if (is_ro) |
| 608 | fprintf(fout, "const "); |
| 609 | |
| 610 | switch (type) { |
| 611 | case DXT_BYTE: |
| 612 | for (i = w; i < wordc; i++) |
| 613 | if (words[i][0] == '\'') |
| 614 | is_str = 1; |
| 615 | if (is_str) |
| 616 | fprintf(fout, "char %s[];\n", sym); |
| 617 | else |
| 618 | fprintf(fout, "uint8_t %s;\n", sym); |
| 619 | break; |
| 620 | |
| 621 | case DXT_WORD: |
| 622 | fprintf(fout, "uint16_t %s;\n", sym); |
| 623 | break; |
| 624 | |
| 625 | case DXT_DWORD: |
| 626 | fprintf(fout, "uint32_t %s;\n", sym); |
| 627 | break; |
| 628 | |
| 629 | default: |
| 630 | fprintf(fout, "_UNKNOWN %s;\n", sym); |
| 631 | break; |
| 632 | } |
| 633 | |
| 634 | continue; |
| 635 | } |
| 636 | |
| 637 | snprintf(last_sym, sizeof(last_sym), "%s", sym); |
| 638 | maybe_func_table = type == DXT_DWORD; |
| 639 | |
| 640 | if (IS_START(sym, "__IMPORT_DESCRIPTOR_")) { |
| 641 | rm_labels_lines = 5; |
| 642 | maybe_func_table = 0; |
| 643 | } |
| 644 | |
| 645 | pp = proto_parse(fhdr, sym, 1); |
| 646 | if (pp != NULL) { |
| 647 | g_func_sym_pp = NULL; |
| 648 | |
| 649 | // public/global name |
| 650 | if (pub_sym_cnt >= pub_sym_alloc) { |
| 651 | pub_sym_alloc *= 2; |
| 652 | pub_syms = realloc(pub_syms, pub_sym_alloc * sizeof(pub_syms[0])); |
| 653 | my_assert_not(pub_syms, NULL); |
| 654 | } |
| 655 | pub_syms[pub_sym_cnt++] = strdup(sym); |
| 656 | } |
| 657 | |
| 658 | len = strlen(sym); |
| 659 | fprintf(fout, "%s%s:", no_decorations ? "" : "_", sym); |
| 660 | |
| 661 | len += 2; |
| 662 | if (len < 8) |
| 663 | fprintf(fout, "\t"); |
| 664 | if (len < 16) |
| 665 | fprintf(fout, "\t"); |
| 666 | if (len <= 16) |
| 667 | fprintf(fout, " "); |
| 668 | else |
| 669 | fprintf(fout, " "); |
| 670 | } |
| 671 | else { |
| 672 | if (header_mode) |
| 673 | continue; |
| 674 | |
| 675 | fprintf(fout, "\t\t "); |
| 676 | } |
| 677 | |
| 678 | // fill out some unwanted strings with zeroes.. |
| 679 | if (type == DXT_BYTE && words[w][0] == '\'' |
| 680 | && is_unwanted_sym(last_sym)) |
| 681 | { |
| 682 | len = 0; |
| 683 | for (; w < wordc; w++) { |
| 684 | if (words[w][0] == '\'') { |
| 685 | p = words[w] + 1; |
| 686 | for (; *p && *p != '\''; p++) |
| 687 | len++; |
| 688 | } |
| 689 | else { |
| 690 | // assume encoded byte |
| 691 | len++; |
| 692 | } |
| 693 | } |
| 694 | fprintf(fout, ".skip %d", len); |
| 695 | goto fin; |
| 696 | } |
| 697 | else if (type == DXT_BYTE |
| 698 | && (words[w][0] == '\'' |
| 699 | || (w + 1 < wordc && words[w + 1][0] == '\''))) |
| 700 | { |
| 701 | // string; use asciz for most common case |
| 702 | if (w == wordc - 2 && IS(words[w + 1], "0")) { |
| 703 | fprintf(fout, ".asciz \""); |
| 704 | wordc--; |
| 705 | } |
| 706 | else |
| 707 | fprintf(fout, ".ascii \""); |
| 708 | |
| 709 | for (; w < wordc; w++) { |
| 710 | if (words[w][0] == '\'') { |
| 711 | p = words[w] + 1; |
| 712 | p2 = strchr(p, '\''); |
| 713 | if (p2 == NULL) |
| 714 | aerr("unterminated string? '%s'\n", p); |
| 715 | memcpy(word, p, p2 - p); |
| 716 | word[p2 - p] = 0; |
| 717 | fprintf(fout, "%s", escape_string(word)); |
| 718 | } |
| 719 | else { |
| 720 | val = parse_number(words[w], 0); |
| 721 | if (val & ~0xff) |
| 722 | aerr("bad string trailing byte?\n"); |
| 723 | // unfortunately \xHH is unusable - gas interprets |
| 724 | // things like \x27b as 0x7b, so have to use octal here |
| 725 | fprintf(fout, "\\%03lo", val); |
| 726 | } |
| 727 | } |
| 728 | fprintf(fout, "\""); |
| 729 | goto fin; |
| 730 | } |
| 731 | |
| 732 | if (w == wordc - 2) { |
| 733 | if (IS_START(words[w + 1], "dup(")) { |
| 734 | cnt = parse_number(words[w], 0); |
| 735 | p = words[w + 1] + 4; |
| 736 | p2 = strchr(p, ')'); |
| 737 | if (p2 == NULL) |
| 738 | aerr("bad dup?\n"); |
| 739 | memmove(word, p, p2 - p); |
| 740 | word[p2 - p] = 0; |
| 741 | |
| 742 | val = 0; |
| 743 | if (!IS(word, "?")) |
| 744 | val = parse_number(word, 0); |
| 745 | |
| 746 | fprintf(fout, ".fill 0x%02lx,%d,0x%02lx", |
| 747 | cnt, type_size(type), val); |
| 748 | goto fin; |
| 749 | } |
| 750 | } |
| 751 | |
| 752 | if (type == DXT_DWORD && words[w][0] == '\'' |
| 753 | && words[w][5] == '\'' && strlen(words[w]) == 6) |
| 754 | { |
| 755 | if (w != wordc - 1) |
| 756 | aerr("TODO\n"); |
| 757 | |
| 758 | p = words[w]; |
| 759 | val = (p[1] << 24) | (p[2] << 16) | (p[3] << 8) | p[4]; |
| 760 | fprintf(fout, ".long 0x%lx", val); |
| 761 | snprintf(g_comment, sizeof(g_comment), "%s", words[w]); |
| 762 | goto fin; |
| 763 | } |
| 764 | |
| 765 | if (type >= DXT_DWORD && strchr(words[w], '.')) |
| 766 | { |
| 767 | if (w != wordc - 1) |
| 768 | aerr("TODO\n"); |
| 769 | |
| 770 | if (g_arm_mode && type == DXT_TEN) { |
| 771 | fprintf(fout, ".fill 10"); |
| 772 | snprintf(g_comment, sizeof(g_comment), "%s %s", |
| 773 | type_name_float(type), words[w]); |
| 774 | } |
| 775 | else |
| 776 | fprintf(fout, "%s %s", type_name_float(type), words[w]); |
| 777 | goto fin; |
| 778 | } |
| 779 | |
| 780 | first = 1; |
| 781 | fprintf(fout, "%s ", type_name(type)); |
| 782 | for (; w < wordc; w++) |
| 783 | { |
| 784 | if (!first) |
| 785 | fprintf(fout, ", "); |
| 786 | |
| 787 | is_label = is_bss = 0; |
| 788 | if (w <= wordc - 2 && IS(words[w], "offset")) { |
| 789 | is_label = 1; |
| 790 | w++; |
| 791 | } |
| 792 | else if (IS(words[w], "?")) { |
| 793 | is_bss = 1; |
| 794 | } |
| 795 | else if (type == DXT_DWORD |
| 796 | && !('0' <= words[w][0] && words[w][0] <= '9')) |
| 797 | { |
| 798 | // assume label |
| 799 | is_label = 1; |
| 800 | } |
| 801 | |
| 802 | if (is_bss) { |
| 803 | fprintf(fout, "0"); |
| 804 | } |
| 805 | else if (is_label) { |
| 806 | p = words[w]; |
| 807 | if (IS_START(p, "loc_") || IS_START(p, "__imp") |
| 808 | || strchr(p, '?') || strchr(p, '@') |
| 809 | || rm_labels_lines > 0 |
| 810 | || bsearch(&p, rlist, rlist_cnt, sizeof(rlist[0]), |
| 811 | cmpstringp)) |
| 812 | { |
| 813 | fprintf(fout, "0"); |
| 814 | snprintf(g_comment, sizeof(g_comment), "%s", p); |
| 815 | } |
| 816 | else { |
| 817 | const char *f_sym = maybe_func_table ? last_sym : NULL; |
| 818 | |
| 819 | pp = check_var(fhdr, f_sym, p, in_export_table); |
| 820 | if (pp == NULL) { |
| 821 | fprintf(fout, "%s%s", |
| 822 | (no_decorations || p[0] == '_') ? "" : "_", p); |
| 823 | } |
| 824 | else { |
| 825 | if (no_decorations) |
| 826 | fprintf(fout, "%s", pp->name); |
| 827 | else |
| 828 | output_decorated_pp(fout, pp); |
| 829 | } |
| 830 | } |
| 831 | } |
| 832 | else { |
| 833 | val64 = parse_number(words[w], 1); |
| 834 | if (val64 < 10) |
| 835 | fprintf(fout, "%d", (int)val64); |
| 836 | else |
| 837 | fprintf(fout, "0x%" PRIx64, val64); |
| 838 | |
| 839 | is_zero_val = val64 == 0; |
| 840 | } |
| 841 | |
| 842 | first = 0; |
| 843 | } |
| 844 | |
| 845 | fin: |
| 846 | if (!is_zero_val) |
| 847 | maybe_func_table = 0; |
| 848 | |
| 849 | if (rm_labels_lines > 0) |
| 850 | rm_labels_lines--; |
| 851 | |
| 852 | if (g_comment[0] != 0) { |
| 853 | fprintf(fout, "\t\t%c %s", comment_char, g_comment); |
| 854 | g_comment[0] = 0; |
| 855 | } |
| 856 | fprintf(fout, "\n"); |
| 857 | } |
| 858 | } |
| 859 | |
| 860 | fprintf(fout, "\n"); |
| 861 | |
| 862 | // dump public syms |
| 863 | for (i = 0; i < pub_sym_cnt; i++) |
| 864 | fprintf(fout, ".global %s%s\n", |
| 865 | no_decorations ? "" : "_", pub_syms[i]); |
| 866 | |
| 867 | fclose(fout); |
| 868 | fclose(fasm); |
| 869 | if (fhdr != NULL) |
| 870 | fclose(fhdr); |
| 871 | |
| 872 | return 0; |
| 873 | } |
| 874 | |
| 875 | // vim:ts=2:shiftwidth=2:expandtab |