// Element count of a true array (must not be used on a pointer).
#define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0]))
// 1 when the strings w and y are equal, 0 otherwise.
#define IS(w, y) (strcmp((w), (y)) == 0)
// 1 when w begins with the prefix y, 0 otherwise; y is evaluated twice,
// so it must be free of side effects.
#define IS_START(w, y) (strncmp((w), (y), strlen(y)) == 0)
13 #include "protoparse.h"
// Path of the input .asm file: opened by main() and printed as the file-name
// part of every anote/awarn/aerr diagnostic.
15 static const char *asmfn;
// Prototype cached for the symbol currently being processed: assigned in
// check_var() and reset to NULL from main().
18 static const struct parsed_proto *g_func_sym_pp;
// Text that main() appends to the current output line as a "# ..." comment
// whenever it is non-empty.
19 static char g_comment[256];
// Number of warnings issued so far; incremented by awarn(), which tests for
// the 10th one (TODO confirm what it does at that point).
20 static int g_warn_cnt;
// Set to 1 by the "-i" option; check_var() consults it before warning about
// an "unhandled reg call".
21 static int g_cconv_novalidate;
23 // note: must be in ascending order
// Diagnostics: each macro prints "<asmfn>:<asmln>: <severity>: " followed by
// a printf-style message to stdout.
//   anote - informational note
//   awarn - warning; also increments g_warn_cnt and tests for the 10th warning
//   aerr  - error (NOTE(review): presumably terminates afterwards - confirm)
// ##__VA_ARGS__ is the GNU extension that drops the preceding comma when no
// variadic arguments are passed, e.g. awarn("^ mismatch\n").
33 #define anote(fmt, ...) \
34 printf("%s:%d: note: " fmt, asmfn, asmln, ##__VA_ARGS__)
35 #define awarn(fmt, ...) do { \
36 printf("%s:%d: warning: " fmt, asmfn, asmln, ##__VA_ARGS__); \
37 if (++g_warn_cnt == 10) { \
42 #define aerr(fmt, ...) do { \
43 printf("%s:%d: error: " fmt, asmfn, asmln, ##__VA_ARGS__); \
48 #include "masm_tools.h"
// Extracts the next word from s into w, whose capacity is wsize bytes.
// At most wsize - 1 characters are examined. A word ends at the NUL, or -
// when not inside a quote - at a blank or a ','.
// The returned pointer is what main() hands to sskip() to continue scanning
// (presumably the position just past the word - confirm).
50 static char *next_word_s(char *w, size_t wsize, char *s)
57 for (i = 0; i < wsize - 1; i++) {
60 if (s[i] == 0 || (!quote && (my_isblank(s[i]) || s[i] == ',')))
// the scan stopped on a character that still belongs to the word, so w does
// not hold all of it: report the truncation
66 if (s[i] != 0 && !my_isblank(s[i]) && s[i] != ',')
67 printf("warning: '%s' truncated\n", w);
// Reads fasm line by line looking for a "<name> segment" line and copies
// <name> (the first word of that line) into the caller's buffer `name`.
// NOTE(review): the copy is an unbounded strcpy(); the caller's buffer must be
// at least as large as one words[] entry - confirm.
72 static void next_section(FILE *fasm, char *name)
81 while (fgets(line, sizeof(line), fasm))
// the buffer came back completely full, so the physical line is longer than
// the buffer: keep reading to get past it
91 while (strlen(line) == sizeof(line) - 1) {
92 // one of those long comment lines..
93 if (!fgets(line, sizeof(line), fasm))
// split the line into words, stopping at end of line or at a ';'
99 for (wordc = 0; wordc < ARRAY_SIZE(words); wordc++) {
100 p = sskip(next_word(words[wordc], sizeof(words[0]), p));
101 if (*p == 0 || *p == ';') {
// only lines whose second word is "segment" are of interest
110 if (!IS(words[1], "segment"))
113 strcpy(name, words[0]);
// Classifies a directive word as an enum dx_type value. main() tries it on
// words[0] and then words[1], and treats DXT_UNSPEC as "not a data directive".
118 static enum dx_type parse_dx_directive(const char *name)
// Returns the string main() writes to the output, followed by a space, ahead
// of the value list of a declaration of the given type.
134 static const char *type_name(enum dx_type type)
// Counterpart of type_name() that main() uses when a value of type
// DXT_DWORD or above contains a '.'.
153 static const char *type_name_float(enum dx_type type)
// fallback result (presumably for types that have no float form - confirm)
165 return "<bad_float>";
// Returns the element size for the given type; main() passes it as the size
// argument of the ".fill" directive (unit presumably bytes - confirm).
168 static int type_size(enum dx_type type)
// Walks the characters of s, then copies the contents of `buf` back with
// strcpy() and returns strcpy's result. main() prints the returned string
// inside a quoted .ascii/.asciz literal.
// NOTE(review): the loop advances s itself, so unless s is reset before the
// return, the strcpy() destination is the end of the input rather than its
// start - confirm this is intended and that the caller's buffer has room for
// both the input and the escaped copy.
187 static char *escape_string(char *s)
192 for (; *s != 0; s++) {
206 return strcpy(s, buf);
// Formats a short summary of prototype pp into buf. The return type is
// classified first (pointer / "void" / other), then the arguments are listed
// comma-separated and the text is closed with ')'. `l` is the current write
// offset into buf and buf_size - l the space left for each snprintf().
209 static void sprint_pp_short(const struct parsed_proto *pp, char *buf,
216 if (pp->ret_type.is_ptr)
218 else if (IS(pp->ret_type.name, "void"))
// one entry per argument: the register name when the argument has one,
// otherwise "a<N>" with N counting from 1; a ',' precedes every entry but
// the first
225 for (i = 0; i < pp->argc; i++) {
226 if (pp->arg[i].reg != NULL)
227 snprintf(buf + l, buf_size - l, "%s%s",
228 i == 0 ? "" : ",", pp->arg[i].reg);
230 snprintf(buf + l, buf_size - l, "%sa%d",
231 i == 0 ? "" : ",", i + 1);
234 snprintf(buf + l, buf_size - l, ")");
// Looks up the prototype of `varname` (a name referenced from the data of
// symbol `sym`) in header fhdr and cross-checks it against the prototype of
// `sym` itself. Returns a prototype pointer that main() uses to print the
// (possibly decorated) name.
// Diagnostics visible here: a warning for "sub_" names with no prototype, a
// warning for register-argument layouts other than ecx / ecx+edx (unless -i
// was given), an error when `sym` is not a function pointer, and a
// "^ mismatch" warning when the two prototypes disagree.
237 static const struct parsed_proto *check_var(FILE *fhdr,
238 const char *sym, const char *varname)
240 const struct parsed_proto *pp, *pp_sym;
241 char fp_sym[256], fp_var[256];
// prototype of the referenced name
244 pp = proto_parse(fhdr, varname, 1);
246 if (IS_START(varname, "sub_"))
247 awarn("sub_ sym missing proto: '%s'\n", varname);
251 if (!pp->is_func && !pp->is_fptr)
// printable form of the variable's prototype, used in the messages below
254 pp_print(fp_var, sizeof(fp_var), pp);
// register-argument layouts: none, a single ecx argument with no stack
// arguments, or exactly ecx + edx; anything else is reported
256 if (pp->argc_reg == 0)
258 if (pp->argc_reg == 1 && pp->argc_stack == 0
259 && IS(pp->arg[0].reg, "ecx"))
263 if (!g_cconv_novalidate
264 && (pp->argc_reg != 2
265 || !IS(pp->arg[0].reg, "ecx")
266 || !IS(pp->arg[1].reg, "edx")))
268 awarn("unhandled reg call: %s\n", fp_var);
// leave a short signature in g_comment for main() to append to the line
272 sprint_pp_short(pp, g_comment, sizeof(g_comment));
// prototype of the data symbol: looked up here and cached in g_func_sym_pp,
// or taken back from that cache
275 g_func_sym_pp = NULL;
276 pp_sym = proto_parse(fhdr, sym, 1);
279 if (!pp_sym->is_fptr)
280 aerr("func ptr data, but label '%s' !is_fptr\n", pp_sym->name);
281 g_func_sym_pp = pp_sym;
284 pp_sym = g_func_sym_pp;
// compare argument counts, then per argument whether it is passed in a
// register and, if so, in which one
289 if (pp->argc != pp_sym->argc || pp->argc_reg != pp_sym->argc_reg)
292 for (i = 0; i < pp->argc; i++) {
293 if ((pp->arg[i].reg != NULL) != (pp_sym->arg[i].reg != NULL)) {
297 if ((pp->arg[i].reg != NULL)
298 && !IS(pp->arg[i].reg, pp_sym->arg[i].reg))
// report both prototypes side by side
307 pp_print(fp_sym, sizeof(fp_sym), pp_sym);
308 anote("var: %s\n", fp_var);
309 anote("sym: %s\n", fp_sym);
310 awarn("^ mismatch\n");
// Writes pp->name to fout with calling-convention decoration:
//  - a prefix, '@' for fastcall and '_' otherwise, unless the name already
//    starts with '_'
//  - a "@<argc * 4>" suffix for stdcall prototypes that take arguments
// NOTE(review): the prefix is passed as the fprintf() format string; both
// alternatives are fixed literals without '%', so this is safe as written.
316 static void output_decorated_pp(FILE *fout,
317 const struct parsed_proto *pp)
319 if (pp->name[0] != '_')
320 fprintf(fout, pp->is_fastcall ? "@" : "_");
321 fprintf(fout, "%s", pp->name);
322 if (pp->is_stdcall && pp->argc > 0)
323 fprintf(fout, "@%d", pp->argc * 4);
// Comparator for qsort()/bsearch() over arrays of string pointers: p1 and p2
// point at array elements (each a char *), so each is dereferenced once and
// the strings are ordered with strcmp().
326 static int cmpstringp(const void *p1, const void *p2)
328 return strcmp(*(char * const *)p1, *(char * const *)p2);
// Symbol names looked up by is_unwanted_sym(). main() sorts this table with
// qsort()/cmpstringp at startup, which is what makes the bsearch() valid.
331 /* XXX: maybe move to external file? */
332 static const char *unwanted_syms[] = {
// Returns non-zero when sym is listed in unwanted_syms.
// Uses bsearch() with cmpstringp, so the table must already be sorted in
// that order; main() does this with qsort() before any lookup. &sym is
// passed because the comparator expects pointers to string pointers.
358 static int is_unwanted_sym(const char *sym)
360 return bsearch(&sym, unwanted_syms, ARRAY_SIZE(unwanted_syms),
361 sizeof(unwanted_syms[0]), cmpstringp) != NULL;
// Program entry point. Per the usage text the arguments are
//   [-nd] [-i] <.s> <.asm> <hdrf> [rlist]*
// The .asm input is read section by section and its data declarations are
// rewritten as assembler directives (.section/.data/.align/.ascii/.asciz/
// .fill/.long/.skip/.global) in the output file, using prototypes looked up
// in the header file through proto_parse() and check_var().
364 int main(int argc, char *argv[])
366 FILE *fout, *fasm, *fhdr, *frlist;
367 const struct parsed_proto *pp;
368 int no_decorations = 0;
395 // -nd: no symbol decorations
396 printf("usage:\n%s [-nd] [-i] <.s> <.asm> <hdrf> [rlist]*\n",
// option flags come first: -nd (no symbol decorations) and -i, which sets
// g_cconv_novalidate
401 for (arg = 1; arg < argc; arg++) {
402 if (IS(argv[arg], "-nd"))
404 else if (IS(argv[arg], "-i"))
405 g_cconv_novalidate = 1;
// open the asm input, the prototype header and the output file; each result
// is checked with my_assert_not(x, NULL) (presumably fatal on NULL - confirm)
413 fasm = fopen(asmfn, "r");
414 my_assert_not(fasm, NULL);
417 fhdr = fopen(hdrfn, "r");
418 my_assert_not(fhdr, NULL);
420 fout = fopen(argv[arg_out], "w");
421 my_assert_not(fout, NULL);
// growable arrays: pub_syms collects the symbol names for the final .global
// list, rlist collects the names read from the rlist files
424 pub_syms = malloc(pub_sym_alloc * sizeof(pub_syms[0]));
425 my_assert_not(pub_syms, NULL);
428 rlist = malloc(rlist_alloc * sizeof(rlist[0]));
429 my_assert_not(rlist, NULL);
// every remaining argument is an rlist file; the first word of each line is
// stored (empty lines and lines starting with ';' are tested for separately)
431 for (; arg < argc; arg++) {
432 frlist = fopen(argv[arg], "r");
433 my_assert_not(frlist, NULL);
435 while (fgets(line, sizeof(line), frlist)) {
437 if (*p == 0 || *p == ';')
440 p = next_word(words[0], sizeof(words[0]), p);
441 if (words[0][0] == 0)
// grow the list (double + 64) when it is full
444 if (rlist_cnt >= rlist_alloc) {
445 rlist_alloc = rlist_alloc * 2 + 64;
446 rlist = realloc(rlist, rlist_alloc * sizeof(rlist[0]));
447 my_assert_not(rlist, NULL);
// NOTE(review): the strdup() result is stored without a check on this line
449 rlist[rlist_cnt++] = strdup(words[0]);
// sort both tables with cmpstringp so they can be searched with bsearch()
457 qsort(rlist, rlist_cnt, sizeof(rlist[0]), cmpstringp);
459 qsort(unwanted_syms, ARRAY_SIZE(unwanted_syms),
460 sizeof(unwanted_syms[0]), cmpstringp);
// next_section() stores the segment name in line; the comparisons below
// skip its first character (line + 1)
465 next_section(fasm, line);
468 if (IS(line + 1, "text"))
471 if (IS(line + 1, "rdata"))
472 fprintf(fout, "\n.section .rodata\n");
473 else if (IS(line + 1, "data"))
474 fprintf(fout, "\n.data\n");
476 aerr("unhandled section: '%s'\n", line);
478 fprintf(fout, ".align 4\n");
// process the lines of the current section
480 while (fgets(line, sizeof(line), fasm))
486 if (*p == 0 || *p == ';')
// split the line into words, stopping at end of line or at a ';'
489 for (wordc = 0; wordc < ARRAY_SIZE(words); wordc++) {
490 p = sskip(next_word_s(words[wordc], sizeof(words[0]), p));
491 if (*p == 0 || *p == ';') {
502 if (IS_START(p, "sctclrtype"))
503 g_func_sym_pp = NULL;
// "ends", "end", "assume" and "align" are recognized before data declarations
506 if (wordc == 2 && IS(words[1], "ends"))
508 if (wordc <= 2 && IS(words[0], "end"))
511 aerr("unhandled: '%s'\n", words[0]);
514 if (IS(words[0], "assume"))
517 if (IS(words[0], "align")) {
518 val = parse_number(words[1]);
519 fprintf(fout, "\t\t .align %ld", val);
// the data directive is words[0] or, failing that, words[1]
524 type = parse_dx_directive(words[0]);
525 if (type == DXT_UNSPEC) {
526 type = parse_dx_directive(words[1]);
530 if (type == DXT_UNSPEC)
531 aerr("unhandled decl: '%s %s'\n", words[0], words[1]);
// remember the symbol name for the is_unwanted_sym() test further down
534 snprintf(last_sym, sizeof(last_sym), "%s", sym);
536 pp = proto_parse(fhdr, sym, 1);
538 g_func_sym_pp = NULL;
540 // public/global name
541 if (pub_sym_cnt >= pub_sym_alloc) {
543 pub_syms = realloc(pub_syms, pub_sym_alloc * sizeof(pub_syms[0]));
544 my_assert_not(pub_syms, NULL);
546 pub_syms[pub_sym_cnt++] = strdup(sym);
// emit the label, prefixed with '_' unless decorations are disabled
550 fprintf(fout, "%s%s:", no_decorations ? "" : "_", sym);
563 fprintf(fout, "\t\t ");
566 // fill out some unwanted strings with zeroes..
567 if (type == DXT_BYTE && words[w][0] == '\''
568 && is_unwanted_sym(last_sym))
571 for (; w < wordc; w++) {
572 if (words[w][0] == '\'') {
574 for (; *p && *p != '\''; p++)
578 // assume encoded byte
// reserve len bytes instead of emitting the string data
582 fprintf(fout, ".skip %d", len);
585 else if (type == DXT_BYTE
586 && (words[w][0] == '\''
587 || (w + 1 < wordc && words[w + 1][0] == '\'')))
589 // string; use asciz for most common case
590 if (w == wordc - 2 && IS(words[w + 1], "0")) {
591 fprintf(fout, ".asciz \"");
595 fprintf(fout, ".ascii \"");
// quoted pieces are written escaped, numeric pieces as \x escapes
597 for (; w < wordc; w++) {
598 if (words[w][0] == '\'') {
600 p2 = strchr(p, '\'');
602 aerr("unterminated string? '%s'\n", p);
// NOTE(review): the copy length p2 - p is not bounded against the size of
// word on the lines visible here - confirm it cannot overflow
603 memcpy(word, p, p2 - p);
605 fprintf(fout, "%s", escape_string(word));
608 val = parse_number(words[w]);
610 aerr("bad string trailing byte?\n");
611 fprintf(fout, "\\x%02lx", val);
// "<count> dup(<value>)" becomes ".fill count,size,value"
618 if (w == wordc - 2) {
619 if (IS_START(words[w + 1], "dup(")) {
620 cnt = parse_number(words[w]);
621 p = words[w + 1] + 4;
625 memmove(word, p, p2 - p);
630 val = parse_number(word);
632 fprintf(fout, ".fill 0x%02lx,%d,0x%02lx",
633 cnt, type_size(type), val);
// a quoted 4-character constant in a dword is packed with its first
// character in the top byte; the original text is kept as the line comment
// NOTE(review): p[n] is a plain char shifted as int, so characters with the
// high bit set would misbehave - presumably only ASCII occurs; confirm
638 if (type == DXT_DWORD && words[w][0] == '\''
639 && words[w][5] == '\'' && strlen(words[w]) == 6)
645 val = (p[1] << 24) | (p[2] << 16) | (p[3] << 8) | p[4];
646 fprintf(fout, ".long 0x%lx", val);
647 snprintf(g_comment, sizeof(g_comment), "%s", words[w]);
// a value containing '.' in a dword-or-larger declaration is written with
// the float directive name
651 if (type >= DXT_DWORD && strchr(words[w], '.'))
656 fprintf(fout, "%s %s", type_name_float(type), words[w]);
// general case: directive name followed by the list of values
661 fprintf(fout, "%s ", type_name(type));
662 for (; w < wordc; w++)
667 is_label = is_bss = 0;
// a value is an "offset <label>", a "?" placeholder, a dword that does not
// start with a digit, or a plain number
668 if (w <= wordc - 2 && IS(words[w], "offset")) {
672 else if (IS(words[w], "?")) {
675 else if (type == DXT_DWORD
676 && !('0' <= words[w][0] && words[w][0] <= '9'))
// names starting with "loc_" or "__imp", containing '?' or '@', or listed
// in rlist are singled out before the header cross-check
687 if (IS_START(p, "loc_") || IS_START(p, "__imp")
688 || strchr(p, '?') || strchr(p, '@')
689 || bsearch(&p, rlist, rlist_cnt, sizeof(rlist[0]),
693 snprintf(g_comment, sizeof(g_comment), "%s", p);
// cross-check the referenced name against the header prototypes
696 pp = check_var(fhdr, sym, p);
698 fprintf(fout, "%s%s",
699 (no_decorations || p[0] == '_') ? "" : "_", p);
703 fprintf(fout, "%s", pp->name);
705 output_decorated_pp(fout, pp);
// plain numbers are written in decimal or in hex
710 val = parse_number(words[w]);
712 fprintf(fout, "%ld", val);
714 fprintf(fout, "0x%lx", val);
// append any pending comment text to the output line
721 if (g_comment[0] != 0) {
722 fprintf(fout, "\t\t# %s", g_comment);
// finally declare every collected symbol as .global, with the same '_'
// prefix rule as the labels
732 for (i = 0; i < pub_sym_cnt; i++)
733 fprintf(fout, ".global %s%s\n",
734 no_decorations ? "" : "_", pub_syms[i]);
743 // vim:ts=2:shiftwidth=2:expandtab