+/*
+ * ia32rtools
+ * (C) notaz, 2013,2014
+ *
+ * This work is licensed under the terms of 3-clause BSD license.
+ * See COPYING file in the top-level directory.
+ */
struct parsed_proto;
unsigned int is_array:1;
unsigned int is_ptr:1;
unsigned int is_struct:1; // split for args
+ unsigned int is_retreg:1; // register to return to caller
+ unsigned int is_va_list:1;
+ unsigned int is_64bit:1;
+ unsigned int is_float:1; // float, double
};
struct parsed_proto_arg {
char *reg;
struct parsed_type type;
- struct parsed_proto *fptr;
+ struct parsed_proto *pp; // fptr or struct
void *datap;
+ unsigned int is_saved:1; // not set here, for tool use
};
struct parsed_proto {
unsigned int is_fastcall:1;
unsigned int is_vararg:1; // vararg func
unsigned int is_fptr:1;
+ unsigned int is_import:1; // data import
unsigned int is_noreturn:1;
unsigned int is_unresolved:1;
- unsigned int is_arg:1; // decl in func arg
+ unsigned int is_guessed:1; // for extra checking
+ unsigned int is_userstack:1;
+ unsigned int is_include:1; // not from top-level header
+ unsigned int is_osinc:1; // OS/system library func
+ unsigned int is_cinc:1; // crt library func
+ unsigned int is_arg:1; // declared in some func arg
unsigned int has_structarg:1;
+ unsigned int has_retreg:1;
+};
+
+struct parsed_struct {
+ char name[256];
+ struct {
+ int offset;
+ struct parsed_proto pp;
+ } members[64];
+ int member_count;
};
static const char *hdrfn;
static void pp_copy_arg(struct parsed_proto_arg *d,
const struct parsed_proto_arg *s);
-static int b_pp_c_handler(char *proto, const char *fname);
+static int b_pp_c_handler(char *proto, const char *fname,
+ int is_include, int is_osinc, int is_cinc);
+static int struct_handler(FILE *fhdr, char *proto, int *line);
-static int do_protostrs(FILE *fhdr, const char *fname)
+static int do_protostrs(FILE *fhdr, const char *fname, int is_include)
{
const char *finc_name;
const char *hdrfn_saved;
char protostr[256];
char path[256];
char fname_inc[256];
+ int is_osinc;
+ int is_cinc;
FILE *finc;
int line = 0;
int ret;
hdrfn_saved = hdrfn;
hdrfn = fname;
+ is_cinc = strstr(fname, "stdc.hlist") != NULL;
+ is_osinc = is_cinc || strstr(fname, "win32.hlist") != NULL;
+
while (fgets(protostr, sizeof(protostr), fhdr))
{
line++;
fname_inc, line, finc_name);
continue;
}
- ret = do_protostrs(finc, finc_name);
+ ret = do_protostrs(finc, finc_name, 1);
fclose(finc);
if (ret < 0)
break;
hdrfline = line;
- ret = b_pp_c_handler(protostr, hdrfn);
+ if (!strncmp(protostr, "struct", 6)
+ && strchr(protostr, '{') != NULL)
+ ret = struct_handler(fhdr, protostr, &line);
+ else
+ ret = b_pp_c_handler(protostr, hdrfn,
+ is_include, is_osinc, is_cinc);
if (ret < 0)
break;
}
return -1;
}
-static int get_regparm(char *dst, size_t dlen, char *p)
+static int get_regparm(char *dst, size_t dlen, char *p, int *retreg)
{
- int i, o;
+ int i = 0, o;
+
+ *retreg = 0;
if (*p != '<')
return 0;
- for (o = 0, i = 1; o < dlen; i++) {
+ i++;
+ if (p[i] == '*') {
+ *retreg = 1;
+ i++;
+ }
+
+ for (o = 0; o < dlen; i++) {
if (p[i] == 0)
return 0;
if (p[i] == '>')
"const",
"signed",
"unsigned",
- "struct",
"enum",
"CONST",
"volatile",
static const char *known_ptr_types[] = {
"FARPROC",
"WNDPROC",
+ "LINECALLBACK",
"HACCEL",
"HANDLE",
"HBITMAP",
+ "HBRUSH",
+ "HCALL",
"HCURSOR",
"HDC",
"HFONT",
"HGDIOBJ",
"HGLOBAL",
+ "HHOOK",
"HICON",
"HINSTANCE",
- //"HIMC", // DWORD
+ "HIMC", // DWORD in mingw, ptr in wine..
+ "HLINE",
+ "HLINEAPP",
+ "HLOCAL",
"HMODULE",
"HPALETTE",
"HRGN",
"HRSRC",
"HKEY",
"HMENU",
+ "HMONITOR",
+ "HWAVEOUT",
"HWND",
+ "PAPPBARDATA",
"PBYTE",
"PCRITICAL_SECTION",
+ "PDEVMODEA",
"PDWORD",
"PFILETIME",
+ "PLARGE_INTEGER",
+ "PHANDLE",
"PHKEY",
"PLONG",
"PMEMORY_BASIC_INFORMATION",
"PUINT",
+ "PULARGE_INTEGER",
+ "PULONG_PTR",
"PVOID",
"PCVOID",
"PWORD",
+ "REFCLSID",
+ "REFGUID",
+ "REFIID",
+ "HOOKPROC",
"DLGPROC",
"TIMERPROC",
"WNDENUMPROC",
"WINADVAPI",
};
-// returns ptr to char after type ends
static int typecmp(const char *n, const char *t)
{
for (; *t != 0; n++, t++) {
n = skip_type_mod(name);
+ if (!strncmp(n, "struct", 6) && my_isblank(n[6])) {
+ type->is_struct = 1;
+
+ n += 6;
+ while (my_isblank(*n))
+ n++;
+ }
+
for (i = 0; i < ARRAY_SIZE(known_ptr_types); i++) {
if (typecmp(n, known_ptr_types[i]))
continue;
ret = n1 - name;
type->name = strndup(name, ret);
+ if (IS(type->name, "__VALIST") || IS(type->name, "va_list"))
+ type->is_va_list = 1;
if (IS(type->name, "VOID"))
memcpy(type->name, "void", 4);
return 0;
}
+static int parse_protostr(char *protostr, struct parsed_proto *pp);
+
+static int parse_arg(char **p_, struct parsed_proto_arg *arg, int xarg)
+{
+ char buf[256];
+ char *p = *p_;
+ char *pe;
+ int ret;
+
+ arg->pp = calloc(1, sizeof(*arg->pp));
+ my_assert_not(arg->pp, NULL);
+ arg->pp->is_arg = 1;
+
+ pe = p;
+ while (1) {
+ pe = strpbrk(pe, ",()");
+ if (pe == NULL)
+ return -1;
+ if (*pe == ',' || *pe == ')')
+ break;
+ pe = strchr(pe, ')');
+ if (pe == NULL)
+ return -1;
+ pe++;
+ }
+
+ if (pe - p > sizeof(buf) - 1)
+ return -1;
+ memcpy(buf, p, pe - p);
+ buf[pe - p] = 0;
+
+ ret = parse_protostr(buf, arg->pp);
+ if (ret < 0)
+ return -1;
+
+ if (IS_START(arg->pp->name, "guess"))
+ arg->pp->is_guessed = 1;
+
+ // we don't use actual names right now...
+ snprintf(arg->pp->name, sizeof(arg->pp->name), "a%d", xarg);
+
+ if (!arg->type.is_struct)
+ // we'll treat it as void * for non-calls
+ arg->type.name = strdup("void *");
+ arg->type.is_ptr = 1;
+
+ p += ret;
+ *p_ = p;
+ return 0;
+}
+
static int parse_protostr(char *protostr, struct parsed_proto *pp)
{
struct parsed_proto_arg *arg;
char regparm[16];
char buf[256];
char cconv[32];
- int xarg = 0;
+ int is_retreg;
char *p, *p1;
+ int xarg = 0;
int i, l;
int ret;
p = sskip(p + 2);
}
- // strip unneeded stuff
+ // allow start of line comment
+ if (p[0] == '/' && p[1] == '*') {
+ p = strstr(p + 2, "*/");
+ if (p == NULL) {
+ printf("%s:%d: multiline comments unsupported\n",
+ hdrfn, hdrfline);
+ return -1;
+ }
+ p = sskip(p + 2);
+ }
+
+ // we need remaining hints in comments, so strip / *
for (p1 = p; p1[0] != 0 && p1[1] != 0; p1++) {
if ((p1[0] == '/' && p1[1] == '*')
|| (p1[0] == '*' && p1[1] == '/'))
p = sskip(p + l + 1);
}
+ if (IS_START(p, "DECL_IMPORT ")) {
+ pp->is_import = 1;
+ p = sskip(p + 12);
+ }
+
ret = check_type(p, &pp->ret_type);
if (ret <= 0) {
printf("%s:%d:%zd: unhandled return in '%s'\n",
if (!strchr(p, ')')) {
p = next_idt(buf, sizeof(buf), p);
p = sskip(p);
- if (buf[0] == 0) {
- printf("%s:%d:%zd: var name missing\n",
+ if (!pp->is_arg && buf[0] == 0) {
+ printf("%s:%d:%zd: var name is missing\n",
hdrfn, hdrfline, (p - protostr) + 1);
return -1;
}
pp->is_stdcall = 1; // IDA
else if (IS(cconv, "__usercall"))
pp->is_stdcall = 0; // IDA
- else if (IS(cconv, "WINAPI"))
+ else if (IS(cconv, "__userstack")) {
+ pp->is_stdcall = 0; // custom
+ pp->is_userstack = 1;
+ }
+ else if (IS(cconv, "WINAPI") || IS(cconv, "PASCAL"))
pp->is_stdcall = 1;
else {
printf("%s:%d:%zd: unhandled cconv: '%s'\n",
}
strcpy(pp->name, buf);
- ret = get_regparm(regparm, sizeof(regparm), p);
+ ret = get_regparm(regparm, sizeof(regparm), p, &is_retreg);
if (ret > 0) {
if (!IS(regparm, "eax") && !IS(regparm, "ax")
&& !IS(regparm, "al") && !IS(regparm, "edx:eax"))
}
p = sskip(p + ret);
- if (*p == '(') {
- // func ptr
- arg->fptr = calloc(1, sizeof(*arg->fptr));
- ret = parse_protostr(p1, arg->fptr);
+ if (*p == '(' || arg->type.is_struct) {
+ // func ptr or struct
+ ret = parse_arg(&p1, arg, xarg);
if (ret < 0) {
printf("%s:%d:%zd: funcarg parse failed\n",
hdrfn, hdrfline, p1 - protostr);
return -1;
}
- arg->fptr->is_arg = 1;
- // we don't use actual names right now..
- snprintf(arg->fptr->name,
- sizeof(arg->fptr->name), "a%d", xarg);
- // we'll treat it as void * for non-calls
- arg->type.name = strdup("void *");
- arg->type.is_ptr = 1;
-
- p = p1 + ret;
+ p = p1;
}
p = next_idt(buf, sizeof(buf), p);
#endif
arg->reg = NULL;
- ret = get_regparm(regparm, sizeof(regparm), p);
+ ret = get_regparm(regparm, sizeof(regparm), p, &is_retreg);
if (ret > 0) {
p += ret;
p = sskip(p);
arg->reg = strdup(map_reg(regparm));
+ arg->type.is_retreg = is_retreg;
+ pp->has_retreg |= is_retreg;
+ }
+
+ if (IS(arg->type.name, "float")
+ || IS(arg->type.name, "double"))
+ {
+ arg->type.is_float = 1;
}
- if (strstr(arg->type.name, "int64")
- || IS(arg->type.name, "double"))
+ if (!arg->type.is_ptr && (strstr(arg->type.name, "int64")
+ || IS(arg->type.name, "double")))
{
+ arg->type.is_64bit = 1;
// hack..
- free(arg->type.name);
- arg->type.name = strdup("int");
pp_copy_arg(&pp->arg[xarg], arg);
+ arg = &pp->arg[xarg];
xarg++;
+ free(arg->type.name);
+ arg->type.name = strdup("dummy");
}
ret = check_struct_arg(arg);
return strcmp(pp1->name, pp2->name);
}
+static int ps_name_cmp(const void *p1, const void *p2)
+{
+ const struct parsed_struct *ps1 = p1, *ps2 = p2;
+ return strcmp(ps1->name, ps2->name);
+}
+
+// parsed struct cache
+static struct parsed_struct *ps_cache;
+static int ps_cache_size;
+static int ps_cache_alloc;
+
+static int struct_handler(FILE *fhdr, char *proto, int *line)
+{
+ struct parsed_struct *ps;
+ char lstr[256], *p;
+ int offset = 0;
+ int m = 0;
+ int ret;
+
+ if (ps_cache_size >= ps_cache_alloc) {
+ ps_cache_alloc = ps_cache_alloc * 2 + 64;
+ ps_cache = realloc(ps_cache, ps_cache_alloc
+ * sizeof(ps_cache[0]));
+ my_assert_not(ps_cache, NULL);
+ memset(ps_cache + ps_cache_size, 0,
+ (ps_cache_alloc - ps_cache_size)
+ * sizeof(ps_cache[0]));
+ }
+
+ ps = &ps_cache[ps_cache_size++];
+ ret = sscanf(proto, "struct %255s {", ps->name);
+ if (ret != 1) {
+ printf("%s:%d: struct parse failed\n", hdrfn, *line);
+ return -1;
+ }
+
+ while (fgets(lstr, sizeof(lstr), fhdr))
+ {
+ (*line)++;
+
+ p = sskip(lstr);
+ if (p[0] == '/' && p[1] == '/')
+ continue;
+ if (p[0] == '}')
+ break;
+
+ if (m >= ARRAY_SIZE(ps->members)) {
+ printf("%s:%d: too many struct members\n",
+ hdrfn, *line);
+ return -1;
+ }
+
+ hdrfline = *line;
+ ret = parse_protostr(p, &ps->members[m].pp);
+ if (ret < 0) {
+ printf("%s:%d: struct member #%d/%02x "
+ "doesn't parse\n", hdrfn, *line,
+ m, offset);
+ return -1;
+ }
+ ps->members[m].offset = offset;
+ offset += 4;
+ m++;
+ }
+
+ ps->member_count = m;
+
+ return 0;
+}
+
+// parsed proto cache
static struct parsed_proto *pp_cache;
static int pp_cache_size;
static int pp_cache_alloc;
-static int b_pp_c_handler(char *proto, const char *fname)
+static int b_pp_c_handler(char *proto, const char *fname,
+ int is_include, int is_osinc, int is_cinc)
{
int ret;
if (ret < 0)
return -1;
+ pp_cache[pp_cache_size].is_include = is_include;
+ pp_cache[pp_cache_size].is_osinc = is_osinc;
+ pp_cache[pp_cache_size].is_cinc = is_cinc;
pp_cache_size++;
return 0;
}
-static void build_pp_cache(FILE *fhdr)
+static void build_caches(FILE *fhdr)
{
long pos;
int ret;
pos = ftell(fhdr);
rewind(fhdr);
- ret = do_protostrs(fhdr, hdrfn);
+ ret = do_protostrs(fhdr, hdrfn, 0);
if (ret < 0)
exit(1);
qsort(pp_cache, pp_cache_size, sizeof(pp_cache[0]), pp_name_cmp);
+ qsort(ps_cache, ps_cache_size, sizeof(ps_cache[0]), ps_name_cmp);
fseek(fhdr, pos, SEEK_SET);
}
{
const struct parsed_proto *pp_ret;
struct parsed_proto pp_search;
+ char *p;
if (pp_cache == NULL)
- build_pp_cache(fhdr);
+ build_caches(fhdr);
- if (sym[0] == '_') // && strncmp(fname, "stdc", 4) == 0)
+ // ugh...
+ if (sym[0] == '_' && !IS_START(sym, "__W"))
sym++;
strcpy(pp_search.name, sym);
+ p = strchr(pp_search.name, '@');
+ if (p != NULL)
+ *p = 0;
+
pp_ret = bsearch(&pp_search, pp_cache, pp_cache_size,
sizeof(pp_cache[0]), pp_name_cmp);
if (pp_ret == NULL && !quiet)
return pp_ret;
}
+static const struct parsed_proto *proto_lookup_struct(FILE *fhdr,
+ const char *type, int offset)
+{
+ struct parsed_struct ps_search, *ps;
+ int m;
+
+ if (pp_cache == NULL)
+ build_caches(fhdr);
+ if (ps_cache_size == 0)
+ return NULL;
+
+ while (my_isblank(*type))
+ type++;
+ if (!strncmp(type, "struct", 6) && my_isblank(type[6]))
+ type += 7;
+
+ if (sscanf(type, "%255s", ps_search.name) != 1)
+ return NULL;
+
+ ps = bsearch(&ps_search, ps_cache, ps_cache_size,
+ sizeof(ps_cache[0]), ps_name_cmp);
+ if (ps == NULL) {
+ printf("%s: struct '%s' is missing\n",
+ hdrfn, ps_search.name);
+ return NULL;
+ }
+
+ for (m = 0; m < ps->member_count; m++) {
+ if (ps->members[m].offset == offset)
+ return &ps->members[m].pp;
+ }
+
+ return NULL;
+}
+
static void pp_copy_arg(struct parsed_proto_arg *d,
const struct parsed_proto_arg *s)
{
d->type.name = strdup(s->type.name);
my_assert_not(d->type.name, NULL);
}
- if (s->fptr != NULL) {
- d->fptr = malloc(sizeof(*d->fptr));
- my_assert_not(d->fptr, NULL);
- memcpy(d->fptr, s->fptr, sizeof(*d->fptr));
+ if (s->pp != NULL) {
+ d->pp = malloc(sizeof(*d->pp));
+ my_assert_not(d->pp, NULL);
+ memcpy(d->pp, s->pp, sizeof(*d->pp));
}
}
return pp;
}
+
+static inline int pp_cmp_func(const struct parsed_proto *pp1,
+ const struct parsed_proto *pp2)
+{
+ int i;
+
+ if (pp1->argc != pp2->argc || pp1->argc_reg != pp2->argc_reg)
+ return 1;
+ else {
+ for (i = 0; i < pp1->argc; i++) {
+ if ((pp1->arg[i].reg != NULL) != (pp2->arg[i].reg != NULL))
+ return 1;
+
+ if ((pp1->arg[i].reg != NULL)
+ && !IS(pp1->arg[i].reg, pp2->arg[i].reg))
+ {
+ return 1;
+ }
+ }
+ }
+
+ return 0;
+}
+
static inline void pp_print(char *buf, size_t buf_size,
const struct parsed_proto *pp)
{
free(pp->arg[i].reg);
if (pp->arg[i].type.name != NULL)
free(pp->arg[i].type.name);
- if (pp->arg[i].fptr != NULL)
- free(pp->arg[i].fptr);
+ if (pp->arg[i].pp != NULL)
+ free(pp->arg[i].pp);
}
if (pp->ret_type.name != NULL)
free(pp->ret_type.name);
free(pp);
+
+ (void)proto_lookup_struct;
}