make run_imp.sh more generic, add run_exp.sh
[ia32rtools.git] / plugin / saveasm.cpp
CommitLineData
d8891fcc 1#define NO_OBSOLETE_FUNCS
2#include <ida.hpp>
3#include <idp.hpp>
4#include <bytes.hpp>
5#include <loader.hpp>
6#include <kernwin.hpp>
7
8#include <name.hpp>
9#include <frame.hpp>
10#include <struct.hpp>
11#include <auto.hpp>
15c7b2a4 12#include <intel.hpp>
d8891fcc 13
// IS_START(w, y): non-zero when string w begins with string y.
// Note that y is evaluated twice, so pass side-effect free expressions.
#define IS_START(w, y) (!strncmp((w), (y), strlen(y)))
// ARRAY_SIZE(x): element count of a true array (not of a pointer).
#define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0]))
16
15c7b2a4 17// non-local branch targets
18static ea_t *nonlocal_bt;
19static int nonlocal_bt_alloc;
20static int nonlocal_bt_cnt;
21
d8891fcc 22//--------------------------------------------------------------------------
23static int idaapi init(void)
24{
25 return PLUGIN_OK;
26}
27
28//--------------------------------------------------------------------------
29static void idaapi term(void)
30{
15c7b2a4 31 if (nonlocal_bt != NULL) {
32 free(nonlocal_bt);
33 nonlocal_bt = NULL;
34 }
35 nonlocal_bt_alloc = 0;
d8891fcc 36}
37
38//--------------------------------------------------------------------------
39
// Names that get renamed when they show up as frame member or global
// symbol names (presumably because masm treats them as keywords).
static const char *reserved_names[] = {
  "name",
  "type",
  "offset",
  "aam",
};

// Returns 1 if name equals one of reserved_names[], ignoring case,
// and 0 otherwise.
static int is_name_reserved(const char *name)
{
  const size_t count = sizeof(reserved_names) / sizeof(reserved_names[0]);
  size_t idx = 0;

  while (idx < count) {
    if (strcasecmp(name, reserved_names[idx]) == 0)
      return 1;
    idx++;
  }

  return 0;
}
56
15c7b2a4 57static int nonlocal_bt_cmp(const void *p1, const void *p2)
58{
59 const ea_t *e1 = (const ea_t *)p1, *e2 = (const ea_t *)p2;
60 return *e1 - *e2;
61}
62
63static void nonlocal_add(ea_t ea)
64{
65 if (nonlocal_bt_cnt >= nonlocal_bt_alloc) {
66 nonlocal_bt_alloc += nonlocal_bt_alloc * 2 + 64;
67 nonlocal_bt = (ea_t *)realloc(nonlocal_bt,
68 nonlocal_bt_alloc * sizeof(nonlocal_bt[0]));
69 if (nonlocal_bt == NULL) {
70 msg("OOM\n");
71 return;
72 }
73 }
74 nonlocal_bt[nonlocal_bt_cnt++] = ea;
75}
76
b587e6ae 77// is instruction a (un)conditional jump (not call)?
78static int is_insn_jmp(uint16 itype)
79{
80 return itype == NN_jmp || (NN_ja <= itype && itype <= NN_jz);
81}
82
d8891fcc 83static void do_def_line(char *buf, size_t buf_size, const char *line)
84{
15c7b2a4 85 char *endp = NULL;
86 ea_t ea, *ea_ret;
d8891fcc 87 int len;
88
89 tag_remove(line, buf, buf_size); // remove color codes
90 len = strlen(buf);
91 if (len < 9) {
92 buf[0] = 0;
93 return;
94 }
95 memmove(buf, buf + 9, len - 9 + 1); // rm address
15c7b2a4 96
97 if (IS_START(buf, "loc_")) {
98 ea = strtoul(buf + 4, &endp, 16);
99 if (ea != 0 && *endp == ':') {
100 ea_ret = (ea_t *)bsearch(&ea, nonlocal_bt, nonlocal_bt_cnt,
101 sizeof(nonlocal_bt[0]), nonlocal_bt_cmp);
102 if (ea_ret != 0) {
103 if (endp[1] != ' ')
104 msg("no trailing blank in '%s'\n", buf);
105 else
106 endp[1] = ':';
107 }
108 }
109 }
d8891fcc 110}
111
112static void idaapi run(int /*arg*/)
113{
15c7b2a4 114 // isEnabled(ea) // address belongs to disassembly
d8891fcc 115 // ea_t ea = get_screen_ea();
15c7b2a4 116 // foo = DecodeInstruction(ScreenEA());
d8891fcc 117 FILE *fout = NULL;
118 int fout_line = 0;
119 char buf[MAXSTR];
1caf86bb 120 char buf2[MAXSTR];
b587e6ae 121 const char *name;
d8891fcc 122 struc_t *frame;
123 func_t *func;
15c7b2a4 124 ea_t ui_ea_block = 0, ea_size;
125 ea_t tmp_ea, target_ea;
d8891fcc 126 ea_t ea;
b587e6ae 127 flags_t ea_flags;
1caf86bb 128 uval_t idx;
d8891fcc 129 int i, o, m, n;
130 int ret;
131 char *p;
132
15c7b2a4 133 nonlocal_bt_cnt = 0;
134
1caf86bb 135 // get rid of structs, masm doesn't understand them
136 idx = get_first_struc_idx();
137 while (idx != BADNODE) {
138 tid_t tid = get_struc_by_idx(idx);
139 struc_t *struc = get_struc(tid);
140 get_struc_name(tid, buf, sizeof(buf));
141 msg("removing struct '%s'\n", buf);
142 //del_struc_members(struc, 0, get_max_offset(struc));
143 del_struc(struc);
144
145 idx = get_first_struc_idx();
146 }
147
15c7b2a4 148 // 1st pass: walk through all funcs
149 func = get_func(inf.minEA);
d8891fcc 150 while (func != NULL)
151 {
15c7b2a4 152 func_tail_iterator_t fti(func);
153 if (!fti.main()) {
154 msg("%x: func_tail_iterator_t main failed\n", ea);
155 return;
156 }
157 const area_t &f_area = fti.chunk();
158 ea = f_area.startEA;
159
160 // rename global syms which conflict with frame member names
d8891fcc 161 frame = get_frame(func);
162 if (frame != NULL)
163 {
164 for (m = 0; m < (int)frame->memqty; m++)
165 {
166 ret = get_member_name(frame->members[m].id, buf, sizeof(buf));
167 if (ret <= 0) {
168 msg("%x: member has no name?\n", ea);
169 return;
170 }
171 if (buf[0] == ' ') // what's this?
172 continue;
173 if (IS_START(buf, "arg_") || IS_START(buf, "var_"))
174 continue;
175
1caf86bb 176 // check for dupe names
177 int m1, dupe = 0;
178 for (m1 = 0; m1 < m; m1++) {
179 get_member_name(frame->members[m1].id, buf2, sizeof(buf2));
180 if (stricmp(buf, buf2) == 0)
181 dupe = 1;
182 }
183
184 if (is_name_reserved(buf) || dupe) {
d8891fcc 185 msg("%x: renaming '%s'\n", ea, buf);
186 qstrncat(buf, "_", sizeof(buf));
187 ret = set_member_name(frame, frame->members[m].soff, buf);
188 if (!ret) {
189 msg("%x: renaming failed\n", ea);
190 return;
191 }
192 }
193
194 tmp_ea = get_name_ea(ea, buf);
195 if (tmp_ea == 0 || tmp_ea == ~0)
196 continue;
197
198 msg("%x: from %x: renaming '%s'\n", tmp_ea, ea, buf);
199 qstrncat(buf, "_g", sizeof(buf));
200 set_name(tmp_ea, buf);
201 }
202 }
203
204 func = get_next_func(ea);
15c7b2a4 205 }
206
b587e6ae 207 // 2nd pass over whole .text and .(ro)data segments
15c7b2a4 208 for (ea = inf.minEA; ea != BADADDR; ea = next_head(ea, inf.maxEA))
209 {
210 segment_t *seg = getseg(ea);
b587e6ae 211 if (!seg)
212 break;
213 if (seg->type == SEG_XTRN)
214 continue;
215 if (seg->type != SEG_CODE && seg->type != SEG_DATA)
15c7b2a4 216 break;
217
b587e6ae 218 ea_flags = get_flags_novalue(ea);
15c7b2a4 219 func = get_func(ea);
220 if (isCode(ea_flags))
221 {
222 if (!decode_insn(ea)) {
223 msg("%x: decode_insn() failed\n", ea);
224 continue;
225 }
226
b587e6ae 227 // masm doesn't understand IDA's float/xmm types
228 if (cmd.itype == NN_fld || cmd.itype == NN_fst
229 || cmd.itype == NN_movapd || cmd.itype == NN_movlpd)
230 {
231 for (o = 0; o < UA_MAXOP; o++) {
232 if (cmd.Operands[o].type == o_void)
233 break;
234
235 if (cmd.Operands[o].type == o_mem) {
236 tmp_ea = cmd.Operands[o].addr;
237 flags_t tmp_ea_flags = get_flags_novalue(tmp_ea);
238 if (!isUnknown(tmp_ea_flags)) {
239 buf[0] = 0;
240 get_name(ea, tmp_ea, buf, sizeof(buf));
241 msg("%x: undefining %x '%s'\n", ea, tmp_ea, buf);
242 do_unknown(tmp_ea, DOUNK_EXPAND);
243 }
244 }
245 }
246 }
1caf86bb 247 // detect code alignment
248 else if (cmd.itype == NN_lea) {
249 if (cmd.Operands[0].reg == cmd.Operands[1].reg
250 && cmd.Operands[1].type == o_displ
251 && cmd.Operands[1].addr == 0)
252 {
253 tmp_ea = next_head(ea, inf.maxEA);
254 if ((tmp_ea & 0x03) == 0) {
255 n = calc_max_align(tmp_ea);
256 if (n > 4) // masm doesn't like more..
257 n = 4;
258 msg("%x: align %d\n", ea, 1 << n);
259 do_unknown(ea, DOUNK_SIMPLE);
260 doAlign(ea, tmp_ea - ea, n);
261 }
262 }
263 }
b587e6ae 264
15c7b2a4 265 // find non-local branches
b587e6ae 266 if (is_insn_jmp(cmd.itype) && cmd.Operands[0].type == o_near)
15c7b2a4 267 {
268 target_ea = cmd.Operands[0].addr;
269 if (func == NULL)
270 nonlocal_add(target_ea);
271 else {
272 ret = get_func_chunknum(func, target_ea);
273 if (ret != 0) {
274 // a jump to another func or chunk
275 // check if it lands on func start
276 if (!isFunc(get_flags_novalue(target_ea)))
277 nonlocal_add(target_ea);
278 }
279 }
280 }
281 }
282 else { // not code
1caf86bb 283 int do_undef = 0;
284 ea_size = get_item_size(ea);
285
15c7b2a4 286 if (func == NULL && isOff0(ea_flags)) {
15c7b2a4 287 for (tmp_ea = 0; tmp_ea < ea_size; tmp_ea += 4)
288 nonlocal_add(get_long(ea + tmp_ea));
289 }
b587e6ae 290
291 // IDA vs masm float/mmx/xmm type incompatibility
292 if (isDouble(ea_flags) || isTbyt(ea_flags)
293 || isPackReal(ea_flags))
294 {
1caf86bb 295 do_undef = 1;
296 }
297 else if (isOwrd(ea_flags)) {
b587e6ae 298 buf[0] = 0;
299 get_name(BADADDR, ea, buf, sizeof(buf));
1caf86bb 300 if (IS_START(buf, "xmm"))
301 do_undef = 1;
302 }
303 // masm doesn't understand IDA's unicode
304 else if (isASCII(ea_flags) && ea_size >= 4
305 && (get_long(ea) & 0xff00ff00) == 0) // lame..
306 {
307 do_undef = 1;
308 }
309 // masm doesn't understand large aligns
310 else if (isAlign(ea_flags) && ea_size > 0x10) {
311 msg("%x: undefining align %d\n", ea, ea_size);
b587e6ae 312 do_unknown(ea, DOUNK_EXPAND);
313 }
1caf86bb 314
315 if (do_undef) {
b587e6ae 316 buf[0] = 0;
317 get_name(BADADDR, ea, buf, sizeof(buf));
1caf86bb 318 msg("%x: undefining '%s'\n", ea, buf);
319 do_unknown(ea, DOUNK_EXPAND);
b587e6ae 320 }
321 }
322 }
323
324 // check namelist for reserved names
325 n = get_nlist_size();
326 for (i = 0; i < n; i++) {
327 ea = get_nlist_ea(i);
328 name = get_nlist_name(i);
329 if (name == NULL) {
330 msg("%x: null name?\n", ea);
331 continue;
332 }
333
334 if (is_name_reserved(name)) {
335 msg("%x: renaming name '%s'\n", ea, name);
336 qsnprintf(buf, sizeof(buf), "%s_g", name);
337 set_name(ea, buf);
15c7b2a4 338 }
339 }
340
341 if (nonlocal_bt_cnt > 1) {
342 qsort(nonlocal_bt, nonlocal_bt_cnt,
343 sizeof(nonlocal_bt[0]), nonlocal_bt_cmp);
d8891fcc 344 }
345
346 char *fname = askfile_c(1, NULL, "Save asm file");
347 if (fname == NULL)
348 return;
349 fout = qfopen(fname, "w");
350 if (fout == NULL) {
351 msg("couldn't open '%s'\n", fname);
352 return;
353 }
354
355 show_wait_box("Saving..");
356
357 // deal with the beginning
358 ea = inf.minEA;
359 int flags = 0; // calc_default_idaplace_flags();
360 linearray_t ln(&flags);
361 idaplace_t pl;
362 pl.ea = ea;
363 pl.lnnum = 0;
364 ln.set_place(&pl);
365 n = ln.get_linecnt();
366 for (i = 0; i < n - 1; i++) {
367 do_def_line(buf, sizeof(buf), ln.down());
368 if (strstr(buf, "include"))
369 continue;
370
371 fout_line++;
372 qfprintf(fout, "%s\n", buf);
373 p = strstr(buf, ".mmx");
374 if (p != NULL) {
375 memcpy(p, ".xmm", 4);
376 fout_line++;
377 qfprintf(fout, "%s\n", buf);
378 }
379 }
b587e6ae 380 pl.lnnum = i;
d8891fcc 381
382 for (;;)
383 {
1caf86bb 384 int drop_large = 0, drop_rva = 0, set_scale = 0, jmp_near = 0;
385 int word_imm = 0, dword_imm = 0, do_pushf = 0;
15c7b2a4 386
d8891fcc 387 if ((ea >> 14) != ui_ea_block) {
388 ui_ea_block = ea >> 14;
389 showAddr(ea);
390 if (wasBreak())
391 break;
392 }
393
394 segment_t *seg = getseg(ea);
b587e6ae 395 if (!seg || (seg->type != SEG_CODE && seg->type != SEG_DATA))
d8891fcc 396 goto pass;
397
b587e6ae 398 ea_flags = get_flags_novalue(ea);
399 if (isCode(ea_flags))
400 {
401 if (!decode_insn(ea))
402 goto pass;
d8891fcc 403
1caf86bb 404 if (is_insn_jmp(cmd.itype) && cmd.Operands[0].type == o_near
405 && cmd.Operands[0].dtyp == dt_dword)
406 {
407 jmp_near = 1;
408 }
409 else if ((cmd.itype == NN_pushf || cmd.itype == NN_popf)
410 && natop())
411 {
412 do_pushf = 1;
413 }
414
b587e6ae 415 for (o = 0; o < UA_MAXOP; o++) {
1caf86bb 416 const op_t &opr = cmd.Operands[o];
417 if (opr.type == o_void)
b587e6ae 418 break;
d8891fcc 419
1caf86bb 420 // correct?
421 if (opr.type == o_mem && opr.specval_shorts.high == 0x21)
b587e6ae 422 drop_large = 1;
1caf86bb 423 if (opr.hasSIB && x86_scale(opr) == 0
424 && x86_index(opr) != INDEX_NONE)
425 {
426 set_scale = 1;
427 }
428 // annoying alignment variant..
429 if (opr.type == o_imm && opr.dtyp == dt_dword
430 && (opr.value < 0x80 || opr.value > 0xffffff80)
431 && cmd.size >= opr.offb + 4)
432 {
433 if (get_long(ea + opr.offb) == opr.value)
434 dword_imm = 1;
435 }
436 else if (opr.type == o_imm && opr.dtyp == dt_word
437 && (opr.value < 0x80 || opr.value > 0xff80)
438 && cmd.size >= opr.offb + 2)
439 {
440 if (get_word(ea + opr.offb) == (ushort)opr.value)
441 word_imm = 1;
15c7b2a4 442 }
15c7b2a4 443 }
b587e6ae 444 }
445 else { // not code
446 if (isOff0(ea_flags))
447 drop_rva = 1;
d8891fcc 448 }
449
450pass:
b587e6ae 451 n = ln.get_linecnt();
452 for (i = pl.lnnum; i < n; i++) {
453 do_def_line(buf, sizeof(buf), ln.down());
15c7b2a4 454
1caf86bb 455 // patches..
b587e6ae 456 if (drop_large) {
457 p = strstr(buf, "large ");
458 if (p != NULL)
459 memmove(p, p + 6, strlen(p + 6) + 1);
460 }
461 while (drop_rva) {
462 p = strstr(buf, " rva ");
463 if (p == NULL)
464 break;
465 memmove(p, p + 4, strlen(p + 4) + 1);
466 }
1caf86bb 467 if (set_scale) {
468 p = strchr(buf, '[');
469 if (p != NULL)
470 p = strchr(p, '+');
471 if (p != NULL && p[1] == 'e') {
472 p += 4;
473 // scale is 1, must specify it explicitly so that
474 // masm chooses the right scaled reg
475 memmove(p + 2, p, strlen(p) + 1);
476 memcpy(p, "*1", 2);
477 }
478 }
479 else if (jmp_near) {
480 p = strchr(buf, 'j');
481 while (p && *p != ' ')
482 p++;
483 while (p && *p == ' ')
484 p++;
485 if (p != NULL) {
486 memmove(p + 9, p, strlen(p) + 1);
487 memcpy(p, "near ptr ", 9);
488 }
489 }
490 if (word_imm) {
491 p = strstr(buf, ", ");
492 if (p != NULL && '0' <= p[2] && p[2] <= '9') {
493 p += 2;
494 memmove(p + 9, p, strlen(p) + 1);
495 memcpy(p, "word ptr ", 9);
496 }
497 }
498 else if (dword_imm) {
499 p = strstr(buf, ", ");
500 if (p != NULL && '0' <= p[2] && p[2] <= '9') {
501 p += 2;
502 memmove(p + 10, p, strlen(p) + 1);
503 memcpy(p, "dword ptr ", 10);
504 }
505 }
506 else if (do_pushf) {
507 p = strstr(buf, "pushf");
508 if (p == NULL)
509 p = strstr(buf, "popf");
510 if (p != NULL) {
511 p = strchr(p, 'f') + 1;
512 memmove(p + 1, p, strlen(p) + 1);
513 *p = 'd';
514 }
515 }
b587e6ae 516
517 fout_line++;
518 qfprintf(fout, "%s\n", buf);
519 }
d8891fcc 520
15c7b2a4 521 // note: next_head skips some undefined stuff
d8891fcc 522 ea = next_not_tail(ea); // correct?
15c7b2a4 523 if (ea == BADADDR)
d8891fcc 524 break;
525
526 pl.ea = ea;
527 pl.lnnum = 0;
528 ln.set_place(&pl);
d8891fcc 529 }
530
531 if (fout != NULL)
532 qfclose(fout);
15c7b2a4 533 if (fname != NULL)
534 qfree(fname);
d8891fcc 535
536 hide_wait_box();
537 msg("%d lines saved.\n", fout_line);
538}
539
540//--------------------------------------------------------------------------
541
542static const char comment[] = "Generate disassembly lines for one address";
543static const char help[] = "Generate asm file\n";
544static const char wanted_name[] = "Save asm";
545static const char wanted_hotkey[] = "Ctrl-F6";
546
547//--------------------------------------------------------------------------
548//
549// PLUGIN DESCRIPTION BLOCK
550//
551//--------------------------------------------------------------------------
552plugin_t PLUGIN =
553{
554 IDP_INTERFACE_VERSION,
555 0, // plugin flags
556 init, // initialize
557 term, // terminate. this pointer may be NULL.
558 run, // invoke plugin
559 comment, // long comment about the plugin
560 // it could appear in the status line
561 // or as a hint
562 help, // multiline help about the plugin
563 wanted_name, // the preferred short name of the plugin
564 wanted_hotkey // the preferred hotkey to run the plugin
565};
566
567// vim:ts=2:shiftwidth=2:expandtab