allow to add symbols for host_dasm
[picodrive.git] / cpu / drc / emit_x86.c
CommitLineData
3863edbd 1/*
8b4f38f4 2 * note:
3 * temp registers must be eax-edx due to use of SETcc.
f0d7b1fa 4 * note about silly things like emith_eor_r_r_r:
8b4f38f4 5 * these are here because the compiler was designed
6 * for ARM as it's primary target.
3863edbd 7 */
679af8a3 8#include <stdarg.h>
9
f4bb5d6b 10enum { xAX = 0, xCX, xDX, xBX, xSP, xBP, xSI, xDI };
11
f4bb5d6b 12#define CONTEXT_REG xBP
679af8a3 13
18b94127 14#define ICOND_JO 0x00
15#define ICOND_JNO 0x01
16#define ICOND_JB 0x02
17#define ICOND_JAE 0x03
18#define ICOND_JE 0x04
19#define ICOND_JNE 0x05
20#define ICOND_JBE 0x06
21#define ICOND_JA 0x07
22#define ICOND_JS 0x08
23#define ICOND_JNS 0x09
24#define ICOND_JL 0x0c
25#define ICOND_JGE 0x0d
26#define ICOND_JLE 0x0e
27#define ICOND_JG 0x0f
28
29#define IOP_JMP 0xeb
80599a42 30
31// unified conditions (we just use rel8 jump instructions for x86)
18b94127 32#define DCOND_EQ ICOND_JE
33#define DCOND_NE ICOND_JNE
34#define DCOND_MI ICOND_JS // MInus
35#define DCOND_PL ICOND_JNS // PLus or zero
36#define DCOND_HI ICOND_JA // higher (unsigned)
37#define DCOND_HS ICOND_JAE // higher || same (unsigned)
38#define DCOND_LO ICOND_JB // lower (unsigned)
39#define DCOND_LS ICOND_JBE // lower || same (unsigned)
40#define DCOND_GE ICOND_JGE // greater || equal (signed)
41#define DCOND_GT ICOND_JG // greater (signed)
42#define DCOND_LE ICOND_JLE // less || equal (signed)
43#define DCOND_LT ICOND_JL // less (signed)
44#define DCOND_VS ICOND_JO // oVerflow Set
45#define DCOND_VC ICOND_JNO // oVerflow Clear
80599a42 46
679af8a3 47#define EMIT_PTR(ptr, val, type) \
48 *(type *)(ptr) = val
49
50#define EMIT(val, type) { \
51 EMIT_PTR(tcache_ptr, val, type); \
f4bb5d6b 52 tcache_ptr += sizeof(type); \
679af8a3 53}
54
e898de13 55#define EMIT_OP(op) { \
56 COUNT_OP; \
57 EMIT(op, u8); \
58}
59
679af8a3 60#define EMIT_MODRM(mod,r,rm) \
61 EMIT(((mod)<<6) | ((r)<<3) | (rm), u8)
62
f0d7b1fa 63#define EMIT_SIB(scale,index,base) \
64 EMIT(((scale)<<6) | ((index)<<3) | (base), u8)
65
679af8a3 66#define EMIT_OP_MODRM(op,mod,r,rm) { \
e898de13 67 EMIT_OP(op); \
679af8a3 68 EMIT_MODRM(mod, r, rm); \
69}
70
80599a42 71#define JMP8_POS(ptr) \
72 ptr = tcache_ptr; \
73 tcache_ptr += 2
74
75#define JMP8_EMIT(op, ptr) \
18b94127 76 EMIT_PTR(ptr, 0x70|(op), u8); \
77 EMIT_PTR(ptr + 1, (tcache_ptr - (ptr+2)), u8)
78
79#define JMP8_EMIT_NC(ptr) \
80 EMIT_PTR(ptr, IOP_JMP, u8); \
80599a42 81 EMIT_PTR(ptr + 1, (tcache_ptr - (ptr+2)), u8)
82
3863edbd 83// _r_r
679af8a3 84#define emith_move_r_r(dst, src) \
85 EMIT_OP_MODRM(0x8b, 3, dst, src)
86
80599a42 87#define emith_add_r_r(d, s) \
88 EMIT_OP_MODRM(0x01, 3, s, d)
89
90#define emith_sub_r_r(d, s) \
91 EMIT_OP_MODRM(0x29, 3, s, d)
92
3863edbd 93#define emith_adc_r_r(d, s) \
94 EMIT_OP_MODRM(0x11, 3, s, d)
95
96#define emith_sbc_r_r(d, s) \
97 EMIT_OP_MODRM(0x19, 3, s, d) /* SBB */
98
80599a42 99#define emith_or_r_r(d, s) \
100 EMIT_OP_MODRM(0x09, 3, s, d)
101
3863edbd 102#define emith_and_r_r(d, s) \
103 EMIT_OP_MODRM(0x21, 3, s, d)
104
80599a42 105#define emith_eor_r_r(d, s) \
3863edbd 106 EMIT_OP_MODRM(0x31, 3, s, d) /* XOR */
107
108#define emith_tst_r_r(d, s) \
109 EMIT_OP_MODRM(0x85, 3, s, d) /* TEST */
110
111#define emith_cmp_r_r(d, s) \
112 EMIT_OP_MODRM(0x39, 3, s, d)
80599a42 113
114// fake teq - test equivalence - get_flags(d ^ s)
115#define emith_teq_r_r(d, s) { \
116 emith_push(d); \
117 emith_eor_r_r(d, s); \
118 emith_pop(d); \
119}
120
52d759c3 121#define emith_mvn_r_r(d, s) { \
122 if (d != s) \
123 emith_move_r_r(d, s); \
124 EMIT_OP_MODRM(0xf7, 3, 2, d); /* NOT d */ \
125}
126
127#define emith_negc_r_r(d, s) { \
128 int tmp_ = rcache_get_tmp(); \
129 emith_move_r_imm(tmp_, 0); \
130 emith_sbc_r_r(tmp_, s); \
131 emith_move_r_r(d, tmp_); \
132 rcache_free_tmp(tmp_); \
133}
134
135#define emith_neg_r_r(d, s) { \
136 if (d != s) \
137 emith_move_r_r(d, s); \
138 EMIT_OP_MODRM(0xf7, 3, 3, d); /* NEG d */ \
139}
140
3863edbd 141// _r_r_r
142#define emith_eor_r_r_r(d, s1, s2) { \
52d759c3 143 if (d == s1) { \
144 emith_eor_r_r(d, s2); \
145 } else if (d == s2) { \
146 emith_eor_r_r(d, s1); \
147 } else { \
3863edbd 148 emith_move_r_r(d, s1); \
52d759c3 149 emith_eor_r_r(d, s2); \
150 } \
3863edbd 151}
152
f0d7b1fa 153// _r_r_shift
154#define emith_or_r_r_lsl(d, s, lslimm) { \
52d759c3 155 int tmp_ = rcache_get_tmp(); \
f0d7b1fa 156 emith_lsl(tmp_, s, lslimm); \
157 emith_or_r_r(d, tmp_); \
52d759c3 158 rcache_free_tmp(tmp_); \
3863edbd 159}
160
f0d7b1fa 161// d != s
162#define emith_eor_r_r_lsr(d, s, lsrimm) { \
163 emith_push(s); \
164 emith_lsr(s, s, lsrimm); \
165 emith_eor_r_r(d, s); \
166 emith_pop(s); \
167}
168
80599a42 169// _r_imm
679af8a3 170#define emith_move_r_imm(r, imm) { \
e898de13 171 EMIT_OP(0xb8 + (r)); \
679af8a3 172 EMIT(imm, u32); \
173}
174
52d759c3 175#define emith_move_r_imm_s8(r, imm) \
176 emith_move_r_imm(r, (u32)(signed int)(signed char)(imm))
177
18b94127 178#define emith_arith_r_imm(op, r, imm) do { \
80599a42 179 EMIT_OP_MODRM(0x81, 3, op, r); \
679af8a3 180 EMIT(imm, u32); \
18b94127 181} while (0)
679af8a3 182
52d759c3 183// 2 - adc, 3 - sbb
80599a42 184#define emith_add_r_imm(r, imm) \
185 emith_arith_r_imm(0, r, imm)
186
187#define emith_or_r_imm(r, imm) \
188 emith_arith_r_imm(1, r, imm)
189
190#define emith_and_r_imm(r, imm) \
191 emith_arith_r_imm(4, r, imm)
192
193#define emith_sub_r_imm(r, imm) \
194 emith_arith_r_imm(5, r, imm)
195
52d759c3 196#define emith_eor_r_imm(r, imm) \
197 emith_arith_r_imm(6, r, imm)
198
ed8cf79b 199#define emith_cmp_r_imm(r, imm) \
200 emith_arith_r_imm(7, r, imm)
201
18b94127 202#define emith_tst_r_imm(r, imm) do { \
80599a42 203 EMIT_OP_MODRM(0xf7, 3, 0, r); \
679af8a3 204 EMIT(imm, u32); \
18b94127 205} while (0)
679af8a3 206
80599a42 207// fake
208#define emith_bic_r_imm(r, imm) \
209 emith_arith_r_imm(4, r, ~(imm))
210
211// fake conditionals (using SJMP instead)
8796b7ee 212#define emith_move_r_imm_c(cond, r, imm) { \
213 (void)(cond); \
214 emith_move_r_imm(r, imm); \
215}
216
80599a42 217#define emith_add_r_imm_c(cond, r, imm) { \
218 (void)(cond); \
3863edbd 219 emith_add_r_imm(r, imm); \
80599a42 220}
221
222#define emith_or_r_imm_c(cond, r, imm) { \
223 (void)(cond); \
3863edbd 224 emith_or_r_imm(r, imm); \
80599a42 225}
226
f0d7b1fa 227#define emith_eor_r_imm_c(cond, r, imm) { \
228 (void)(cond); \
229 emith_eor_r_imm(r, imm); \
230}
231
80599a42 232#define emith_sub_r_imm_c(cond, r, imm) { \
233 (void)(cond); \
3863edbd 234 emith_sub_r_imm(r, imm); \
235}
236
237#define emith_bic_r_imm_c(cond, r, imm) { \
238 (void)(cond); \
239 emith_bic_r_imm(r, imm); \
80599a42 240}
241
52d759c3 242// _r_r_imm
243#define emith_and_r_r_imm(d, s, imm) { \
244 if (d != s) \
245 emith_move_r_r(d, s); \
18b94127 246 emith_and_r_imm(d, imm); \
52d759c3 247}
248
80599a42 249// shift
250#define emith_shift(op, d, s, cnt) { \
251 if (d != s) \
252 emith_move_r_r(d, s); \
253 EMIT_OP_MODRM(0xc1, 3, op, d); \
254 EMIT(cnt, u8); \
255}
256
80599a42 257#define emith_lsl(d, s, cnt) \
258 emith_shift(4, d, s, cnt)
259
3863edbd 260#define emith_lsr(d, s, cnt) \
261 emith_shift(5, d, s, cnt)
262
263#define emith_asr(d, s, cnt) \
264 emith_shift(7, d, s, cnt)
265
ed8cf79b 266#define emith_rol(d, s, cnt) \
267 emith_shift(0, d, s, cnt)
268
269#define emith_ror(d, s, cnt) \
270 emith_shift(1, d, s, cnt)
271
272#define emith_rolc(r) \
273 EMIT_OP_MODRM(0xd1, 3, 2, r)
274
275#define emith_rorc(r) \
276 EMIT_OP_MODRM(0xd1, 3, 3, r)
277
80599a42 278// misc
279#define emith_push(r) \
280 EMIT_OP(0x50 + (r))
281
282#define emith_pop(r) \
283 EMIT_OP(0x58 + (r))
284
285#define emith_neg_r(r) \
286 EMIT_OP_MODRM(0xf7, 3, 3, r)
287
288#define emith_clear_msb(d, s, count) { \
289 u32 t = (u32)-1; \
290 t >>= count; \
291 if (d != s) \
292 emith_move_r_r(d, s); \
293 emith_and_r_imm(d, t); \
294}
295
f0d7b1fa 296#define emith_clear_msb_c(cond, d, s, count) { \
297 (void)(cond); \
298 emith_clear_msb(d, s, count); \
299}
300
80599a42 301#define emith_sext(d, s, bits) { \
302 emith_lsl(d, s, 32 - (bits)); \
303 emith_asr(d, d, 32 - (bits)); \
304}
305
f0d7b1fa 306#define emith_setc(r) { \
307 EMIT_OP(0x0f); \
8b4f38f4 308 EMIT_OP_MODRM(0x92, 3, 0, r); /* SETC r */ \
f0d7b1fa 309}
310
80599a42 311// XXX: stupid mess
3863edbd 312#define emith_mul_(op, dlo, dhi, s1, s2) { \
80599a42 313 int rmr; \
3863edbd 314 if (dlo != xAX && dhi != xAX) \
80599a42 315 emith_push(xAX); \
3863edbd 316 if (dlo != xDX && dhi != xDX) \
317 emith_push(xDX); \
80599a42 318 if ((s1) == xAX) \
319 rmr = s2; \
320 else if ((s2) == xAX) \
321 rmr = s1; \
322 else { \
323 emith_move_r_r(xAX, s1); \
324 rmr = s2; \
325 } \
3863edbd 326 EMIT_OP_MODRM(0xf7, 3, op, rmr); /* xMUL rmr */ \
327 /* XXX: using push/pop for the case of edx->eax; eax->edx */ \
328 if (dhi != xDX && dhi != -1) \
329 emith_push(xDX); \
330 if (dlo != xAX) \
331 emith_move_r_r(dlo, xAX); \
332 if (dhi != xDX && dhi != -1) \
333 emith_pop(dhi); \
334 if (dlo != xDX && dhi != xDX) \
335 emith_pop(xDX); \
336 if (dlo != xAX && dhi != xAX) \
80599a42 337 emith_pop(xAX); \
80599a42 338}
339
3863edbd 340#define emith_mul_u64(dlo, dhi, s1, s2) \
341 emith_mul_(4, dlo, dhi, s1, s2) /* MUL */
342
343#define emith_mul_s64(dlo, dhi, s1, s2) \
344 emith_mul_(5, dlo, dhi, s1, s2) /* IMUL */
345
346#define emith_mul(d, s1, s2) \
347 emith_mul_(4, d, -1, s1, s2)
348
f0d7b1fa 349// (dlo,dhi) += signed(s1) * signed(s2)
350#define emith_mula_s64(dlo, dhi, s1, s2) { \
351 emith_push(dhi); \
352 emith_push(dlo); \
353 emith_mul_(5, dlo, dhi, s1, s2); \
354 EMIT_OP_MODRM(0x03, 0, dlo, 4); \
355 EMIT_SIB(0, 4, 4); /* add dlo, [esp] */ \
356 EMIT_OP_MODRM(0x13, 1, dhi, 4); \
357 EMIT_SIB(0, 4, 4); \
358 EMIT(4, u8); /* adc dhi, [esp+4] */ \
359 emith_add_r_imm(xSP, 4*2); \
360}
361
80599a42 362// "flag" instructions are the same
363#define emith_subf_r_imm emith_sub_r_imm
3863edbd 364#define emith_addf_r_r emith_add_r_r
80599a42 365#define emith_subf_r_r emith_sub_r_r
3863edbd 366#define emith_adcf_r_r emith_adc_r_r
367#define emith_sbcf_r_r emith_sbc_r_r
8796b7ee 368#define emith_eorf_r_r emith_eor_r_r
52d759c3 369#define emith_negcf_r_r emith_negc_r_r
3863edbd 370
ed8cf79b 371#define emith_lslf emith_lsl
372#define emith_lsrf emith_lsr
373#define emith_asrf emith_asr
374#define emith_rolf emith_rol
375#define emith_rorf emith_ror
376#define emith_rolcf emith_rolc
377#define emith_rorcf emith_rorc
80599a42 378
679af8a3 379// XXX: offs is 8bit only
8796b7ee 380#define emith_ctx_read(r, offs) do { \
65c75cb0 381 EMIT_OP_MODRM(0x8b, 1, r, xBP); \
679af8a3 382 EMIT(offs, u8); /* mov tmp, [ebp+#offs] */ \
8796b7ee 383} while (0)
679af8a3 384
8796b7ee 385#define emith_ctx_read_multiple(r, offs, cnt, tmpr) do { \
386 int r_ = r, offs_ = offs, cnt_ = cnt; \
8b4f38f4 387 for (; cnt_ > 0; r_++, offs_ += 4, cnt_--) \
8796b7ee 388 emith_ctx_read(r_, offs_); \
389} while (0)
390
391#define emith_ctx_write(r, offs) do { \
65c75cb0 392 EMIT_OP_MODRM(0x89, 1, r, xBP); \
679af8a3 393 EMIT(offs, u8); /* mov [ebp+#offs], tmp */ \
8796b7ee 394} while (0)
395
396#define emith_ctx_write_multiple(r, offs, cnt, tmpr) do { \
397 int r_ = r, offs_ = offs, cnt_ = cnt; \
8b4f38f4 398 for (; cnt_ > 0; r_++, offs_ += 4, cnt_--) \
8796b7ee 399 emith_ctx_write(r_, offs_); \
400} while (0)
679af8a3 401
679af8a3 402#define emith_jump(ptr) { \
18b94127 403 u32 disp = (u32)(ptr) - ((u32)tcache_ptr + 5); \
e898de13 404 EMIT_OP(0xe9); \
679af8a3 405 EMIT(disp, u32); \
406}
407
18b94127 408#define emith_jump_cond(cond, ptr) { \
409 u32 disp = (u32)(ptr) - ((u32)tcache_ptr + 6); \
410 EMIT(0x0f, u8); \
411 EMIT_OP(0x80 | (cond)); \
412 EMIT(disp, u32); \
413}
414
415#define emith_jump_patchable(cond) \
416 emith_jump_cond(cond, 0)
417
418#define emith_jump_patch(ptr, target) do { \
419 u32 disp = (u32)(target) - ((u32)(ptr) + 6); \
420 EMIT_PTR((u8 *)(ptr) + 2, disp, u32); \
421} while (0)
422
679af8a3 423#define emith_call(ptr) { \
18b94127 424 u32 disp = (u32)(ptr) - ((u32)tcache_ptr + 5); \
e898de13 425 EMIT_OP(0xe8); \
679af8a3 426 EMIT(disp, u32); \
427}
428
f0d7b1fa 429#define emith_call_cond(cond, ptr) \
430 emith_call(ptr)
431
8796b7ee 432#define emith_jump_reg(r) \
433 EMIT_OP_MODRM(0xff, 3, 4, r)
434
435#define EMITH_JMP_START(cond) { \
80599a42 436 u8 *cond_ptr; \
437 JMP8_POS(cond_ptr)
438
8796b7ee 439#define EMITH_JMP_END(cond) \
80599a42 440 JMP8_EMIT(cond, cond_ptr); \
679af8a3 441}
442
8796b7ee 443// "simple" jump (no more then a few insns)
444#define EMITH_SJMP_START EMITH_JMP_START
445#define EMITH_SJMP_END EMITH_JMP_END
446
80599a42 447#define host_arg2reg(rd, arg) \
f4bb5d6b 448 switch (arg) { \
449 case 0: rd = xAX; break; \
450 case 1: rd = xDX; break; \
451 case 2: rd = xCX; break; \
679af8a3 452 }
453
f4bb5d6b 454#define emith_pass_arg_r(arg, reg) { \
455 int rd = 7; \
80599a42 456 host_arg2reg(rd, arg); \
f4bb5d6b 457 emith_move_r_r(rd, reg); \
458}
459
460#define emith_pass_arg_imm(arg, imm) { \
461 int rd = 7; \
80599a42 462 host_arg2reg(rd, arg); \
f4bb5d6b 463 emith_move_r_imm(rd, imm); \
679af8a3 464}
465
65c75cb0 466/* SH2 drc specific */
8796b7ee 467#define emith_sh2_drc_entry() { \
468 emith_push(xBX); \
469 emith_push(xBP); \
8b4f38f4 470 emith_push(xSI); \
471 emith_push(xDI); \
8796b7ee 472}
473
474#define emith_sh2_drc_exit() { \
8b4f38f4 475 emith_pop(xDI); \
476 emith_pop(xSI); \
8796b7ee 477 emith_pop(xBP); \
478 emith_pop(xBX); \
479 EMIT_OP(0xc3); /* ret */\
480}
481
80599a42 482#define emith_sh2_dtbf_loop() { \
483 u8 *jmp0; /* negative cycles check */ \
484 u8 *jmp1; /* unsinged overflow check */ \
485 int cr, rn; \
52d759c3 486 int tmp_ = rcache_get_tmp(); \
80599a42 487 cr = rcache_get_reg(SHR_SR, RC_GR_RMW); \
488 rn = rcache_get_reg((op >> 8) & 0x0f, RC_GR_RMW);\
489 emith_sub_r_imm(rn, 1); \
490 emith_sub_r_imm(cr, (cycles+1) << 12); \
491 cycles = 0; \
52d759c3 492 emith_asr(tmp_, cr, 2+12); \
80599a42 493 JMP8_POS(jmp0); /* no negative cycles */ \
52d759c3 494 emith_move_r_imm(tmp_, 0); \
18b94127 495 JMP8_EMIT(ICOND_JNS, jmp0); \
80599a42 496 emith_and_r_imm(cr, 0xffe); \
52d759c3 497 emith_subf_r_r(rn, tmp_); \
80599a42 498 JMP8_POS(jmp1); /* no overflow */ \
499 emith_neg_r(rn); /* count left */ \
500 emith_lsl(rn, rn, 2+12); \
501 emith_or_r_r(cr, rn); \
502 emith_or_r_imm(cr, 1); \
503 emith_move_r_imm(rn, 0); \
18b94127 504 JMP8_EMIT(ICOND_JA, jmp1); \
52d759c3 505 rcache_free_tmp(tmp_); \
65c75cb0 506}
507
18b94127 508#define emith_write_sr(sr, srcr) { \
52d759c3 509 int tmp_ = rcache_get_tmp(); \
18b94127 510 emith_clear_msb(tmp_, srcr, 22); \
511 emith_bic_r_imm(sr, 0x3ff); \
512 emith_or_r_r(sr, tmp_); \
52d759c3 513 rcache_free_tmp(tmp_); \
ed8cf79b 514}
515
8b4f38f4 516#define emith_tpop_carry(sr, is_sub) \
517 emith_lsr(sr, sr, 1)
518
519#define emith_tpush_carry(sr, is_sub) \
520 emith_adc_r_r(sr, sr)
ed8cf79b 521
f0d7b1fa 522/*
523 * if Q
524 * t = carry(Rn += Rm)
525 * else
526 * t = carry(Rn -= Rm)
527 * T ^= t
528 */
529#define emith_sh2_div1_step(rn, rm, sr) { \
530 u8 *jmp0, *jmp1; \
531 int tmp_ = rcache_get_tmp(); \
8b4f38f4 532 emith_eor_r_r(tmp_, tmp_); \
f0d7b1fa 533 emith_tst_r_imm(sr, Q); /* if (Q ^ M) */ \
534 JMP8_POS(jmp0); /* je do_sub */ \
535 emith_add_r_r(rn, rm); \
536 JMP8_POS(jmp1); /* jmp done */ \
18b94127 537 JMP8_EMIT(ICOND_JE, jmp0); /* do_sub: */ \
f0d7b1fa 538 emith_sub_r_r(rn, rm); \
18b94127 539 JMP8_EMIT_NC(jmp1); /* done: */ \
f0d7b1fa 540 emith_setc(tmp_); \
8b4f38f4 541 EMIT_OP_MODRM(0x31, 3, tmp_, sr); /* T = Q1 ^ Q2 */ \
f0d7b1fa 542 rcache_free_tmp(tmp_); \
543}
544