X-Git-Url: https://notaz.gp2x.de/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=cpu%2Fsh2%2Fmame%2Fsh2pico.c;h=636ebc6f4289de3af1094b5d4437c9c36a81e389;hb=e9a11abb3c8237286fd7b6c4b5048d9eec9b1a1b;hp=57b7d9c5462c87e90a85d75f272dc9eb8b9db244;hpb=553c3eaa3a4bda6ba99d925ecab518fe82530cd6;p=picodrive.git diff --git a/cpu/sh2/mame/sh2pico.c b/cpu/sh2/mame/sh2pico.c index 57b7d9c..636ebc6 100644 --- a/cpu/sh2/mame/sh2pico.c +++ b/cpu/sh2/mame/sh2pico.c @@ -1,19 +1,62 @@ #include "../sh2.h" +#ifdef DRC_CMP +#include "../compiler.c" +#define BUSY_LOOP_HACKS 0 +#else +#define BUSY_LOOP_HACKS 1 +#endif + // MAME types +#ifndef INT8 typedef signed char INT8; typedef signed short INT16; typedef signed int INT32; typedef unsigned int UINT32; typedef unsigned short UINT16; typedef unsigned char UINT8; +#endif + +#ifdef DRC_SH2 -#define RB(a) p32x_sh2_read8(a,sh2) -#define RW(a) p32x_sh2_read16(a,sh2) -#define RL(a) p32x_sh2_read32(a,sh2) -#define WB(a,d) p32x_sh2_write8(a,d,sh2) -#define WW(a,d) p32x_sh2_write16(a,d,sh2) -#define WL(a,d) p32x_sh2_write32(a,d,sh2) +// this nasty conversion is needed for drc-expecting memhandlers +#define MAKE_READFUNC(name, cname) \ +static __inline unsigned int name(SH2 *sh2, unsigned int a) \ +{ \ + unsigned int ret; \ + sh2->sr |= sh2->icount << 12; \ + ret = cname(a, sh2); \ + sh2->icount = (signed int)sh2->sr >> 12; \ + sh2->sr &= 0x3f3; \ + return ret; \ +} + +#define MAKE_WRITEFUNC(name, cname) \ +static __inline void name(SH2 *sh2, unsigned int a, unsigned int d) \ +{ \ + sh2->sr |= sh2->icount << 12; \ + cname(a, d, sh2); \ + sh2->icount = (signed int)sh2->sr >> 12; \ + sh2->sr &= 0x3f3; \ +} + +MAKE_READFUNC(RB, p32x_sh2_read8) +MAKE_READFUNC(RW, p32x_sh2_read16) +MAKE_READFUNC(RL, p32x_sh2_read32) +MAKE_WRITEFUNC(WB, p32x_sh2_write8) +MAKE_WRITEFUNC(WW, p32x_sh2_write16) +MAKE_WRITEFUNC(WL, p32x_sh2_write32) + +#else + +#define RB(sh2, a) p32x_sh2_read8(a, sh2) +#define RW(sh2, a) p32x_sh2_read16(a, sh2) +#define RL(sh2, a) p32x_sh2_read32(a, sh2) +#define WB(sh2, a, d) p32x_sh2_write8(a, d, sh2) +#define WW(sh2, a, d) p32x_sh2_write16(a, d, sh2) +#define WL(sh2, a, d) p32x_sh2_write32(a, d, sh2) + +#endif // some stuff from sh2comn.h #define T 0x00000001 @@ -29,47 +72,173 @@ typedef unsigned char UINT8; #define Rn ((opcode>>8)&15) #define Rm ((opcode>>4)&15) -#define sh2_icount sh2->icount +#define sh2_state SH2 + +extern void lprintf(const char *fmt, ...); +#define logerror lprintf + +#ifdef SH2_STATS +static SH2 sh2_stats; +static unsigned int op_refs[0x10000]; +# define LRN 1 +# define LRM 2 +# define LRNM (LRN|LRM) +# define rlog(rnm) { \ + int op = opcode; \ + if ((rnm) & LRN) { \ + op &= ~0x0f00; \ + sh2_stats.r[Rn]++; \ + } \ + if ((rnm) & LRM) { \ + op &= ~0x00f0; \ + sh2_stats.r[Rm]++; \ + } \ + op_refs[op]++; \ +} +# define rlog1(x) sh2_stats.r[x]++ +# define rlog2(x1,x2) sh2_stats.r[x1]++; sh2_stats.r[x2]++ +#else +# define rlog(x) +# define rlog1(...) +# define rlog2(...) +#endif #include "sh2.c" -#ifndef DRC_TMP +#ifndef DRC_CMP -void sh2_execute(SH2 *sh2_, int cycles) +int sh2_execute_interpreter(SH2 *sh2, int cycles) { - sh2 = sh2_; - sh2->cycles_aim += cycles; - sh2->icount = cycles = sh2->cycles_aim - sh2->cycles_done; + UINT32 opcode; + + sh2->icount = cycles; if (sh2->icount <= 0) - return; + goto out; do { - UINT32 opcode; + if (sh2->delay) + { + sh2->ppc = sh2->delay; + opcode = RW(sh2, sh2->delay); + + // TODO: more branch types + if ((opcode >> 13) == 5) { // BRA/BSR + sh2->r[15] -= 4; + WL(sh2, sh2->r[15], sh2->sr); + sh2->r[15] -= 4; + WL(sh2, sh2->r[15], sh2->pc); + sh2->pc = RL(sh2, sh2->vbr + 6 * 4); + sh2->icount -= 5; + opcode = 9; // NOP + } + + sh2->pc -= 2; + } + else + { + sh2->ppc = sh2->pc; + opcode = RW(sh2, sh2->pc); + } + + sh2->delay = 0; + sh2->pc += 2; + + switch (opcode & ( 15 << 12)) + { + case 0<<12: op0000(sh2, opcode); break; + case 1<<12: op0001(sh2, opcode); break; + case 2<<12: op0010(sh2, opcode); break; + case 3<<12: op0011(sh2, opcode); break; + case 4<<12: op0100(sh2, opcode); break; + case 5<<12: op0101(sh2, opcode); break; + case 6<<12: op0110(sh2, opcode); break; + case 7<<12: op0111(sh2, opcode); break; + case 8<<12: op1000(sh2, opcode); break; + case 9<<12: op1001(sh2, opcode); break; + case 10<<12: op1010(sh2, opcode); break; + case 11<<12: op1011(sh2, opcode); break; + case 12<<12: op1100(sh2, opcode); break; + case 13<<12: op1101(sh2, opcode); break; + case 14<<12: op1110(sh2, opcode); break; + default: op1111(sh2, opcode); break; + } + + sh2->icount--; if (sh2->test_irq && !sh2->delay && sh2->pending_level > ((sh2->sr >> 4) & 0x0f)) { - if (sh2->pending_irl > sh2->pending_int_irq) - sh2_do_irq(sh2, sh2->pending_irl, 64 + sh2->pending_irl/2); - else { - sh2_do_irq(sh2, sh2->pending_int_irq, sh2->pending_int_vector); - sh2->pending_int_irq = 0; // auto-clear - sh2->pending_level = sh2->pending_irl; - } + int level = sh2->pending_level; + int vector = sh2->irq_callback(sh2, level); + sh2_do_irq(sh2, level, vector); sh2->test_irq = 0; } + } + while (sh2->icount > 0 || sh2->delay); /* can't interrupt before delay */ + +out: + return sh2->icount; +} + +#else // if DRC_CMP + +int sh2_execute_interpreter(SH2 *sh2, int cycles) +{ + static unsigned int base_pc_[2] = { 0, 0 }; + static unsigned int end_pc_[2] = { 0, 0 }; + static unsigned char op_flags_[2][BLOCK_INSN_LIMIT]; + unsigned int *base_pc = &base_pc_[sh2->is_slave]; + unsigned int *end_pc = &end_pc_[sh2->is_slave]; + unsigned char *op_flags = op_flags_[sh2->is_slave]; + unsigned int pc_expect; + UINT32 opcode; + + sh2->icount = sh2->cycles_timeslice = cycles; + + if (sh2->pending_level > ((sh2->sr >> 4) & 0x0f)) + { + int level = sh2->pending_level; + int vector = sh2->irq_callback(sh2, level); + sh2_do_irq(sh2, level, vector); + } + pc_expect = sh2->pc; + + if (sh2->icount <= 0) + goto out; + + do + { + if (!sh2->delay) { + if (sh2->pc < *base_pc || sh2->pc >= *end_pc) { + *base_pc = sh2->pc; + scan_block(*base_pc, sh2->is_slave, + op_flags, end_pc, NULL); + } + if ((op_flags[(sh2->pc - *base_pc) / 2] + & OF_BTARGET) || sh2->pc == *base_pc + || pc_expect != sh2->pc) // branched + { + pc_expect = sh2->pc; + if (sh2->icount < 0) + break; + } + + do_sh2_trace(sh2, sh2->icount); + } + pc_expect += 2; + if (sh2->delay) { sh2->ppc = sh2->delay; - opcode = RW(sh2->delay); + opcode = RW(sh2, sh2->delay); sh2->pc -= 2; } else { sh2->ppc = sh2->pc; - opcode = RW(sh2->pc); + opcode = RW(sh2, sh2->pc); } sh2->delay = 0; @@ -77,65 +246,93 @@ void sh2_execute(SH2 *sh2_, int cycles) switch (opcode & ( 15 << 12)) { - case 0<<12: op0000(opcode); break; - case 1<<12: op0001(opcode); break; - case 2<<12: op0010(opcode); break; - case 3<<12: op0011(opcode); break; - case 4<<12: op0100(opcode); break; - case 5<<12: op0101(opcode); break; - case 6<<12: op0110(opcode); break; - case 7<<12: op0111(opcode); break; - case 8<<12: op1000(opcode); break; - case 9<<12: op1001(opcode); break; - case 10<<12: op1010(opcode); break; - case 11<<12: op1011(opcode); break; - case 12<<12: op1100(opcode); break; - case 13<<12: op1101(opcode); break; - case 14<<12: op1110(opcode); break; - default: op1111(opcode); break; + case 0<<12: op0000(sh2, opcode); break; + case 1<<12: op0001(sh2, opcode); break; + case 2<<12: op0010(sh2, opcode); break; + case 3<<12: op0011(sh2, opcode); break; + case 4<<12: op0100(sh2, opcode); break; + case 5<<12: op0101(sh2, opcode); break; + case 6<<12: op0110(sh2, opcode); break; + case 7<<12: op0111(sh2, opcode); break; + case 8<<12: op1000(sh2, opcode); break; + case 9<<12: op1001(sh2, opcode); break; + case 10<<12: op1010(sh2, opcode); break; + case 11<<12: op1011(sh2, opcode); break; + case 12<<12: op1100(sh2, opcode); break; + case 13<<12: op1101(sh2, opcode); break; + case 14<<12: op1110(sh2, opcode); break; + default: op1111(sh2, opcode); break; } sh2->icount--; + + if (sh2->test_irq && !sh2->delay && sh2->pending_level > ((sh2->sr >> 4) & 0x0f)) + { + int level = sh2->pending_level; + int vector = sh2->irq_callback(sh2, level); + sh2_do_irq(sh2, level, vector); + sh2->test_irq = 0; + } + } - while (sh2->icount > 0 || sh2->delay); /* can't interrupt before delay */ + while (1); - sh2->cycles_done += cycles - sh2->icount; +out: + return sh2->icount; } -#else // DRC_TMP +#endif // DRC_CMP -#ifdef __i386__ -#define REGPARM(x) __attribute__((regparm(x))) -#else -#define REGPARM(x) -#endif +#ifdef SH2_STATS +#include +#include +#include "sh2dasm.h" -// tmp -void REGPARM(2) sh2_do_op(SH2 *sh2_, int opcode) +void sh2_dump_stats(void) { - sh2 = sh2_; - sh2->pc += 2; + static const char *rnames[] = { + "R0", "R1", "R2", "R3", "R4", "R5", "R6", "R7", + "R8", "R9", "R10", "R11", "R12", "R13", "R14", "SP", + "PC", "", "PR", "SR", "GBR", "VBR", "MACH", "MACL" + }; + long long total; + char buff[64]; + int u, i; - switch (opcode & ( 15 << 12)) - { - case 0<<12: op0000(opcode); break; - case 1<<12: op0001(opcode); break; - case 2<<12: op0010(opcode); break; - case 3<<12: op0011(opcode); break; - case 4<<12: op0100(opcode); break; - case 5<<12: op0101(opcode); break; - case 6<<12: op0110(opcode); break; - case 7<<12: op0111(opcode); break; - case 8<<12: op1000(opcode); break; - case 9<<12: op1001(opcode); break; - case 10<<12: op1010(opcode); break; - case 11<<12: op1011(opcode); break; - case 12<<12: op1100(opcode); break; - case 13<<12: op1101(opcode); break; - case 14<<12: op1110(opcode); break; - default: op1111(opcode); break; + // dump reg usage + total = 0; + for (i = 0; i < 24; i++) + total += sh2_stats.r[i]; + + for (i = 0; i < 24; i++) { + if (i == 16 || i == 17 || i == 19) + continue; + printf("r %6.3f%% %-4s %9d\n", (double)sh2_stats.r[i] * 100.0 / total, + rnames[i], sh2_stats.r[i]); } -} + memset(&sh2_stats, 0, sizeof(sh2_stats)); + + // dump ops + printf("\n"); + total = 0; + for (i = 0; i < 0x10000; i++) + total += op_refs[i]; + + for (u = 0; u < 16; u++) { + int max = 0, op = 0; + for (i = 0; i < 0x10000; i++) { + if (op_refs[i] > max) { + max = op_refs[i]; + op = i; + } + } + DasmSH2(buff, 0, op); + printf("i %6.3f%% %9d %s\n", (double)op_refs[op] * 100.0 / total, + op_refs[op], buff); + op_refs[op] = 0; + } + memset(op_refs, 0, sizeof(op_refs)); +} #endif