2 @* Compiler helper functions and some SVP HLE code
3 @* (C) notaz, 2008,2009
5 @* This work is licensed under the terms of MAME license.
6 @* See COPYING file in the top-level directory.
9 #include <pico/arm_features.h>
15 @ SSP_GR0, SSP_X, SSP_Y, SSP_A,
16 @ SSP_ST, SSP_STACK, SSP_PC, SSP_P,
17 @ SSP_PM0, SSP_PM1, SSP_PM2, SSP_XST,
18 @ SSP_PM4, SSP_gr13, SSP_PMC, SSP_AL
23 @ r6: STACK and emu flags: sss0 * .uu. .lll NZCV (NZCV is PSR bits from ARM)
32 #define SSP_OFFS_GR 0x400
37 #define SSP_OFFS_PM_WRITE 0x46c // pmac_write[]
38 #define SSP_OFFS_EMUSTAT 0x484 // emu_status
39 #define SSP_OFFS_IRAM_ROM 0x48c // ptr_iram_rom
40 #define SSP_OFFS_DRAM 0x490 // ptr_dram
41 #define SSP_OFFS_IRAM_DIRTY 0x494
42 #define SSP_OFFS_IRAM_CTX 0x498 // iram_context
43 #define SSP_OFFS_BLTAB 0x49c // block_table
44 #define SSP_OFFS_BLTAB_IRAM 0x4a0
45 #define SSP_OFFS_TMP0 0x4a4 // for entry PC
46 #define SSP_OFFS_TMP1 0x4a8
47 #define SSP_OFFS_TMP2 0x4ac
48 #define SSP_WAIT_PM0 0x2000
51 .macro ssp_drc_do_next patch_jump=0
53 str lr, [r7, #SSP_OFFS_TMP2] @ jump instr. (actually call) address + 4
57 str r0, [r7, #SSP_OFFS_TMP0]
61 ldr r2, [r7, #SSP_OFFS_BLTAB]
62 ldr r2, [r2, r0, lsl #2]
69 bl ssp_translate_block
71 ldr r0, [r7, #SSP_OFFS_TMP0] @ entry PC
72 ldr r1, [r7, #SSP_OFFS_BLTAB]
73 str r2, [r1, r0, lsl #2]
81 ldr r1, [r7, #SSP_OFFS_IRAM_DIRTY]
83 ldreq r1, [r7, #SSP_OFFS_IRAM_CTX]
84 beq 1f @ ssp_de_iram_ctx
86 bl ssp_get_iram_context
88 str r1, [r7, #SSP_OFFS_IRAM_DIRTY]
90 str r1, [r7, #SSP_OFFS_IRAM_CTX]
91 ldr r0, [r7, #SSP_OFFS_TMP0] @ entry PC
94 ldr r2, [r7, #SSP_OFFS_BLTAB_IRAM]
95 add r2, r2, r1, lsl #12 @ block_tab_iram + iram_context * 0x800/2*4
96 add r1, r2, r0, lsl #2
104 str r1, [r7, #SSP_OFFS_TMP1]
105 bl ssp_translate_block
107 ldr r0, [r7, #SSP_OFFS_TMP0] @ entry PC
108 ldr r1, [r7, #SSP_OFFS_TMP1] @ &block_table_iram[iram_context][rPC]
115 .endm @ ssp_drc_do_next
118 FUNCTION(ssp_drc_entry):
119 stmfd sp!, {r4-r11, lr}
125 ldmia r2, {r3,r4,r5,r6,r8}
128 orr r4, r3, r4, lsr #16 @ XXYY
130 and r8, r8, #0x0f0000
131 mov r8, r8, lsl #13 @ sss0 *
132 and r9, r6, #0x670000
136 orrne r8, r8, #0x4 @ sss0 * NZ..
137 orr r6, r8, r9, lsr #12 @ sss0 * .uu. .lll NZ..
139 ldr r8, [r7, #0x440] @ r0-r2
140 ldr r9, [r7, #0x444] @ r4-r6
141 ldr r10,[r7, #(0x400+SSP_P*4)] @ P
143 ldr r0, [r7, #(SSP_OFFS_GR+SSP_PC*4)]
147 FUNCTION(ssp_drc_next):
151 FUNCTION(ssp_drc_next_patch):
155 ldr r1, [r7, #SSP_OFFS_TMP2] @ jump instr. (actually call) address + 4
157 moveq r3, #0xe1000000
158 orreq r3, r3, #0x00a00000 @ nop
165 streq r3, [r1, #-4] @ move the other cond up
166 moveq r3, #0xe1000000
167 orreq r3, r3, #0x00a00000
168 streq r3, [r1] @ fill it's place with nop
174 bic r3, r3, #1 @ L bit
175 orr r3, r3, r12,lsl #6
176 mov r3, r3, ror #8 @ patched branch instruction
177 str r3, [r1, #-4] @ patch the bl/b to jump directly to another handler
180 str r2, [r7, #SSP_OFFS_TMP1]
183 bl cache_flush_d_inval_i
184 ldr r2, [r7, #SSP_OFFS_TMP1]
185 ldr r0, [r7, #SSP_OFFS_TMP0]
189 FUNCTION(ssp_drc_end):
191 str r0, [r7, #(SSP_OFFS_GR+SSP_PC*4)]
194 str r10,[r7, #(0x400+SSP_P*4)] @ P
195 str r8, [r7, #0x440] @ r0-r2
196 str r9, [r7, #0x444] @ r4-r6
199 and r9, r9, #(7<<16) @ STACK
201 msr cpsr_f, r3 @ to to ARM PSR
204 orrmi r6, r6, #0x80000000 @ N
205 orreq r6, r6, #0x20000000 @ Z
207 mov r3, r4, lsl #16 @ Y
209 mov r2, r2, lsl #16 @ X
212 stmia r8, {r2,r3,r5,r6,r9}
215 ldmfd sp!, {r4-r11, lr}
223 FUNCTION(ssp_hle_800):
224 ldr r0, [r7, #(SSP_OFFS_GR+SSP_PM0*4)]
225 ldr r1, [r7, #SSP_OFFS_EMUSTAT]
227 orreq r1, r1, #SSP_WAIT_PM0
229 streq r1, [r7, #SSP_OFFS_EMUSTAT]
236 .macro hle_flushflags
239 orr r6, r6, r1, lsr #28
243 sub r6, r6, #0x20000000
245 add r1, r1, #0x048 @ stack
246 add r1, r1, r6, lsr #28
250 FUNCTION(ssp_hle_902):
256 ldr r3, [r7, #SSP_OFFS_IRAM_ROM]
257 add r2, r3, r0, lsl #1 @ (r7|00)
262 add r3, r3, r0, lsl #1 @ IRAM dest
263 ldrh r12,[r2], #2 @ length
264 bic r3, r3, #3 @ always seen aligned
265 @ orr r5, r5, #0x08000000
266 @ orr r5, r5, #0x00880000
267 @ sub r5, r5, r12, lsl #16
271 str r0, [r7, #SSP_OFFS_IRAM_DIRTY]
272 sub r11,r11,r12,lsl #1
273 sub r11,r11,r12 @ -= length*3
279 orr r0, r0, r1, lsl #16
287 ldr r0, [r7, #SSP_OFFS_IRAM_ROM]
291 strh r2, [r1] @ (r7|00)
295 orr r0, r0, #0x08000000
296 orr r0, r0, #0x001c8000
297 str r0, [r7, #(SSP_OFFS_GR+SSP_PMC*4)]
298 str r0, [r7, #(SSP_OFFS_PM_WRITE+4*4)]
301 subs r11,r11,#16 @ timeslice is likely to end
306 @ this one is car rendering related
307 .macro hle_11_12c_mla offs_in
308 ldrsh r5, [r7, #(\offs_in+0)]
309 ldrsh r0, [r7, #(\offs_in+2)]
310 ldrsh r1, [r7, #(\offs_in+4)]
312 ldrsh r12,[r7, #(\offs_in+6)]
315 add r5, r5, r12,lsl #11
318 add r1, r7, r8, lsr #23
323 FUNCTION(ssp_hle_11_12c):
339 mov r2, r2, asr #15 @ (r7|00) << 1
341 mov r3, r3, asr #15 @ (r7|01) << 1
343 mov r4, r4, asr #15 @ (r7|10) << 1
360 FUNCTION(ssp_hle_11_384):
364 FUNCTION(ssp_hle_11_38a):
371 mov r2, #0 @ EFh, EEh
373 add r0, r7, #0x1c0 @ r0 (based)
379 eor r5, r5, r5, asr #31
380 add r5, r5, r5, lsr #31 @ abs(r5)
382 orrpl r2, r2, r1,lsl #16 @ EFh |= r4
387 orrpl r2, r2, r1,lsl #16 @ EFh |= r4
397 bpl ssp_hle_11_38x_loop
402 orr r8, r8, r0, lsr #1
408 sub r11,r11,#(9+30*4)
412 FUNCTION(ssp_hle_07_6d6):
417 and r0, r8, #0xff @ assuming alignment
418 add r0, r7, r0, lsl #1
420 mov r1, r1, lsl #16 @ 106h << 16
421 mov r2, r2, lsl #16 @ 107h << 16
426 bmi ssp_hle_07_6d6_end
432 bmi ssp_hle_07_6d6_loop
434 b ssp_hle_07_6d6_loop
441 orr r1, r2, r1, lsr #16
448 FUNCTION(ssp_hle_07_030):
451 orr r0, r0, r0, lsr #16
455 FUNCTION(ssp_hle_07_036):
456 ldr r1, [r7, #0x1e0] @ F1h F0h
457 rsb r5, r1, r1, lsr #16
458 mov r5, r5, lsl #16 @ AL not needed
461 bmi hle_07_036_ending2
462 ldr r1, [r7, #0x1dc] @ EEh
469 strh r0, [r1, #0xea] @ F5h
470 ldr r0, [r7, #0x1e0] @ F0h
472 strh r0, [r1, #0xf0] @ F8h
473 add r2, r0, #0xc0 @ r2
474 add r2, r7, r2, lsl #1
480 @ will handle PMC later
481 ldr r0, [r7, #0x1e8] @ F5h << 16
482 ldr r1, [r7, #0x1f0] @ F8h
483 ldr r2, [r7, #0x1d4] @ EAh
485 add r0, r0, r1, lsl #16
486 sub r0, r2, r0, asr #18
488 rsbs r0, r0, #0x78 @ length
489 ble hle_07_036_ending1
494 ldr r1, [r7, #(SSP_OFFS_GR+SSP_PMC*4)]
495 ldr r2, [r7, #SSP_OFFS_DRAM]
497 add r1, r2, r1, lsr #15 @ addr (based)
498 ldrh r2, [r7, #0] @ pattern
499 ldrh r3, [r7, #6] @ mode
504 subnes r12,r12,#0x0400
507 orr r2, r2, r2, lsl #16
513 strneh r2, [r1], #0x3e @ align
526 strne r2, [r1], #0x40
529 b hle_07_036_end_copy
533 orreq r12,r12,#0x000f
535 orreq r12,r12,#0x00f0
537 orreq r12,r12,#0x0f00
539 orreq r12,r12,#0xf000
540 orrs r12,r12,r12,lsl #16
541 beq hle_07_036_no_ovrwr
548 strh r3, [r1], #0x3e @ align
571 ldr r2, [r7, #SSP_OFFS_DRAM]
573 sub r0, r1, r2 @ new addr
575 strh r0, [r3, #(0x6c+4*4)] @ SSP_OFFS_PM_WRITE+4*4 (low)
578 ldr r0, [r7, #0x1e0] @ F1h << 16
581 add r0, r0, #(0xc4<<16)
582 bic r8, r8, #0xff0000
584 add r0, r7, r0, lsr #15
590 ldr r1, [r7, #4] @ new mode
592 strh r1, [r2, #(0x6c+4*4+2)] @ SSP_OFFS_PM_WRITE+4*4 (high)
606 b ssp_drc_next @ let the dispatcher finish this
609 @ ios stuff - preserving r9 on external calls
612 #define APPLE_WRAP(f) \
618 APPLE_WRAP(cache_flush_d_inval_i)
619 APPLE_WRAP(ssp_get_iram_context)
620 APPLE_WRAP(ssp_pm_read)
621 APPLE_WRAP(ssp_pm_write)
622 APPLE_WRAP(ssp_translate_block)
623 APPLE_WRAP(tr_unhandled)
627 @ vim:filetype=armasm