full ym2612 save/load for 940
[picodrive.git] / platform / gp2x / 940ctl.c
... / ...
CommitLineData
1// Code for communication with ARM940 and control of it.\r
2// (c) Copyright 2007, Grazvydas "notaz" Ignotas\r
3\r
4#include <stdio.h>\r
5#include <stdlib.h>\r
6#include <string.h>\r
7#include <unistd.h>\r
8#include <sys/mman.h>\r
9#include <sys/ioctl.h>\r
10#include <fcntl.h>\r
11#include <errno.h>\r
12\r
13#include "code940/940shared.h"\r
14#include "gp2x.h"\r
15#include "emu.h"\r
16#include "menu.h"\r
17#include "../common/mp3.h"\r
18#include "../common/arm_utils.h"\r
19#include "../common/menu.h"\r
20#include "../common/emu.h"\r
21#include "../../Pico/PicoInt.h"\r
22#include "../../Pico/sound/ym2612.h"\r
23#include "../../Pico/sound/mix.h"\r
24\r
25/* we will need some gp2x internals here */\r
26extern volatile unsigned short *gp2x_memregs; /* from minimal library rlyeh */\r
27extern volatile unsigned long *gp2x_memregl;\r
28\r
29extern int reset_timing;\r
30static unsigned char *shared_mem = 0;\r
31static _940_data_t *shared_data = 0;\r
32_940_ctl_t *shared_ctl = 0;\r
33unsigned char *mp3_mem = 0;\r
34\r
35#define MP3_SIZE_MAX (0x400000 + 0x800000) // 12M\r
36#define CODE940_FILE "pico940_v3.bin"\r
37\r
38int crashed_940 = 0;\r
39\r
40static FILE *loaded_mp3 = 0;\r
41\r
42/***********************************************************/\r
43\r
#define MAXOUT (+32767)
#define MINOUT (-32768)

/*
 * limiter: clamps the lvalue `val` into [min, max] in place.
 * Wrapped in do/while(0) so that `Limit(...);` is a single statement and
 * can be used as the body of an if/else. Arguments are evaluated more than
 * once, so they must not have side effects.
 */
#define Limit(val, max, min) do { \
	if ((val) > (max)) (val) = (max); \
	else if ((val) < (min)) (val) = (min); \
} while (0)
52\r
53/* these will be managed locally on our side */\r
54static UINT8 ST_address; /* address register */\r
55static INT32 addr_A1; /* address line A1 */\r
56\r
57static int writebuff_ptr = 0;\r
58\r
59\r
60/* YM2612 write */\r
61/* a = address */\r
62/* v = value */\r
63/* returns 1 if sample affecting state changed */\r
64int YM2612Write_940(unsigned int a, unsigned int v, int scanline)\r
65{\r
66 int upd = 1; /* the write affects sample generation */\r
67\r
68 a &= 3;\r
69\r
70 //printf("%05i:%03i: ym w ([%i] %02x)\n", Pico.m.frame_count, Pico.m.scanline, a, v);\r
71\r
72 switch (a)\r
73 {\r
74 case 0: /* address port 0 */\r
75 if (addr_A1 == 0 && ST_address == v)\r
76 return 0; /* address already selected, don't send this command to 940 */\r
77 ST_address = v;\r
78 addr_A1 = 0;\r
79 /* don't send DAC or timer related address changes to 940 */\r
80 if (v == 0x24 || v == 0x25 || v == 0x26 || v == 0x2a)\r
81 return 0;\r
82 upd = 0;\r
83 break;\r
84\r
85 case 1: /* data port 0 */\r
86 if (ST_address == 0x2b) upd = 0; /* DAC sel */\r
87 break;\r
88\r
89 case 2: /* address port 1 */\r
90 if (addr_A1 == 1 && ST_address == v)\r
91 return 0;\r
92 ST_address = v;\r
93 addr_A1 = 1;\r
94 upd = 0;\r
95 break;\r
96 }\r
97\r
98 //printf("ym pass\n");\r
99\r
100 if (currentConfig.EmuOpt & 4)\r
101 {\r
102 UINT16 *writebuff = shared_ctl->writebuffsel ? shared_ctl->writebuff0 : shared_ctl->writebuff1;\r
103\r
104 /* detect rapid ym updates */\r
105 if (upd && !(writebuff_ptr & 0x80000000) && scanline < 224)\r
106 {\r
107 int mid = Pico.m.pal ? 68 : 93;\r
108 if (scanline > mid) {\r
109 //printf("%05i:%03i: rapid ym\n", Pico.m.frame_count, scanline);\r
110 writebuff[writebuff_ptr++ & 0xffff] = 0xfffe;\r
111 writebuff_ptr |= 0x80000000;\r
112 //printf("%05i:%03i: ym w ([%02x] %02x, upd=%i)\n", Pico.m.frame_count, scanline, addr, v, upd);\r
113 }\r
114 }\r
115\r
116 /* queue this write for 940 */\r
117 if ((writebuff_ptr&0xffff) < 2047) {\r
118 writebuff[writebuff_ptr++ & 0xffff] = (a<<8)|v;\r
119 } else {\r
120 printf("warning: writebuff_ptr > 2047 ([%i] %02x)\n", a, v);\r
121 }\r
122 }\r
123\r
124 return 0; // cause the engine to do updates once per frame only\r
125}\r
126\r
127\r
/*
 * nonzero while the bit of job `job` (1-based) is still set in the DUALCPU
 * pending register at 0x3b46. `job` is parenthesised so that expression
 * arguments select the intended bit.
 */
#define CHECK_BUSY(job) \
	(gp2x_memregs[0x3b46>>1] & (1<<((job)-1)))
130\r
131static void wait_busy_940(int job)\r
132{\r
133 int i;\r
134\r
135 job--;\r
136 for (i = 0; (gp2x_memregs[0x3b46>>1] & (1<<job)) && i < 0x10000; i++)\r
137 spend_cycles(8*1024); // tested to be best for mp3 dec\r
138 if (i < 0x10000) return;\r
139\r
140 /* 940 crashed */\r
141 printf("940 crashed (cnt: %i, ve: ", shared_ctl->loopc);\r
142 for (i = 0; i < 8; i++)\r
143 printf("%i ", shared_ctl->vstarts[i]);\r
144 printf(")\n");\r
145 printf("irq pending flags: DUALCPU %04x, SRCPND %08lx (see 26), INTPND %08lx\n",\r
146 gp2x_memregs[0x3b46>>1], gp2x_memregl[0x4500>>2], gp2x_memregl[0x4510>>2]);\r
147 printf("last lr: %08x, lastjob: %i\n", shared_ctl->last_lr, shared_ctl->lastjob);\r
148 printf("trying to interrupt..\n");\r
149 gp2x_memregs[0x3B3E>>1] = 0xffff;\r
150 for (i = 0; gp2x_memregs[0x3b46>>1] && i < 0x10000; i++)\r
151 spend_cycles(8*1024);\r
152 printf("i = 0x%x\n", i);\r
153 printf("irq pending flags: DUALCPU %04x, SRCPND %08lx (see 26), INTPND %08lx\n",\r
154 gp2x_memregs[0x3b46>>1], gp2x_memregl[0x4500>>2], gp2x_memregl[0x4510>>2]);\r
155 printf("last lr: %08x, lastjob: %i\n", shared_ctl->last_lr, shared_ctl->lastjob);\r
156\r
157 strcpy(menuErrorMsg, "940 crashed, too much overclock?");\r
158 engineState = PGS_Menu;\r
159 crashed_940 = 1;\r
160}\r
161\r
162\r
163static void add_job_940(int job)\r
164{\r
165 if (job <= 0 || job > 16) {\r
166 printf("add_job_940: bad job: %i\n", job);\r
167 return;\r
168 }\r
169\r
170 // generate interrupt for this job\r
171 job--;\r
172 gp2x_memregs[(0x3B20+job*2)>>1] = 1;\r
173\r
174// printf("added %i, pending %04x\n", job+1, gp2x_memregs[0x3b46>>1]);\r
175}\r
176\r
177\r
178void YM2612PicoStateLoad_940(void)\r
179{\r
180 UINT8 *REGS = YM2612GetRegs();\r
181\r
182 /* make sure JOB940_PICOSTATELOAD gets done before next JOB940_YM2612UPDATEONE */\r
183 add_job_940(JOB940_PICOSTATELOAD);\r
184 if (CHECK_BUSY(JOB940_PICOSTATELOAD)) wait_busy_940(JOB940_PICOSTATELOAD);\r
185\r
186 writebuff_ptr = 0;\r
187 addr_A1 = *(INT32 *) (REGS + 0x200);\r
188}\r
189\r
190void YM2612PicoStateSave2_940(int tat, int tbt)\r
191{\r
192 UINT8 *ym_remote_regs, *ym_local_regs;\r
193 add_job_940(JOB940_PICOSTATESAVE2);\r
194 if (CHECK_BUSY(JOB940_PICOSTATESAVE2)) wait_busy_940(JOB940_PICOSTATESAVE2);\r
195\r
196 ym_remote_regs = (UINT8 *) shared_ctl->writebuff0;\r
197 ym_local_regs = YM2612GetRegs();\r
198 if (*(UINT32 *)(ym_remote_regs + 0x100) != 0x41534d59) {\r
199 printf("code940 didn't return valid save data\n");\r
200 return;\r
201 }\r
202\r
203 /* copy addin data only */\r
204 memcpy(ym_local_regs, ym_remote_regs, 0x20);\r
205 memcpy(ym_local_regs + 0x100, ym_remote_regs + 0x100, 0x30);\r
206 memcpy(ym_local_regs + 0x0b8, ym_remote_regs + 0x0b8, 0x48);\r
207 memcpy(ym_local_regs + 0x1b8, ym_remote_regs + 0x1b8, 0x48);\r
208 *(INT32 *)(ym_local_regs + 0x108) = tat;\r
209 *(INT32 *)(ym_local_regs + 0x10c) = tbt;\r
210}\r
211\r
212int YM2612PicoStateLoad2_940(int *tat, int *tbt)\r
213{\r
214 UINT8 *ym_remote_regs, *ym_local_regs;\r
215 ym_local_regs = YM2612GetRegs();\r
216 ym_remote_regs = (UINT8 *) shared_ctl->writebuff0;\r
217\r
218 if (*(UINT32 *)(ym_local_regs + 0x100) != 0x41534d59)\r
219 return -1;\r
220\r
221 *tat = *(INT32 *)(ym_local_regs + 0x108);\r
222 *tbt = *(INT32 *)(ym_local_regs + 0x10c);\r
223\r
224 if (CHECK_BUSY(JOB940_YM2612UPDATEONE)) wait_busy_940(JOB940_YM2612UPDATEONE);\r
225\r
226 /* flush writes */\r
227 if (shared_ctl->writebuffsel == 1) {\r
228 shared_ctl->writebuff0[writebuff_ptr & 0xffff] = 0xffff;\r
229 } else {\r
230 shared_ctl->writebuff1[writebuff_ptr & 0xffff] = 0xffff;\r
231 }\r
232 shared_ctl->writebuffsel ^= 1;\r
233 writebuff_ptr = 0;\r
234 add_job_940(JOB940_PICOSTATELOAD2_PREP);\r
235 if (CHECK_BUSY(JOB940_PICOSTATELOAD2_PREP)) wait_busy_940(JOB940_PICOSTATELOAD2_PREP);\r
236\r
237 memcpy(ym_remote_regs, ym_local_regs, 0x200);\r
238\r
239 add_job_940(JOB940_PICOSTATELOAD2);\r
240 if (CHECK_BUSY(JOB940_PICOSTATELOAD2)) wait_busy_940(JOB940_PICOSTATELOAD2);\r
241\r
242 return 0;\r
243}\r
244\r
245\r
246static void internal_reset(void)\r
247{\r
248 writebuff_ptr = 0;\r
249 ST_address = addr_A1 = -1;\r
250}\r
251\r
252\r
253/* this must be called after mmu hack, the allocated regions must not get cached */\r
254void sharedmem_init(void)\r
255{\r
256 if (shared_mem != NULL) return;\r
257\r
258 shared_mem = (unsigned char *) mmap(0, 0x210000, PROT_READ|PROT_WRITE, MAP_SHARED, memdev, 0x2000000);\r
259 if (shared_mem == MAP_FAILED)\r
260 {\r
261 printf("mmap(shared_data) failed with %i\n", errno);\r
262 exit(1);\r
263 }\r
264 shared_data = (_940_data_t *) (shared_mem+0x100000);\r
265 /* this area must not get buffered on either side */\r
266 shared_ctl = (_940_ctl_t *) (shared_mem+0x200000);\r
267 mp3_mem = (unsigned char *) mmap(0, MP3_SIZE_MAX, PROT_READ|PROT_WRITE, MAP_SHARED, memdev, 0x2400000);\r
268 if (mp3_mem == MAP_FAILED)\r
269 {\r
270 printf("mmap(mp3_mem) failed with %i\n", errno);\r
271 exit(1);\r
272 }\r
273 crashed_940 = 1;\r
274}\r
275\r
276\r
277void sharedmem_deinit(void)\r
278{\r
279 munmap(shared_mem, 0x210000);\r
280 munmap(mp3_mem, MP3_SIZE_MAX);\r
281 shared_mem = mp3_mem = NULL;\r
282 shared_data = NULL;\r
283 shared_ctl = NULL;\r
284}\r
285\r
286\r
287extern char **g_argv;\r
288\r
289void YM2612Init_940(int baseclock, int rate)\r
290{\r
291 printf("YM2612Init_940()\n");\r
292 printf("Mem usage: shared_data: %i, shared_ctl: %i\n", sizeof(*shared_data), sizeof(*shared_ctl));\r
293\r
294 Reset940(1, 2);\r
295 Pause940(1);\r
296\r
297 gp2x_memregs[0x3B40>>1] = 0; // disable DUALCPU interrupts for 920\r
298 gp2x_memregs[0x3B42>>1] = 1; // enable DUALCPU interrupts for 940\r
299\r
300 gp2x_memregl[0x4504>>2] = 0; // make sure no FIQs will be generated\r
301 gp2x_memregl[0x4508>>2] = ~(1<<26); // unmask DUALCPU ints in the undocumented 940's interrupt controller\r
302\r
303\r
304 if (crashed_940)\r
305 {\r
306 unsigned char ucData[1024];\r
307 int nRead, i, nLen = 0;\r
308 char binpath[1024];\r
309 FILE *fp;\r
310\r
311 strncpy(binpath, g_argv[0], 1023);\r
312 binpath[1023] = 0;\r
313 for (i = strlen(binpath); i > 0; i--)\r
314 if (binpath[i] == '/') { binpath[i] = 0; break; }\r
315 strcat(binpath, "/" CODE940_FILE);\r
316\r
317 fp = fopen(binpath, "rb");\r
318 if(!fp)\r
319 {\r
320 memset(gp2x_screen, 0, 320*240*2);\r
321 text_out16(10, 100, "failed to open required file:");\r
322 text_out16(10, 110, CODE940_FILE);\r
323 gp2x_video_flip2();\r
324 printf("failed to open %s\n", binpath);\r
325 exit(1);\r
326 }\r
327\r
328 while(1)\r
329 {\r
330 nRead = fread(ucData, 1, 1024, fp);\r
331 if(nRead <= 0)\r
332 break;\r
333 memcpy(shared_mem + nLen, ucData, nRead);\r
334 nLen += nRead;\r
335 }\r
336 fclose(fp);\r
337 crashed_940 = 0;\r
338 }\r
339\r
340 memset(shared_data, 0, sizeof(*shared_data));\r
341 memset(shared_ctl, 0, sizeof(*shared_ctl));\r
342\r
343 /* cause local ym2612 to init REGS */\r
344 YM2612Init_(baseclock, rate);\r
345\r
346 internal_reset();\r
347\r
348 loaded_mp3 = 0;\r
349\r
350 gp2x_memregs[0x3B46>>1] = 0xffff; // clear pending DUALCPU interrupts for 940\r
351 gp2x_memregl[0x4500>>2] = 0xffffffff; // clear pending IRQs in SRCPND\r
352 gp2x_memregl[0x4510>>2] = 0xffffffff; // clear pending IRQs in INTPND\r
353\r
354 /* start the 940 */\r
355 Reset940(0, 2);\r
356 Pause940(0);\r
357\r
358 // YM2612ResetChip_940(); // will be done on JOB940_YM2612INIT\r
359\r
360 /* now cause 940 to init it's ym2612 stuff */\r
361 shared_ctl->baseclock = baseclock;\r
362 shared_ctl->rate = rate;\r
363 add_job_940(JOB940_INITALL);\r
364}\r
365\r
366\r
367void YM2612ResetChip_940(void)\r
368{\r
369 //printf("YM2612ResetChip_940()\n");\r
370 if (shared_data == NULL) {\r
371 printf("YM2612ResetChip_940: reset before init?\n");\r
372 return;\r
373 }\r
374\r
375 YM2612ResetChip_();\r
376 internal_reset();\r
377\r
378 add_job_940(JOB940_YM2612RESETCHIP);\r
379}\r
380\r
381\r
382int YM2612UpdateOne_940(int *buffer, int length, int stereo, int is_buf_empty)\r
383{\r
384 int *ym_buf = shared_data->ym_buffer;\r
385 int ym_active_chs;\r
386\r
387 //printf("YM2612UpdateOne_940()\n");\r
388\r
389 if (CHECK_BUSY(JOB940_YM2612UPDATEONE)) wait_busy_940(JOB940_YM2612UPDATEONE);\r
390\r
391 ym_active_chs = shared_ctl->ym_active_chs;\r
392\r
393 // mix in ym buffer. is_buf_empty means nobody mixed there anything yet and it may contain trash\r
394 if (is_buf_empty && ym_active_chs) memcpy32(buffer, ym_buf, length<<stereo);\r
395 else memset32(buffer, 0, length<<stereo);\r
396\r
397 if (shared_ctl->writebuffsel == 1) {\r
398 shared_ctl->writebuff0[writebuff_ptr & 0xffff] = 0xffff;\r
399 } else {\r
400 shared_ctl->writebuff1[writebuff_ptr & 0xffff] = 0xffff;\r
401 }\r
402 writebuff_ptr = 0;\r
403\r
404 /* predict sample counter for next frame */\r
405 if (PsndLen_exc_add) {\r
406 if (PsndLen_exc_cnt + PsndLen_exc_add >= 0x10000) length = PsndLen + 1;\r
407 else length = PsndLen;\r
408 }\r
409\r
410 /* give 940 ym job */\r
411 shared_ctl->writebuffsel ^= 1;\r
412 shared_ctl->length = length;\r
413 shared_ctl->stereo = stereo;\r
414\r
415 add_job_940(JOB940_YM2612UPDATEONE);\r
416\r
417 return ym_active_chs;\r
418}\r
419\r
420\r
421static int mp3_samples_ready = 0, mp3_buffer_offs = 0;\r
422static int mp3_play_bufsel = 0, mp3_job_started = 0;\r
423\r
424void mp3_update(int *buffer, int length, int stereo)\r
425{\r
426 int length_mp3;\r
427 int cdda_on;\r
428\r
429 // playback was started, track not ended\r
430 cdda_on = loaded_mp3 && shared_ctl->mp3_offs < shared_ctl->mp3_len;\r
431\r
432 if (!cdda_on) return;\r
433\r
434 if (!(PicoOpt&0x200)) {\r
435 mp3_update_local(buffer, length, stereo);\r
436 return;\r
437 }\r
438\r
439 length_mp3 = length;\r
440 if (PsndRate == 22050) length_mp3 <<= 1; // mp3s are locked to 44100Hz stereo\r
441 else if (PsndRate == 11025) length_mp3 <<= 2; // so make length 44100ish\r
442\r
443 /* do we have to wait? */\r
444 if (mp3_job_started && mp3_samples_ready < length_mp3) {\r
445 if (CHECK_BUSY(JOB940_MP3DECODE)) wait_busy_940(JOB940_MP3DECODE);\r
446 mp3_job_started = 0;\r
447 mp3_samples_ready += 1152;\r
448 }\r
449\r
450 /* mix mp3 data, only stereo */\r
451 if (mp3_samples_ready >= length_mp3)\r
452 {\r
453 int shr = 0;\r
454 void (*mix_samples)(int *dest_buf, short *mp3_buf, int count) = mix_16h_to_32;\r
455 if (PsndRate == 22050) { mix_samples = mix_16h_to_32_s1; shr = 1; }\r
456 else if (PsndRate == 11025) { mix_samples = mix_16h_to_32_s2; shr = 2; }\r
457\r
458 if (1152 - mp3_buffer_offs >= length_mp3) {\r
459 mix_samples(buffer, shared_data->mp3_buffer[mp3_play_bufsel] + mp3_buffer_offs*2, length<<1);\r
460\r
461 mp3_buffer_offs += length_mp3;\r
462 } else {\r
463 // collect samples from both buffers..\r
464 int left = 1152 - mp3_buffer_offs;\r
465 if (mp3_play_bufsel == 0)\r
466 {\r
467 mix_samples(buffer, shared_data->mp3_buffer[0] + mp3_buffer_offs*2, length<<1);\r
468 mp3_buffer_offs = length_mp3 - left;\r
469 mp3_play_bufsel = 1;\r
470 } else {\r
471 mix_samples(buffer, shared_data->mp3_buffer[1] + mp3_buffer_offs*2, (left>>shr)<<1);\r
472 mp3_buffer_offs = length_mp3 - left;\r
473 mix_samples(buffer + ((left>>shr)<<1),\r
474 shared_data->mp3_buffer[0], (mp3_buffer_offs>>shr)<<1);\r
475 mp3_play_bufsel = 0;\r
476 }\r
477 }\r
478 mp3_samples_ready -= length_mp3;\r
479 }\r
480\r
481 // ask to decode more if we already can\r
482 if (!mp3_job_started)\r
483 {\r
484 mp3_job_started = 1;\r
485 shared_ctl->mp3_buffsel ^= 1;\r
486 add_job_940(JOB940_MP3DECODE);\r
487 }\r
488}\r
489\r
490\r
491/***********************************************************/\r
492\r
493void mp3_start_play(FILE *f, int pos) // pos is 0-1023\r
494{\r
495 int byte_offs = 0;\r
496\r
497 if (!(PicoOpt&0x800)) { // cdda disabled?\r
498 return;\r
499 }\r
500\r
501 if (loaded_mp3 != f)\r
502 {\r
503 if (PicoMessage != NULL)\r
504 {\r
505 fseek(f, 0, SEEK_END);\r
506 if (ftell(f) > 2*1024*1024)\r
507 PicoMessage("Loading MP3...");\r
508 }\r
509 fseek(f, 0, SEEK_SET);\r
510 fread(mp3_mem, 1, MP3_SIZE_MAX, f);\r
511 if (!feof(f)) printf("Warning: mp3 was too large, not all data loaded.\n");\r
512 shared_ctl->mp3_len = ftell(f);\r
513 loaded_mp3 = f;\r
514\r
515 if (PicoOpt&0x200) {\r
516 // as we are going to change 940's cacheable area, we must invalidate it's cache..\r
517 if (CHECK_BUSY(JOB940_MP3DECODE)) wait_busy_940(JOB940_MP3DECODE);\r
518 add_job_940(JOB940_INVALIDATE_DCACHE);\r
519 }\r
520 reset_timing = 1;\r
521 }\r
522\r
523 // seek..\r
524 if (pos) {\r
525 byte_offs = (shared_ctl->mp3_len << 6) >> 10;\r
526 byte_offs *= pos;\r
527 byte_offs >>= 6;\r
528 }\r
529 // printf("mp3 pos1024: %i, byte_offs %i/%i\n", pos, byte_offs, shared_ctl->mp3_len);\r
530\r
531 shared_ctl->mp3_offs = byte_offs;\r
532\r
533 // reset buffer pointers and stuff..\r
534 mp3_samples_ready = mp3_buffer_offs = mp3_play_bufsel = 0;\r
535 mp3_job_started = 0;\r
536 shared_ctl->mp3_buffsel = 1; // will change to 0 on first decode\r
537\r
538 if (!(PicoOpt&0x200)) mp3_start_local();\r
539}\r
540\r
541\r
542int mp3_get_offset(void)\r
543{\r
544 unsigned int offs1024 = 0;\r
545 int cdda_on;\r
546\r
547 cdda_on = (PicoAHW & PAHW_MCD) && (PicoOpt&0x800) && !(Pico_mcd->s68k_regs[0x36] & 1) &&\r
548 (Pico_mcd->scd.Status_CDC & 1) && loaded_mp3;\r
549\r
550 if (cdda_on) {\r
551 offs1024 = shared_ctl->mp3_offs << 7;\r
552 offs1024 /= shared_ctl->mp3_len >> 3;\r
553 }\r
554 printf("offs1024=%u (%i/%i)\n", offs1024, shared_ctl->mp3_offs, shared_ctl->mp3_len);\r
555\r
556 return offs1024;\r
557}\r
558\r
559\r