initial code for Nemesis' blip discovery
[picodrive.git] / platform / gp2x / 940ctl.c
CommitLineData
6cadc2da 1// Code for communication with ARM940 and control of it.\r
2// (c) Copyright 2007, Grazvydas "notaz" Ignotas\r
3\r
cc68a136 4#include <stdio.h>\r
5#include <stdlib.h>\r
6#include <string.h>\r
7#include <unistd.h>\r
8#include <sys/mman.h>\r
9#include <sys/ioctl.h>\r
10#include <fcntl.h>\r
11#include <errno.h>\r
12\r
42c7b147 13#include "code940/940shared.h"\r
cc68a136 14#include "gp2x.h"\r
15#include "emu.h"\r
16#include "menu.h"\r
da42200b 17#include "../common/mp3.h"\r
e5f426aa 18#include "../common/arm_utils.h"\r
19#include "../common/menu.h"\r
ea8c405f 20#include "../common/emu.h"\r
cb0316e4 21#include "../../Pico/PicoInt.h"\r
5f8c85be 22#include "../../Pico/sound/ym2612.h"\r
4f265db7 23#include "../../Pico/sound/mix.h"\r
24\r
cc68a136 25/* we will need some gp2x internals here */\r
26extern volatile unsigned short *gp2x_memregs; /* from minimal library rlyeh */\r
27extern volatile unsigned long *gp2x_memregl;\r
28\r
00bd648e 29extern int reset_timing;\r
cc68a136 30static unsigned char *shared_mem = 0;\r
31static _940_data_t *shared_data = 0;\r
abe0ea43 32_940_ctl_t *shared_ctl = 0;\r
33unsigned char *mp3_mem = 0;\r
cb0316e4 34\r
e362c573 35#define MP3_SIZE_MAX (0x400000 + 0x800000) // 12M\r
8f8fe01e 36#define CODE940_FILE "pico940_v2.bin"\r
cc68a136 37\r
38int crashed_940 = 0;\r
39\r
51a902ae 40static FILE *loaded_mp3 = 0;\r
cc68a136 41\r
42/***********************************************************/\r
43\r
#define MAXOUT (+32767)
#define MINOUT (-32768)

/*
 * limiter: clamp the lvalue `val` into the range [min, max], in place.
 *
 * Wrapped in do { } while (0) so that "Limit(x, a, b);" is a single statement
 * and can be used as the body of an if/else; every argument is parenthesized
 * so compound expressions can be passed. Arguments are still evaluated more
 * than once, so they must not have side effects.
 */
#define Limit(val, max, min) do { \
	if ((val) > (max)) (val) = (max); \
	else if ((val) < (min)) (val) = (min); \
} while (0)
52\r
53/* these will be managed locally on our side */\r
cc68a136 54static UINT8 ST_address; /* address register */\r
4b9c5888 55static INT32 addr_A1; /* address line A1 */\r
cc68a136 56\r
57static int writebuff_ptr = 0;\r
58\r
59\r
cc68a136 60/* YM2612 write */\r
61/* a = address */\r
62/* v = value */\r
63/* returns 1 if sample affecting state changed */\r
4b9c5888 64int YM2612Write_940(unsigned int a, unsigned int v, int scanline)\r
cc68a136 65{\r
2433f409 66 int upd = 1; /* the write affects sample generation */\r
cc68a136 67\r
cc68a136 68 a &= 3;\r
69\r
2433f409 70 //printf("%05i:%03i: ym w ([%i] %02x)\n", Pico.m.frame_count, Pico.m.scanline, a, v);\r
71\r
4b9c5888 72 switch (a) {\r
73 case 0: /* address port 0 */\r
74 if (addr_A1 == 0 && ST_address == v)\r
75 return 0; /* address already selected, don't send this command to 940 */\r
76 ST_address = v;\r
77 addr_A1 = 0;\r
78 /* don't send DAC or timer related address changes to 940 */\r
79 if (v == 0x24 || v == 0x25 || v == 0x26 || v == 0x2a)\r
4ff2d527 80 return 0;\r
4b9c5888 81 upd = 0;\r
82 break;\r
cc68a136 83\r
4b9c5888 84 case 1: /* data port 0 */\r
85 if (ST_address == 0x2b) upd = 0; /* DAC sel */\r
86 break;\r
cc68a136 87\r
4b9c5888 88 case 2: /* address port 1 */\r
89 if (addr_A1 == 1 && ST_address == v)\r
cc68a136 90 return 0;\r
4b9c5888 91 ST_address = v;\r
92 addr_A1 = 1;\r
93 upd = 0;\r
cc68a136 94 break;\r
cc68a136 95 }\r
96\r
2433f409 97 //printf("ym pass\n");\r
98\r
4b9c5888 99 if (currentConfig.EmuOpt & 4)\r
100 {\r
2433f409 101 UINT16 *writebuff = shared_ctl->writebuffsel ? shared_ctl->writebuff0 : shared_ctl->writebuff1;\r
102\r
103 /* detect rapid ym updates */\r
4b9c5888 104 if (upd && !(writebuff_ptr & 0x80000000) && scanline < 224)\r
105 {\r
2433f409 106 int mid = Pico.m.pal ? 68 : 93;\r
4b9c5888 107 if (scanline > mid) {\r
108 //printf("%05i:%03i: rapid ym\n", Pico.m.frame_count, scanline);\r
2433f409 109 writebuff[writebuff_ptr++ & 0xffff] = 0xfffe;\r
110 writebuff_ptr |= 0x80000000;\r
4b9c5888 111 //printf("%05i:%03i: ym w ([%02x] %02x, upd=%i)\n", Pico.m.frame_count, scanline, addr, v, upd);\r
cc68a136 112 }\r
2433f409 113 }\r
114\r
115 /* queue this write for 940 */\r
116 if ((writebuff_ptr&0xffff) < 2047) {\r
117 writebuff[writebuff_ptr++ & 0xffff] = (a<<8)|v;\r
cc68a136 118 } else {\r
4ff2d527 119 printf("warning: writebuff_ptr > 2047 ([%i] %02x)\n", a, v);\r
cc68a136 120 }\r
121 }\r
122\r
123 return 0; // cause the engine to do updates once per frame only\r
124}\r
125\r
cc68a136 126\r
/*
 * Non-zero while the bit for `job` (1-based) is still set in the DUALCPU
 * pending-flags register at 0x3b46. The argument is parenthesized so that
 * any expression can be passed as the job number.
 */
#define CHECK_BUSY(job) \
	(gp2x_memregs[0x3b46>>1] & (1<<((job)-1)))
129\r
130static void wait_busy_940(int job)\r
cc68a136 131{\r
132 int i;\r
cc68a136 133\r
abe0ea43 134 job--;\r
135 for (i = 0; (gp2x_memregs[0x3b46>>1] & (1<<job)) && i < 0x10000; i++)\r
42c7b147 136 spend_cycles(8*1024); // tested to be best for mp3 dec\r
cc68a136 137 if (i < 0x10000) return;\r
138\r
139 /* 940 crashed */\r
42c7b147 140 printf("940 crashed (cnt: %i, ve: ", shared_ctl->loopc);\r
cc68a136 141 for (i = 0; i < 8; i++)\r
142 printf("%i ", shared_ctl->vstarts[i]);\r
143 printf(")\n");\r
abe0ea43 144 printf("irq pending flags: DUALCPU %04x, SRCPND %08lx (see 26), INTPND %08lx\n",\r
4f265db7 145 gp2x_memregs[0x3b46>>1], gp2x_memregl[0x4500>>2], gp2x_memregl[0x4510>>2]);\r
abe0ea43 146 printf("last lr: %08x, lastjob: %i\n", shared_ctl->last_lr, shared_ctl->lastjob);\r
4f265db7 147 printf("trying to interrupt..\n");\r
148 gp2x_memregs[0x3B3E>>1] = 0xffff;\r
abe0ea43 149 for (i = 0; gp2x_memregs[0x3b46>>1] && i < 0x10000; i++)\r
4f265db7 150 spend_cycles(8*1024);\r
151 printf("i = 0x%x\n", i);\r
abe0ea43 152 printf("irq pending flags: DUALCPU %04x, SRCPND %08lx (see 26), INTPND %08lx\n",\r
4f265db7 153 gp2x_memregs[0x3b46>>1], gp2x_memregl[0x4500>>2], gp2x_memregl[0x4510>>2]);\r
abe0ea43 154 printf("last lr: %08x, lastjob: %i\n", shared_ctl->last_lr, shared_ctl->lastjob);\r
4f265db7 155\r
6cadc2da 156 strcpy(menuErrorMsg, "940 crashed, too much overclock?");\r
cc68a136 157 engineState = PGS_Menu;\r
158 crashed_940 = 1;\r
cc68a136 159}\r
160\r
161\r
abe0ea43 162static void add_job_940(int job)\r
cc68a136 163{\r
abe0ea43 164 if (job <= 0 || job > 16) {\r
165 printf("add_job_940: bad job: %i\n", job);\r
166 return;\r
4f265db7 167 }\r
abe0ea43 168\r
169 // generate interrupt for this job\r
170 job--;\r
171 gp2x_memregs[(0x3B20+job*2)>>1] = 1;\r
172\r
173// printf("added %i, pending %04x\n", job+1, gp2x_memregs[0x3b46>>1]);\r
cc68a136 174}\r
175\r
176\r
177void YM2612PicoStateLoad_940(void)\r
178{\r
4b9c5888 179 UINT8 *REGS = YM2612GetRegs();\r
180\r
d5d11924 181 /* make sure JOB940_PICOSTATELOAD gets done before next JOB940_YM2612UPDATEONE */\r
182 add_job_940(JOB940_PICOSTATELOAD);\r
183 if (CHECK_BUSY(JOB940_PICOSTATELOAD)) wait_busy_940(JOB940_PICOSTATELOAD);\r
184\r
185 writebuff_ptr = 0;\r
4b9c5888 186 addr_A1 = *(INT32 *) (REGS + 0x200);\r
cc68a136 187}\r
188\r
189\r
190static void internal_reset(void)\r
191{\r
192 writebuff_ptr = 0;\r
4b9c5888 193 ST_address = addr_A1 = -1;\r
cc68a136 194}\r
195\r
196\r
f80d67e1 197/* this must be called after mmu hack, the allocated regions must not get cached */\r
198void sharedmem_init(void)\r
199{\r
200 if (shared_mem != NULL) return;\r
201\r
202 shared_mem = (unsigned char *) mmap(0, 0x210000, PROT_READ|PROT_WRITE, MAP_SHARED, memdev, 0x2000000);\r
203 if(shared_mem == MAP_FAILED)\r
204 {\r
205 printf("mmap(shared_data) failed with %i\n", errno);\r
206 exit(1);\r
207 }\r
208 shared_data = (_940_data_t *) (shared_mem+0x100000);\r
209 /* this area must not get buffered on either side */\r
210 shared_ctl = (_940_ctl_t *) (shared_mem+0x200000);\r
e362c573 211 mp3_mem = (unsigned char *) mmap(0, MP3_SIZE_MAX, PROT_READ|PROT_WRITE, MAP_SHARED, memdev, 0x2400000);\r
f80d67e1 212 if (mp3_mem == MAP_FAILED)\r
213 {\r
214 printf("mmap(mp3_mem) failed with %i\n", errno);\r
215 exit(1);\r
216 }\r
217 crashed_940 = 1;\r
218}\r
219\r
220\r
85f8e929 221void sharedmem_deinit(void)\r
222{\r
223 munmap(shared_mem, 0x210000);\r
224 munmap(mp3_mem, MP3_SIZE_MAX);\r
225 shared_mem = mp3_mem = NULL;\r
226 shared_data = NULL;\r
227 shared_ctl = NULL;\r
228}\r
229\r
230\r
cc68a136 231extern char **g_argv;\r
232\r
233/* none of the functions in this file should be called before this one */\r
234void YM2612Init_940(int baseclock, int rate)\r
235{\r
236 printf("YM2612Init_940()\n");\r
b837b69b 237 printf("Mem usage: shared_data: %i, shared_ctl: %i\n", sizeof(*shared_data), sizeof(*shared_ctl));\r
cc68a136 238\r
b837b69b 239 Reset940(1, 2);\r
cc68a136 240 Pause940(1);\r
241\r
4f265db7 242 gp2x_memregs[0x3B40>>1] = 0; // disable DUALCPU interrupts for 920\r
243 gp2x_memregs[0x3B42>>1] = 1; // enable DUALCPU interrupts for 940\r
cc68a136 244\r
abe0ea43 245 gp2x_memregl[0x4504>>2] = 0; // make sure no FIQs will be generated\r
246 gp2x_memregl[0x4508>>2] = ~(1<<26); // unmask DUALCPU ints in the undocumented 940's interrupt controller\r
247\r
248\r
cc68a136 249 if (crashed_940)\r
250 {\r
251 unsigned char ucData[1024];\r
252 int nRead, i, nLen = 0;\r
253 char binpath[1024];\r
254 FILE *fp;\r
255\r
256 strncpy(binpath, g_argv[0], 1023);\r
257 binpath[1023] = 0;\r
258 for (i = strlen(binpath); i > 0; i--)\r
259 if (binpath[i] == '/') { binpath[i] = 0; break; }\r
d524c827 260 strcat(binpath, "/" CODE940_FILE);\r
cc68a136 261\r
262 fp = fopen(binpath, "rb");\r
263 if(!fp)\r
264 {\r
a12e0116 265 memset(gp2x_screen, 0, 320*240*2);\r
266 text_out16(10, 100, "failed to open required file:");\r
267 text_out16(10, 110, CODE940_FILE);\r
268 gp2x_video_flip2();\r
cc68a136 269 printf("failed to open %s\n", binpath);\r
270 exit(1);\r
271 }\r
272\r
273 while(1)\r
274 {\r
275 nRead = fread(ucData, 1, 1024, fp);\r
276 if(nRead <= 0)\r
277 break;\r
278 memcpy(shared_mem + nLen, ucData, nRead);\r
279 nLen += nRead;\r
280 }\r
281 fclose(fp);\r
282 crashed_940 = 0;\r
283 }\r
284\r
285 memset(shared_data, 0, sizeof(*shared_data));\r
286 memset(shared_ctl, 0, sizeof(*shared_ctl));\r
287\r
5f8c85be 288 /* cause local ym2612 to init REGS */\r
289 YM2612Init_(baseclock, rate);\r
290\r
cc68a136 291 internal_reset();\r
292\r
51a902ae 293 loaded_mp3 = 0;\r
294\r
4f265db7 295 gp2x_memregs[0x3B46>>1] = 0xffff; // clear pending DUALCPU interrupts for 940\r
abe0ea43 296 gp2x_memregl[0x4500>>2] = 0xffffffff; // clear pending IRQs in SRCPND\r
297 gp2x_memregl[0x4510>>2] = 0xffffffff; // clear pending IRQs in INTPND\r
cc68a136 298\r
299 /* start the 940 */\r
b837b69b 300 Reset940(0, 2);\r
cc68a136 301 Pause940(0);\r
302\r
303 // YM2612ResetChip_940(); // will be done on JOB940_YM2612INIT\r
abe0ea43 304\r
305 /* now cause 940 to init it's ym2612 stuff */\r
306 shared_ctl->baseclock = baseclock;\r
307 shared_ctl->rate = rate;\r
308 add_job_940(JOB940_INITALL);\r
cc68a136 309}\r
310\r
311\r
312void YM2612ResetChip_940(void)\r
313{\r
daec7253 314 //printf("YM2612ResetChip_940()\n");\r
cc68a136 315 if (shared_data == NULL) {\r
316 printf("YM2612ResetChip_940: reset before init?\n");\r
317 return;\r
318 }\r
319\r
4b9c5888 320 YM2612ResetChip_();\r
cc68a136 321 internal_reset();\r
322\r
abe0ea43 323 add_job_940(JOB940_YM2612RESETCHIP);\r
cc68a136 324}\r
325\r
326\r
abe0ea43 327int YM2612UpdateOne_940(int *buffer, int length, int stereo, int is_buf_empty)\r
cb0316e4 328{\r
abe0ea43 329 int *ym_buf = shared_data->ym_buffer;\r
85f8e929 330 int ym_active_chs;\r
4f265db7 331\r
abe0ea43 332 //printf("YM2612UpdateOne_940()\n");\r
333\r
334 if (CHECK_BUSY(JOB940_YM2612UPDATEONE)) wait_busy_940(JOB940_YM2612UPDATEONE);\r
335\r
85f8e929 336 ym_active_chs = shared_ctl->ym_active_chs;\r
abe0ea43 337\r
85f8e929 338 // mix in ym buffer. is_buf_empty means nobody mixed there anything yet and it may contain trash\r
339 if (is_buf_empty && ym_active_chs) memcpy32(buffer, ym_buf, length<<stereo);\r
340 else memset32(buffer, 0, length<<stereo);\r
abe0ea43 341\r
342 if (shared_ctl->writebuffsel == 1) {\r
2433f409 343 shared_ctl->writebuff0[writebuff_ptr & 0xffff] = 0xffff;\r
4f265db7 344 } else {\r
2433f409 345 shared_ctl->writebuff1[writebuff_ptr & 0xffff] = 0xffff;\r
cb0316e4 346 }\r
abe0ea43 347 writebuff_ptr = 0;\r
348\r
349 /* predict sample counter for next frame */\r
350 if (PsndLen_exc_add) {\r
351 if (PsndLen_exc_cnt + PsndLen_exc_add >= 0x10000) length = PsndLen + 1;\r
352 else length = PsndLen;\r
353 }\r
354\r
355 /* give 940 ym job */\r
356 shared_ctl->writebuffsel ^= 1;\r
357 shared_ctl->length = length;\r
358 shared_ctl->stereo = stereo;\r
359\r
360 add_job_940(JOB940_YM2612UPDATEONE);\r
361\r
85f8e929 362 return ym_active_chs;\r
cb0316e4 363}\r
cb0316e4 364\r
cb0316e4 365\r
/* mp3 playback bookkeeping, all reset by mp3_start_play() */
static int mp3_samples_ready = 0; /* decoded samples not yet mixed */
static int mp3_buffer_offs = 0;   /* read offset (in samples) into the buffer being played */
static int mp3_play_bufsel = 0;   /* which of the two shared mp3 buffers is being played */
static int mp3_job_started = 0;   /* non-zero while a decode job's output is not yet accounted for */
cb0316e4 368\r
abe0ea43 369void mp3_update(int *buffer, int length, int stereo)\r
cc68a136 370{\r
abe0ea43 371 int length_mp3;\r
372 int cdda_on;\r
4f265db7 373\r
da42200b 374 // playback was started, track not ended\r
375 cdda_on = loaded_mp3 && shared_ctl->mp3_offs < shared_ctl->mp3_len;\r
cc68a136 376\r
abe0ea43 377 if (!cdda_on) return;\r
cc68a136 378\r
abe0ea43 379 if (!(PicoOpt&0x200)) {\r
380 mp3_update_local(buffer, length, stereo);\r
381 return;\r
382 }\r
cc68a136 383\r
abe0ea43 384 length_mp3 = length;\r
385 if (PsndRate == 22050) length_mp3 <<= 1; // mp3s are locked to 44100Hz stereo\r
386 else if (PsndRate == 11025) length_mp3 <<= 2; // so make length 44100ish\r
4f265db7 387\r
abe0ea43 388 /* do we have to wait? */\r
389 if (mp3_job_started && mp3_samples_ready < length_mp3) {\r
390 if (CHECK_BUSY(JOB940_MP3DECODE)) wait_busy_940(JOB940_MP3DECODE);\r
391 mp3_job_started = 0;\r
392 mp3_samples_ready += 1152;\r
393 }\r
cb0316e4 394\r
4f265db7 395 /* mix mp3 data, only stereo */\r
abe0ea43 396 if (mp3_samples_ready >= length_mp3)\r
cb0316e4 397 {\r
4f265db7 398 int shr = 0;\r
399 void (*mix_samples)(int *dest_buf, short *mp3_buf, int count) = mix_16h_to_32;\r
400 if (PsndRate == 22050) { mix_samples = mix_16h_to_32_s1; shr = 1; }\r
401 else if (PsndRate == 11025) { mix_samples = mix_16h_to_32_s2; shr = 2; }\r
cb0316e4 402\r
4f265db7 403 if (1152 - mp3_buffer_offs >= length_mp3) {\r
abe0ea43 404 mix_samples(buffer, shared_data->mp3_buffer[mp3_play_bufsel] + mp3_buffer_offs*2, length<<1);\r
4f265db7 405\r
406 mp3_buffer_offs += length_mp3;\r
cb0316e4 407 } else {\r
abe0ea43 408 // collect samples from both buffers..\r
cb0316e4 409 int left = 1152 - mp3_buffer_offs;\r
4f265db7 410 if (mp3_play_bufsel == 0)\r
411 {\r
abe0ea43 412 mix_samples(buffer, shared_data->mp3_buffer[0] + mp3_buffer_offs*2, length<<1);\r
4f265db7 413 mp3_buffer_offs = length_mp3 - left;\r
414 mp3_play_bufsel = 1;\r
415 } else {\r
416 mix_samples(buffer, shared_data->mp3_buffer[1] + mp3_buffer_offs*2, (left>>shr)<<1);\r
417 mp3_buffer_offs = length_mp3 - left;\r
418 mix_samples(buffer + ((left>>shr)<<1),\r
419 shared_data->mp3_buffer[0], (mp3_buffer_offs>>shr)<<1);\r
420 mp3_play_bufsel = 0;\r
421 }\r
cc68a136 422 }\r
4f265db7 423 mp3_samples_ready -= length_mp3;\r
cc68a136 424 }\r
425\r
abe0ea43 426 // ask to decode more if we already can\r
427 if (!mp3_job_started)\r
cb0316e4 428 {\r
abe0ea43 429 mp3_job_started = 1;\r
cb0316e4 430 shared_ctl->mp3_buffsel ^= 1;\r
abe0ea43 431 add_job_940(JOB940_MP3DECODE);\r
cb0316e4 432 }\r
cc68a136 433}\r
cb0316e4 434\r
435\r
436/***********************************************************/\r
437\r
438void mp3_start_play(FILE *f, int pos) // pos is 0-1023\r
439{\r
440 int byte_offs = 0;\r
441\r
1cd356a3 442 if (!(PicoOpt&0x800)) { // cdda disabled?\r
cb0316e4 443 return;\r
444 }\r
445\r
446 if (loaded_mp3 != f)\r
447 {\r
66fdc0f0 448 if (PicoMessage != NULL)\r
449 {\r
450 fseek(f, 0, SEEK_END);\r
451 if (ftell(f) > 2*1024*1024)\r
452 PicoMessage("Loading MP3...");\r
453 }\r
cb0316e4 454 fseek(f, 0, SEEK_SET);\r
455 fread(mp3_mem, 1, MP3_SIZE_MAX, f);\r
e362c573 456 if (!feof(f)) printf("Warning: mp3 was too large, not all data loaded.\n");\r
cb0316e4 457 shared_ctl->mp3_len = ftell(f);\r
458 loaded_mp3 = f;\r
abe0ea43 459\r
460 if (PicoOpt&0x200) {\r
461 // as we are going to change 940's cacheable area, we must invalidate it's cache..\r
462 if (CHECK_BUSY(JOB940_MP3DECODE)) wait_busy_940(JOB940_MP3DECODE);\r
463 add_job_940(JOB940_INVALIDATE_DCACHE);\r
464 }\r
00bd648e 465 reset_timing = 1;\r
cb0316e4 466 }\r
467\r
468 // seek..\r
469 if (pos) {\r
470 byte_offs = (shared_ctl->mp3_len << 6) >> 10;\r
471 byte_offs *= pos;\r
472 byte_offs >>= 6;\r
473 }\r
4f265db7 474 // printf("mp3 pos1024: %i, byte_offs %i/%i\n", pos, byte_offs, shared_ctl->mp3_len);\r
cb0316e4 475\r
476 shared_ctl->mp3_offs = byte_offs;\r
51a902ae 477\r
abe0ea43 478 // reset buffer pointers and stuff..\r
51a902ae 479 mp3_samples_ready = mp3_buffer_offs = mp3_play_bufsel = 0;\r
abe0ea43 480 mp3_job_started = 0;\r
51a902ae 481 shared_ctl->mp3_buffsel = 1; // will change to 0 on first decode\r
abe0ea43 482\r
483 if (!(PicoOpt&0x200)) mp3_start_local();\r
cb0316e4 484}\r
485\r
486\r
75736070 487int mp3_get_offset(void)\r
488{\r
da42200b 489 unsigned int offs1024 = 0;\r
75736070 490 int cdda_on;\r
491\r
602133e1 492 cdda_on = (PicoAHW & PAHW_MCD) && (PicoOpt&0x800) && !(Pico_mcd->s68k_regs[0x36] & 1) &&\r
abe0ea43 493 (Pico_mcd->scd.Status_CDC & 1) && loaded_mp3;\r
75736070 494\r
495 if (cdda_on) {\r
496 offs1024 = shared_ctl->mp3_offs << 7;\r
da42200b 497 offs1024 /= shared_ctl->mp3_len >> 3;\r
75736070 498 }\r
da42200b 499 printf("offs1024=%u (%i/%i)\n", offs1024, shared_ctl->mp3_offs, shared_ctl->mp3_len);\r
75736070 500\r
501 return offs1024;\r
502}\r
503\r
504\r