some conditional op emulation
[ginge.git] / loader / emu.c
... / ...
CommitLineData
1/*
2 * GINGE - GINGE Is Not Gp2x Emulator
3 * (C) notaz, 2010-2011,2016
4 *
5 * This work is licensed under the MAME license, see COPYING file for details.
6 */
7// a "gentle" reminder
8#ifdef __ARM_EABI__
9#error loader is meant to be OABI!
10#endif
11#include <stdio.h>
12#include <stdlib.h>
13#include <string.h>
14#include <alloca.h>
15#include <ctype.h>
16#include <sys/types.h>
17#include <sys/stat.h>
18#include <fcntl.h>
19#include <sys/mman.h>
20#include <sys/types.h>
21#include <unistd.h>
22#include <signal.h>
23#include <asm/ucontext.h>
24#include <pthread.h>
25#include <errno.h>
26#include <time.h>
27#include <sys/resource.h>
28#include <sys/ioctl.h>
29#include <linux/soundcard.h>
30#include <linux/fb.h>
31
32#include "header.h"
33#include "../common/host_fb.h"
34#include "../common/cmn.h"
35#include "sys_cacheflush.h"
36#include "realfuncs.h"
37
38#if (DBG & 2) && !(DBG & 4)
39#define LOG_IO_UNK
40#endif
41#if (DBG & 4)
42#define LOG_IO
43#endif
44//#define LOG_SEGV
45
46#ifdef LOG_IO
47#define iolog log_io
48#else
49#define iolog(...)
50#endif
51
52#ifdef LOG_IO_UNK
53#define iolog_unh log_io
54#else
55#define iolog_unh(...)
56#endif
57
58#ifdef LOG_SEGV
59#define segvlog printf
60#else
61#define segvlog(...)
62#endif
63
64#if defined(LOG_IO) || defined(LOG_IO_UNK)
65#include "mmsp2-regs.h"
66#endif
67
68typedef unsigned long long u64;
69typedef unsigned int u32;
70typedef unsigned short u16;
71typedef unsigned char u8;
72
73static pthread_mutex_t fb_mutex = PTHREAD_MUTEX_INITIALIZER;
74static pthread_cond_t fb_cond = PTHREAD_COND_INITIALIZER;
75
/*
 * Shadow copy of the emulated blitter registers.
 * xread32()/xwrite32() treat this struct as an array of 16 u32 values
 * starting at dstctrl and index it with (register offset / 4), so the
 * order and size of the fields must not be changed.
 */
static struct {
  u32 dstctrl;      // 0x00: low bits are merged into the dst address, bit 5 selects 16bpp
  u32 dstaddr;      // 0x04
  u32 dststride;    // 0x08
  u32 srcctrl;      // 0x0c: see the SRCCTRL_* bits
  u32 srcaddr;      // 0x10
  u32 srcstride;    // 0x14
  u32 srcforcolor;  // 0x18
  u32 srcbackcolor; // 0x1c
  u32 patctrl;      // 0x20
  u32 patforcolor;  // 0x24
  u32 patbackcolor; // 0x28: low 16 bits are used as the fill color
  u32 size;         // 0x2c: width in bits 0-10, height in bits 16-26
  u32 ctrl;         // 0x30: CTRL_TRANSPARENCYENB, transparent color in the upper 16 bits
  u32 run;          // 0x34: writing bit 0 starts the blit, always reads back as 0
  u32 intc;         // 0x38
  u32 srcfifo;      // 0x3c
} blitter;
94
95#define SRCCTRL_INVIDEO (1 << 8)
96#define SRCCTRL_SRCENB (1 << 7)
97#define CTRL_TRANSPARENCYENB (1 << 11)
98
/*
 * Emulated display controller / input state, shared by the MMSP2 (GP2X)
 * and Pollux (Wiz) register handlers.
 */
static struct {
  // mmsp2
  u16 mlc_stl_cntl;
  union {
    u32 mlc_stl_adr; // mlcaddress for pollux
    // 16bit halves of the same address, as written through xwrite16()
    struct {
      u16 mlc_stl_adrl;
      u16 mlc_stl_adrh;
    };
  };
  u16 mlc_stl_pallt_a; // palette write index, kept within 0..0x1ff
  union {
    u16 mlc_stl_pallt_d[256*2];  // written 16 bits at a time
    u32 mlc_stl_pallt_d32[256];  // same data, handed to the host as 32bit entries
  };

  // pollux
  u32 mlccontrol;
  u16 mlcpalette[256]; // indexed by the top byte of the written word

  // state
  void *umem;          // host mapping backing the 0x02000000..0x03ffffff range
  u32 old_mlc_stl_adr; // last address seen, used to detect flips
  u32 btn_state; // as seen through /dev/GPIO: 0PVdVu YXBA RLSeSt 0Ri0Dn 0Le0Up
  struct {
    u32 width, height;
    u32 stride;
    u32 bpp;
    u32 dirty_pal:2;   // one of DIRTY_PAL_*, 0 when the host palette is current
  } v;
} mmsp2;
#define pollux mmsp2 // so that code doesn't look that weird
// values for mmsp2.v.dirty_pal: which palette copy has to be sent to the host
enum {
  DIRTY_PAL_MMSP2 = 1,
  DIRTY_PAL_POLLUX = 2,
};
135
136
137#if defined(LOG_IO) || defined(LOG_IO_UNK)
138static void log_io(const char *pfx, u32 a, u32 d, int size)
139{
140 const char *fmt, *reg = "";
141 switch (size) {
142 case 8: fmt = "%s %08x %02x %s\n"; d &= 0xff; break;
143 case 32: fmt = "%s %08x %08x %s\n"; break;
144 default: fmt = "%s %08x %04x %s\n"; d &= 0xffff; break;
145 }
146
147 if ((a & ~0xffff) == 0x7f000000)
148 reg = regnames[a & 0xffff];
149
150 printf(fmt, pfx, a, d, reg);
151}
152#endif
153
/*
 * Fill count 16bit units at dst with the low 16 bits of pattern.
 * dst is rounded down to a 2 byte boundary; the bulk of the fill is done
 * with 32bit stores once the pointer is 4 byte aligned.
 * Nothing is written when count is zero or negative.
 */
static void memset16(void *dst, u32 pattern, int count)
{
  u16 *d = (u16 *)((long)dst & ~1);
  u32 *dl;

  // without this a misaligned dst with count <= 0 would still get
  // a leading and a trailing halfword written
  if (count <= 0)
    return;

  // keep stray upper bits out of the doubled 32bit pattern
  pattern &= 0xffff;

  if ((long)d & 2) {
    // leading halfword to reach 32bit alignment
    *d++ = pattern;
    count--;
  }
  dl = (void *)d;
  pattern |= pattern << 16;

  for (; count >= 2; count -= 2)
    *dl++ = pattern;

  // odd halfword left over at the end
  if (count > 0)
    *(u16 *)dl = pattern;
}
174
/*
 * Copy w 16bit pixels from src to dst, skipping every pixel that equals
 * the transparent color trc. Both pointers are rounded down to a 2 byte
 * boundary first.
 */
static void blt_tr(void *dst, void *src, u32 trc, int w)
{
  u16 *out = (u16 *)((long)dst & ~1);
  u16 *in = (u16 *)((long)src & ~1);
  int x;

  // XXX: optimize
  for (x = 0; x < w; x++) {
    u16 pix = in[x];

    if (pix != trc)
      out[x] = pix;
  }
}
185
// print all 16 blitter registers (starting at dstctrl), four per line
#define dump_blitter() \
do { \
  const u32 *reg_ = &blitter.dstctrl; \
  int n_; \
  for (n_ = 0; n_ < 4*4; n_++) { \
    printf("%08x ", reg_[n_]); \
    if ((n_ & 3) == 3) \
      printf("\n"); \
  } \
} while (0)
196
197static void *uppermem_lookup(u32 addr, u8 **mem_end)
198{
199 // XXX: maybe support mirroring?
200 if ((addr & 0xfe000000) != 0x02000000)
201 return NULL;
202
203 *mem_end = (u8 *)mmsp2.umem + 0x02000000;
204 return (u8 *)mmsp2.umem - 0x02000000 + addr;
205}
206
207static void blitter_do(void)
208{
209 u8 *dst, *dste, *src = NULL, *srce = NULL;
210 int w, h, sstrd, dstrd;
211 int to_screen = 0;
212 u32 bpp, addr;
213
214 w = blitter.size & 0x7ff;
215 h = (blitter.size >> 16) & 0x7ff;
216 sstrd = blitter.srcstride;
217 dstrd = blitter.dststride;
218
219 // XXX: need to confirm this..
220 addr = (blitter.dstaddr & ~3) | ((blitter.dstctrl & 0x1f) >> 3);
221
222 // use dst bpp.. How does it do blits with different src bpp?
223 bpp = (blitter.dstctrl & 0x20) ? 16 : 8;
224
225 // maybe the screen?
226 if (((w == 320 && h == 240) || // blit whole screen
227 (w * h >= 320*240/2)) && // ..or at least half of the area
228 mmsp2.mlc_stl_adr <= addr && addr < mmsp2.mlc_stl_adr + 320*240*2)
229 to_screen = 1;
230
231 dst = uppermem_lookup(addr, &dste);
232
233 // XXX: assume fill if no SRCENB, but it could be pattern blit..
234 if (blitter.srcctrl & SRCCTRL_SRCENB) {
235 if (!(blitter.srcctrl & SRCCTRL_INVIDEO))
236 goto bad_blit;
237
238 addr = (blitter.srcaddr & ~3) | ((blitter.srcctrl & 0x1f) >> 3);
239 src = uppermem_lookup(addr, &srce);
240 if (src == NULL)
241 goto bad_blit;
242
243 if (src + sstrd * h > srce) {
244 err("blit %08x->%08x %dx%d did not fit src\n",
245 blitter.srcaddr, blitter.dstaddr, w, h);
246 h = (srce - src) / sstrd;
247 }
248 }
249
250 if (dst == NULL)
251 goto bad_blit;
252
253 if (dst + dstrd * h > dste) {
254 err("blit %08x->%08x %dx%d did not fit dst\n",
255 blitter.srcaddr, blitter.dstaddr, w, h);
256 h = (dste - dst) / dstrd;
257 }
258
259 if (src != NULL) {
260 // copy
261 if (bpp == 16 && (blitter.ctrl & CTRL_TRANSPARENCYENB)) {
262 u32 trc = blitter.ctrl >> 16;
263 for (; h > 0; h--, dst += dstrd, src += sstrd)
264 blt_tr(dst, src, trc, w);
265 }
266 else {
267 for (; h > 0; h--, dst += dstrd, src += sstrd)
268 memcpy(dst, src, w * bpp / 8);
269 }
270 }
271 else {
272 // fill. Assume the pattern is cleared and bg color is used
273 u32 bgc = blitter.patbackcolor & 0xffff;
274 if (bpp == 16) {
275 for (; h > 0; h--, dst += dstrd)
276 memset16(dst, bgc, w);
277 }
278 else {
279 for (; h > 0; h--, dst += dstrd)
280 memset(dst, bgc, w); // bgc?
281 }
282 }
283
284 if (to_screen)
285 pthread_cond_signal(&fb_cond);
286 return;
287
288bad_blit:
289 err("blit %08x->%08x %dx%d translated to %p->%p\n",
290 blitter.srcaddr, blitter.dstaddr, w, h, src, dst);
291 dump_blitter();
292}
293
294// FIXME: pass real dimensions to blitters
295static void mlc_flip(void *src, int bpp, int stride)
296{
297 static int old_bpp;
298
299 // only pass pal to host if it's dirty
300 if (bpp <= 8 && mmsp2.v.dirty_pal) {
301 if (mmsp2.v.dirty_pal == DIRTY_PAL_MMSP2)
302 host_video_update_pal32(mmsp2.mlc_stl_pallt_d32);
303 else
304 host_video_update_pal16(mmsp2.mlcpalette);
305 mmsp2.v.dirty_pal = 0;
306 }
307
308 if (bpp != old_bpp) {
309 host_video_change_bpp(bpp);
310 old_bpp = bpp;
311 }
312
313 switch (bpp) {
314 case 4:
315 host_video_blit4(src, 320, 240, stride);
316 break;
317
318 case 8:
319 host_video_blit8(src, 320, 240, stride);
320 break;
321
322 case 16:
323 host_video_blit16(src, 320, 240, stride);
324 break;
325
326 case 24:
327 // TODO
328 break;
329 }
330}
331
// advance a struct timespec by ns nanoseconds (ns must be below one second),
// carrying into tv_sec at most once
#define ts_add_nsec(ts, ns) do { \
  (ts).tv_nsec += (ns); \
  if ((ts).tv_nsec >= 1000000000) { \
    (ts).tv_sec++; \
    (ts).tv_nsec -= 1000000000; \
  } \
} while (0)
339
340static int fb_sync_thread_paused;
341
342static void *fb_sync_thread(void *arg)
343{
344 int invalid_fb_addr = 1;
345 int manual_refresh = 0;
346 int frame_counter = 0;
347 struct timespec ts;
348 int ret, wait_ret;
349
350 //ret = pthread_setschedprio(pthread_self(), -1);
351 //log("pthread_setschedprio %d\n", ret);
352 //ret = setpriority(PRIO_PROCESS, 0, -1);
353 //log("setpriority %d\n", ret);
354
355 ret = clock_gettime(CLOCK_REALTIME, &ts);
356 if (ret != 0) {
357 perror(PFX "clock_gettime");
358 exit(1);
359 }
360
361 while (1) {
362 u8 *gp2x_fb, *gp2x_fb_end;
363
364 ret = pthread_mutex_lock(&fb_mutex);
365 wait_ret = pthread_cond_timedwait(&fb_cond, &fb_mutex, &ts);
366 ret |= pthread_mutex_unlock(&fb_mutex);
367
368 if (ret != 0) {
369 err("fb_thread: mutex error: %d\n", ret);
370 sleep(1);
371 goto check_keys;
372 }
373 if (wait_ret != 0 && wait_ret != ETIMEDOUT) {
374 err("fb_thread: cond error: %d\n", wait_ret);
375 sleep(1);
376 goto check_keys;
377 }
378 if (fb_sync_thread_paused) {
379 ts_add_nsec(ts, 100000000);
380 goto check_keys;
381 }
382
383 if (wait_ret != ETIMEDOUT) {
384 clock_gettime(CLOCK_REALTIME, &ts);
385 ts_add_nsec(ts, 50000000);
386 manual_refresh++;
387 if (manual_refresh == 2)
388 dbg("fb_thread: switch to manual refresh\n");
389 } else {
390 ts_add_nsec(ts, 16666667);
391 if (manual_refresh > 1)
392 dbg("fb_thread: switch to auto refresh\n");
393 manual_refresh = 0;
394 }
395
396 gp2x_fb = uppermem_lookup(mmsp2.mlc_stl_adr, &gp2x_fb_end);
397 if (gp2x_fb == NULL || gp2x_fb + 320*240 * mmsp2.v.bpp / 8 > gp2x_fb_end) {
398 if (!invalid_fb_addr) {
399 err("fb_thread: %08x is out of range\n", mmsp2.mlc_stl_adr);
400 invalid_fb_addr = 1;
401 }
402 continue;
403 }
404
405 invalid_fb_addr = 0;
406 mlc_flip(gp2x_fb, mmsp2.v.bpp, mmsp2.v.stride);
407
408 frame_counter++;
409 if (frame_counter & 0x0f)
410 continue;
411
412check_keys:
413 // this is to check for kill key, in case main thread hung
414 // or something else went wrong.
415 pollux.btn_state = host_read_btns();
416 }
417}
418
419static void fb_thread_pause(void)
420{
421 fb_sync_thread_paused = 1;
422 // wait until it finishes last refresh
423 // that it might be doing now
424 usleep(10000);
425}
426
427static void fb_thread_resume(void)
428{
429 fb_sync_thread_paused = 0;
430}
431
432static u32 xread32_io_cmn(u32 a, u32 *handled)
433{
434 u32 d = 0;
435
436 *handled = 1;
437 switch (a) {
438 // Wiz stuff
439 case 0x402c: // MLCVSTRIDE0
440 case 0x4060: // MLCVSTRIDE1
441 d = pollux.v.stride;
442 break;
443 case 0x4038: // MLCADDRESS0
444 case 0x406c: // MLCADDRESS1
445 d = pollux.mlc_stl_adr;
446 break;
447 // wiz_lib reads:
448 // ???? ???? YXBA DURiLe ???? VdVuMS LR?? ????
449 // | GPIOC[31:16] | GPIOB[31:16] |
450 case 0xa058: // GPIOBPAD
451 d = (pollux.btn_state >> 1) & 0x0100;
452 d |= (pollux.btn_state << 1) & 0x0200;
453 d |= (pollux.btn_state >> 3) & 0x0080;
454 d |= (pollux.btn_state >> 5) & 0x0040;
455 d |= (pollux.btn_state >> 6) & 0x0c00;
456 d <<= 16;
457 d = ~d;
458 break;
459 case 0xa098: // GPIOCPAD
460 pollux.btn_state = host_read_btns();
461 d = (pollux.btn_state >> 8) & 0x00f0;
462 d |= (pollux.btn_state >> 1) & 0x0008;
463 d |= (pollux.btn_state << 2) & 0x0004;
464 d |= (pollux.btn_state >> 5) & 0x0002;
465 d |= (pollux.btn_state >> 2) & 0x0001;
466 d <<= 16;
467 d = ~d;
468 break;
469 default:
470 *handled = 0;
471 break;
472 }
473
474 return d;
475}
476
477static u32 xread8(u32 a)
478{
479 iolog("r8 ", a, 0, 8);
480 iolog_unh("r8 ", a, 0, 8);
481 return 0;
482}
483
484static u32 xread16(u32 a)
485{
486 static u32 fudge, old_a;
487 u32 d = 0, t;
488
489 if ((a & 0xffff0000) == 0x7f000000) {
490 u32 a_ = a & 0xffff;
491 switch (a_) {
492 case 0x0910: // FPLL
493 case 0x0912:
494 d = 0x9407;
495 break;
496 // minilib reads as:
497 // 0000 P000 VuVd00 0000 YXBA RLSeSt 0Ri0D 0Le0U
498 // | GPIOD |GPIOC[8:15]|GPIOM[0:7] |
499 // /dev/GPIO:
500 // ... 0PVdVu ...
501 case 0x1184: // GPIOC
502 d = ~mmsp2.btn_state & 0xff00;
503 d |= 0x00ff;
504 break;
505 case 0x1186: // GPIOD
506 t = ~mmsp2.btn_state;
507 d = (t >> 9) & 0x0080;
508 d |= (t >> 11) & 0x0040;
509 d |= (t >> 7) & 0x0800;
510 d |= 0x373b;
511 break;
512 case 0x1198: // GPIOM
513 mmsp2.btn_state = host_read_btns();
514 d = ~mmsp2.btn_state & 0xff;
515 d |= 0x01aa;
516 break;
517 case 0x1836: // reserved
518 d = 0x2330;
519 break;
520 case 0x2816: // DPC_X_MAX
521 d = 319;
522 break;
523 case 0x2818: // DPC_Y_MAX
524 d = 239;
525 break;
526 case 0x28da:
527 d = mmsp2.mlc_stl_cntl;
528 break;
529 case 0x290e:
530 case 0x2912:
531 d = mmsp2.mlc_stl_adrl;
532 break;
533 case 0x2910:
534 case 0x2914:
535 d = mmsp2.mlc_stl_adrh;
536 break;
537 case 0x2958:
538 d = mmsp2.mlc_stl_pallt_a;
539 break;
540
541 default:
542 d = xread32_io_cmn(a_, &t);
543 if (!t)
544 goto unk;
545 if (!(a_ & 2))
546 d >>= 16;
547 break;
548 }
549 goto out;
550 }
551
552unk:
553 if (a == old_a) {
554 d = fudge;
555 fudge = ~fudge;
556 }
557 old_a = a;
558 iolog_unh("r16", a, d & 0xffff, 16);
559
560out:
561 d &= 0xffff;
562 iolog("r16", a, d, 16);
563 return d;
564}
565
566static u32 xread32(u32 a)
567{
568 u32 d = 0;
569 if ((a & 0xfff00000) == 0x7f000000) {
570 u32 a_ = a & 0xffff;
571 struct timespec ts;
572 u64 t64;
573 u32 t;
574
575 switch (a_) {
576 case 0x0a00: // TCOUNT, 1/7372800s
577 clock_gettime(CLOCK_REALTIME, &ts);
578 t64 = (u64)ts.tv_sec * 1000000000 + ts.tv_nsec;
579 // t * 7372800.0 / 1000000000 * 0x100000000 ~= t * 31665935
580 t64 *= 31665935;
581 d = t64 >> 32;
582 break;
583
584 default:
585 d = xread32_io_cmn(a_, &t);
586 if (!t)
587 goto unh;
588 break;
589 }
590 goto out;
591 }
592 if ((a & 0xfff00000) == 0x7f100000) {
593 u32 *bl = &blitter.dstctrl;
594 u32 a_ = a & 0xfff;
595 if (a_ < 0x40) {
596 d = bl[a_ / 4];
597 if (a_ == 0x34)
598 d = 0; // not busy
599 goto out;
600 }
601 }
602
603unh:
604 iolog_unh("r32", a, d, 32);
605
606out:
607 iolog("r32", a, d, 32);
608 return d;
609}
610
611static void xwrite8(u32 a, u32 d)
612{
613 iolog("w8 ", a, d, 8);
614 iolog_unh("w8 ", a, d, 8);
615}
616
617static void xwrite16(u32 a, u32 d)
618{
619 iolog("w16", a, d, 16);
620 if ((a & 0xfff00000) == 0x7f000000) {
621 u32 a_ = a & 0xffff;
622 switch (a_) {
623 case 0x28da: {
624 int mode;
625 mmsp2.mlc_stl_cntl = d | 0xaa;
626 mode = (d >> 9) & 3;
627 mmsp2.v.bpp = mode ? mode * 8 : 4;
628 break;
629 }
630 case 0x290c:
631 mmsp2.v.stride = d;
632 return;
633 case 0x290e:
634 case 0x2910:
635 // odd addresses don't affect LCD. What about TV?
636 return;
637 case 0x2912:
638 mmsp2.mlc_stl_adrl = d;
639 return;
640 case 0x2914:
641 mmsp2.mlc_stl_adrh = d;
642 if (mmsp2.mlc_stl_adr != mmsp2.old_mlc_stl_adr)
643 // ask for refresh
644 pthread_cond_signal(&fb_cond);
645 mmsp2.old_mlc_stl_adr = mmsp2.mlc_stl_adr;
646 return;
647 case 0x2958:
648 mmsp2.mlc_stl_pallt_a = d & 0x1ff;
649 return;
650 case 0x295a:
651 mmsp2.mlc_stl_pallt_d[mmsp2.mlc_stl_pallt_a++] = d;
652 mmsp2.mlc_stl_pallt_a &= 0x1ff;
653 mmsp2.v.dirty_pal = DIRTY_PAL_MMSP2;
654 return;
655 }
656 }
657 iolog_unh("w16", a, d, 16);
658}
659
660static void xwrite32(u32 a, u32 d)
661{
662 iolog("w32", a, d, 32);
663
664 if ((a & 0xfff00000) == 0x7f000000) {
665 u32 a_ = a & 0xffff;
666 switch (a_) {
667 // Wiz
668 case 0x4024: // MLCCONTROL0
669 case 0x4058: // MLCCONTROL1
670 pollux.mlccontrol = d;
671 if (!(d & 0x20))
672 return; // layer not enabled
673 if ((d >> 16) == 0x443A)
674 pollux.v.bpp = 8;
675 else
676 pollux.v.bpp = 16;
677 return;
678 case 0x402c: // MLCVSTRIDE0
679 case 0x4060: // MLCVSTRIDE1
680 pollux.v.stride = d;
681 return;
682 case 0x4038: // MLCADDRESS0
683 case 0x406c: // MLCADDRESS1
684 pollux.mlc_stl_adr = d;
685 if (d != mmsp2.old_mlc_stl_adr)
686 // ask for refresh
687 pthread_cond_signal(&fb_cond);
688 mmsp2.old_mlc_stl_adr = d;
689 return;
690 case 0x403c: // MLCPALETTE0
691 case 0x4070: // MLCPALETTE1
692 pollux.mlcpalette[d >> 24] = d;
693 pollux.v.dirty_pal = DIRTY_PAL_POLLUX;
694 return;
695 }
696 }
697 if ((a & 0xfff00000) == 0x7f100000) {
698 u32 *bl = &blitter.dstctrl;
699 u32 a_ = a & 0xfff;
700 if (a_ < 0x40) {
701 bl[a_ / 4] = d;
702 if (a_ == 0x34 && (d & 1))
703 blitter_do();
704 return;
705 }
706 }
707 iolog_unh("w32", a, d, 32);
708}
709
710#define LINKPAGE_SIZE 0x1000
711#define LINKPAGE_COUNT 4
712#define LINKPAGE_ALLOC (LINKPAGE_SIZE * LINKPAGE_COUNT)
713
/*
 * Per-instruction record placed in the linkpage by segv_sigaction():
 * address and original encoding of the patched instruction, directly
 * followed by the generated trampoline code.
 */
struct op_context {
  u32 pc;
  u32 op;
  u32 code[0];
};

/*
 * Header of a linkpage: the handler pointer the generated code loads
 * pc-relative, followed by the op_context records of that page.
 */
struct op_linkpage {
  void (*handler)(struct op_context *op_ctx);
  u32 code[0];
};

/*
 * Register frame handed to emu_handle_op(): r0-r14 plus cpsr.
 * Note there is no slot for r15.
 */
struct op_stackframe {
  u32 saved_regs[15];
  u32 cpsr;
};
729
730static struct op_linkpage *g_linkpage;
731static u32 *g_code_ptr;
732static int g_linkpage_count;
733
// ARM condition field values (instruction bits 31:28), in encoding order
enum opcond {
  C_EQ, C_NE, C_CS, C_CC, C_MI, C_PL, C_VS, C_VC,
  C_HI, C_LS, C_GE, C_LT, C_GT, C_LE, C_AL,
};
// condition flag bits as they appear in cpsr
enum cpsr_cond {
  CPSR_N = (1u << 31),
  CPSR_Z = (1u << 30),
  CPSR_C = (1u << 29),
  CPSR_V = (1u << 28),
};
744
// non-zero if bit b of v is set; unsigned 1 keeps bit 31 well defined
#define BIT_SET(v, b) ((v) & (1u << (b)))
746
747void emu_handle_op(struct op_context *op_ctx, struct op_stackframe *sframe)
748{
749 u32 *regs = sframe->saved_regs;
750 u32 cpsr = sframe->cpsr;
751 u32 op = op_ctx->op;
752 u32 t, shift, ret, addr;
753 int i, rn, rd, cond;
754
755 cond = (op & 0xf0000000) >> 28;
756 rd = (op & 0x0000f000) >> 12;
757 rn = (op & 0x000f0000) >> 16;
758
759 if (cond != 0x0e) {
760 switch (cond) {
761 case C_EQ: if ( (cpsr & CPSR_Z)) break; return;
762 case C_NE: if (!(cpsr & CPSR_Z)) break; return;
763 case C_CS: if ( (cpsr & CPSR_C)) break; return;
764 case C_CC: if (!(cpsr & CPSR_C)) break; return;
765 case C_MI: if ( (cpsr & CPSR_N)) break; return;
766 case C_PL: if (!(cpsr & CPSR_N)) break; return;
767 case C_VS: if ( (cpsr & CPSR_V)) break; return;
768 case C_VC: if (!(cpsr & CPSR_V)) break; return;
769 default:
770 goto unhandled;
771 }
772 }
773
774 if ((op & 0x0f200090) == 0x01000090) { // AM3: LDRH, STRH
775 if (!BIT_SET(op, 5)) // !H
776 goto unhandled;
777 if (BIT_SET(op, 6) && !BIT_SET(op, 20)) // S && !L
778 goto unhandled;
779
780 if (BIT_SET(op, 22)) // imm offset
781 t = ((op & 0xf00) >> 4) | (op & 0x0f);
782 else // reg offset
783 t = regs[op & 0x000f];
784
785 if (!BIT_SET(op, 23))
786 t = -t;
787 addr = regs[rn] + t;
788
789 if (BIT_SET(op, 20)) { // Load
790 ret = xread16(addr);
791 if (BIT_SET(op, 6)) { // S
792 ret <<= 16;
793 ret = (signed int)ret >> 16;
794 }
795 regs[rd] = ret;
796 }
797 else
798 xwrite16(addr, regs[rd]);
799 }
800 else if ((op & 0x0c000000) == 0x04000000) { // load/store word/byte
801 if (BIT_SET(op, 21))
802 goto unhandled; // unprivileged
803 if (BIT_SET(op, 25)) { // reg offs
804 if (BIT_SET(op, 4))
805 goto unhandled; // nah it's media
806
807 t = regs[op & 0x000f];
808 shift = (op & 0x0f80) >> 7;
809 switch ((op & 0x0060) >> 5) {
810 case 0: t = t << shift; break;
811 case 1: t = t >> (shift + 1); break;
812 case 2: t = (signed int)t >> (shift + 1); break;
813 case 3: goto unhandled; // I'm just lazy
814 }
815 }
816 else // imm offs
817 t = op & 0x0fff;
818
819 if (!BIT_SET(op, 23))
820 t = -t;
821
822 addr = regs[rn];
823 if (BIT_SET(op, 24)) // pre-indexed
824 addr += t;
825 if (!BIT_SET(op, 24) || BIT_SET(op, 21))
826 regs[rn] += t; // writeback
827
828 if (BIT_SET(op, 20)) { // Load
829 if (BIT_SET(op, 22)) // Byte
830 ret = xread8(addr);
831 else
832 ret = xread32(addr);
833 regs[rd] = ret;
834 }
835 else {
836 if (BIT_SET(op, 22)) // Byte
837 xwrite8(addr, regs[rd]);
838 else
839 xwrite32(addr, regs[rd]);
840 }
841 }
842 else
843 goto unhandled;
844
845#if 0
846 if (addr != addr_check) {
847 fprintf(stderr, "bad calculated addr: %08x vs %08x\n", addr, addr_check);
848 abort();
849 }
850#endif
851 return;
852
853unhandled:
854 err("unhandled IO op %08x @ %08x\n", op, op_ctx->pc);
855 for (i = 0; i < 8-1; i++)
856 err(" r%d=%08x r%-2d=%08x\n", i, regs[i], i+8, regs[i+8]);
857 err(" r%d=%08x cpsr=%08x\n", i, regs[i], cpsr);
858 abort();
859}
860
861static u32 make_offset12(u32 *pc, u32 *target)
862{
863 int lp_offs, u = 1;
864
865 lp_offs = (char *)target - (char *)pc - 2*4;
866 if (lp_offs < 0) {
867 lp_offs = -lp_offs;
868 u = 0;
869 }
870 if (lp_offs >= LINKPAGE_SIZE) {
871 err("linkpage too far: %d\n", lp_offs);
872 abort();
873 }
874
875 return (u << 23) | lp_offs;
876}
877
878static u32 make_jmp(u32 *pc, u32 *target, int bl)
879{
880 int jmp_val;
881
882 jmp_val = target - pc - 2;
883 if (jmp_val < (int)0xff000000 || jmp_val > 0x00ffffff) {
884 err("jump out of range (%p -> %p)\n", pc, target);
885 abort();
886 }
887
888 return 0xea000000 | (bl << 24) | (jmp_val & 0x00ffffff);
889}
890
891static void emit_op(u32 op)
892{
893 *g_code_ptr++ = op;
894}
895
896static void emit_op_io(u32 op, u32 *target)
897{
898 op |= make_offset12(g_code_ptr, target);
899 emit_op(op);
900}
901
902static void init_linkpage(void)
903{
904 g_linkpage->handler = emu_call_handle_op;
905 g_code_ptr = g_linkpage->code;
906}
907
908static void segv_sigaction(int num, siginfo_t *info, void *ctx)
909{
910 struct ucontext *context = ctx;
911 u32 *regs = (u32 *)&context->uc_mcontext.arm_r0;
912 u32 *pc = (u32 *)regs[15];
913 struct op_context *op_ctx;
914 int i, lp_size;
915
916 if (((regs[15] ^ (u32)&segv_sigaction) & 0xff000000) == 0 || // PC is in our segment or
917 (((regs[15] ^ (u32)g_linkpage) & ~(LINKPAGE_ALLOC - 1)) == 0) || // .. in linkpage
918 ((long)info->si_addr & 0xffe00000) != 0x7f000000) // faulting not where expected
919 {
920 // real crash - time to die
921 err("segv %d %p @ %08x\n", info->si_code, info->si_addr, regs[15]);
922 for (i = 0; i < 8; i++)
923 dbg(" r%d=%08x r%-2d=%08x\n", i, regs[i], i+8, regs[i+8]);
924 signal(num, SIG_DFL);
925 raise(num);
926 return;
927 }
928 segvlog("segv %d %p @ %08x\n", info->si_code, info->si_addr, regs[15]);
929
930 // spit PC and op
931 op_ctx = (void *)g_code_ptr;
932 op_ctx->pc = (u32)pc;
933 op_ctx->op = *pc;
934 g_code_ptr = &op_ctx->code[0];
935
936 // emit jump to code ptr
937 *pc = make_jmp(pc, g_code_ptr, 0);
938
939 // generate code:
940 emit_op (0xe50d0000 + 0xf00 - 4 * 0); // str r0, [sp, #(-0xf00 + r0_offs)]
941 emit_op (0xe50de000 + 0xf00 - 4 * 14); // str lr, [sp, #(-0xf00 + lr_offs)]
942 emit_op (0xe24f0000 + (g_code_ptr - (u32 *)op_ctx + 2) * 4); // sub r0, pc, #op_ctx
943 emit_op (0xe1a0e00f); // mov lr, pc
944 emit_op_io(0xe51ff000, (u32 *)&g_linkpage->handler); // ldr pc, =handle_op
945 emit_op (0xe51de000 + 0xf00 - 4 * 14); // ldr lr, [sp, #(-0xf00 + lr_offs)]
946 emit_op (make_jmp(g_code_ptr, pc + 1, 0)); // jmp <back>
947
948 // sync caches
949 sys_cacheflush(pc, pc + 1);
950 sys_cacheflush(g_linkpage, g_code_ptr);
951
952 lp_size = (char *)g_code_ptr - (char *)g_linkpage;
953 segvlog("code #%d %d/%d\n", g_linkpage_count, lp_size, LINKPAGE_SIZE);
954
955 if (lp_size + 13*4 > LINKPAGE_SIZE) {
956 g_linkpage_count++;
957 if (g_linkpage_count >= LINKPAGE_COUNT) {
958 err("too many linkpages needed\n");
959 abort();
960 }
961 g_linkpage = (void *)((char *)g_linkpage + LINKPAGE_SIZE);
962 init_linkpage();
963 }
964 //handle_op(regs[15], op, regs, (u32)info->si_addr);
965 //regs[15] += 4;
966}
967
968void emu_init(void *map_bottom)
969{
970 sigaction_t segv_action = {
971 .sa_sigaction = segv_sigaction,
972 .sa_flags = SA_SIGINFO,
973 };
974 pthread_t tid;
975 void *pret;
976 int ret;
977
978#ifdef PND
979 if (geteuid() == 0) {
980 fprintf(stderr, "don't try to run as root, device registers or memory "
981 "might get trashed crashing the OS or even damaging the device.\n");
982 exit(1);
983 }
984#endif
985
986 g_linkpage = (void *)(((u32)map_bottom - LINKPAGE_ALLOC) & ~0xfff);
987 pret = mmap(g_linkpage, LINKPAGE_ALLOC, PROT_READ|PROT_WRITE,
988 MAP_PRIVATE|MAP_ANONYMOUS|MAP_FIXED, -1, 0);
989 if (pret != g_linkpage) {
990 perror(PFX "mmap linkpage");
991 exit(1);
992 }
993 log("linkpages @ %p\n", g_linkpage);
994 init_linkpage();
995
996 // host stuff
997 ret = host_init();
998 if (ret != 0) {
999 err("can't init host\n");
1000 exit(1);
1001 }
1002
1003 ret = host_video_init(NULL, 0);
1004 if (ret != 0) {
1005 err("can't init host video\n");
1006 exit(1);
1007 }
1008
1009 // TODO: check if this really fails on Wiz..
1010 mmsp2.umem = mmap(NULL, 0x2000000, PROT_READ|PROT_WRITE|PROT_EXEC,
1011 MAP_PRIVATE|MAP_ANONYMOUS, -1, 0);
1012#ifdef WIZ
1013 if (mmsp2.umem == MAP_FAILED) {
1014 // we are short on memmory on Wiz, need special handling
1015 extern void *host_mmap_upper(void);
1016 mmsp2.umem = host_mmap_upper();
1017 }
1018#endif
1019 if (mmsp2.umem == MAP_FAILED) {
1020 perror(PFX "mmap upper mem");
1021 exit(1);
1022 }
1023
1024 ret = pthread_create(&tid, NULL, fb_sync_thread, NULL);
1025 if (ret != 0) {
1026 err("failed to create fb_sync_thread: %d\n", ret);
1027 exit(1);
1028 }
1029 pthread_detach(tid);
1030
1031 // defaults
1032 mmsp2.mlc_stl_adr = 0x03101000; // fb2 is at 0x03381000
1033 mmsp2.mlc_stl_cntl = 0x4ab; // 16bpp, region 1 active
1034 mmsp2.v.width = 320;
1035 mmsp2.v.height = 240;
1036 mmsp2.v.stride = 320*2;
1037 mmsp2.v.bpp = 16;
1038 mmsp2.v.dirty_pal = 1;
1039
1040 sigemptyset(&segv_action.sa_mask);
1041 sigaction(SIGSEGV, &segv_action, NULL);
1042}
1043
1044int emu_read_gpiodev(void *buf, int count)
1045{
1046 if (count <= 0) {
1047 err("gpiodev read %d?\n", count);
1048 return -1;
1049 }
1050 if (count > 4)
1051 count = 4;
1052
1053 mmsp2.btn_state = host_read_btns();
1054 memcpy(buf, &mmsp2.btn_state, count);
1055 return count;
1056}
1057
1058static void *emu_mmap_dev(unsigned int length, int prot, int flags, unsigned int offset)
1059{
1060 u8 *umem, *umem_end;
1061
1062 // SoC regs
1063 if ((offset & ~0x1ffff) == 0xc0000000) {
1064 return mmap((void *)0x7f000000, length, PROT_NONE,
1065 MAP_PRIVATE|MAP_ANONYMOUS|MAP_FIXED|MAP_NORESERVE, -1, 0);
1066 }
1067 // MMSP2 blitter
1068 if ((offset & ~0xffff) == 0xe0020000) {
1069 return mmap((void *)0x7f100000, length, PROT_NONE,
1070 MAP_PRIVATE|MAP_ANONYMOUS|MAP_FIXED|MAP_NORESERVE, -1, 0);
1071 }
1072 // upper mem
1073 if ((offset & 0xfe000000) != 0x02000000) {
1074 err("unexpected devmem mmap @ %08x\n", offset);
1075 errno = EINVAL;
1076 return MAP_FAILED;
1077 }
1078
1079 umem = uppermem_lookup(offset, &umem_end);
1080 if (umem + length > umem_end)
1081 err("warning: uppermem @ %08x overflows by %d bytes\n",
1082 offset, umem + length - umem_end);
1083
1084 dbg("upper mem @ %08x %d\n", offset, length);
1085 return umem;
1086}
1087
1088void *emu_do_mmap(unsigned int length, int prot, int flags, int fd, unsigned int offset)
1089{
1090 if (fd == FAKEDEV_MEM)
1091 return emu_mmap_dev(length, prot, flags, offset);
1092
1093 if (fd == FAKEDEV_FB0)
1094 return emu_mmap_dev(length, prot, flags, offset + 0x03101000);
1095
1096 if (fd == FAKEDEV_FB1)
1097 return emu_mmap_dev(length, prot, flags, offset + 0x03381000);
1098
1099 err("bad/ni mmap(?, %d, %x, %x, %d, %08x)\n", length, prot, flags, fd, offset);
1100 errno = EINVAL;
1101 return MAP_FAILED;
1102}
1103
// open hook for /dev/dsp: on PND builds request a default of 16 fragments of 1K
static void emu_sound_open(int fd)
{
#ifdef PND
  // upper half: fragment count, lower half: log2 of the fragment size
  int frag = (16<<16) | 10; // 16K

  if (ioctl(fd, SNDCTL_DSP_SETFRAGMENT, &frag) != 0) {
    err("snd ioctl SETFRAGMENT %08x: ", frag);
    perror(NULL);
  }
#endif
}
1118
1119static int emu_sound_ioctl(int fd, int request, void *argp)
1120{
1121 int *arg = argp;
1122
1123#if 0
1124 dbg("snd ioctl(%d, %08x, %p)", fd, request, argp);
1125 if (arg != NULL)
1126 dbg_c(" [%d]", *arg);
1127 dbg_c("\n");
1128#endif
1129
1130 /* People set strange frag settings on GP2X, which even manage
1131 * to break audio on pandora (causes writes to fail).
1132 * Catch this and set to something that works. */
1133 switch(request) {
1134 case SNDCTL_DSP_SETFRAGMENT: {
1135 int ret, bsize, frag, frag_cnt;
1136 if (arg == NULL)
1137 break;
1138
1139 frag = *arg & 0xffff;
1140 frag_cnt = *arg >> 16;
1141 bsize = frag_cnt << frag;
1142 if (frag < 10 || bsize < 4096*4 || bsize > 4096*4*2) {
1143 /*
1144 * ~4ms. gpSP wants small buffers or else it stutters
1145 * because of it's audio thread sync stuff
1146 * XXX: hardcoding, as low samplerates will result in small fragment size,
1147 * which itself causes ALSA stall and hangs the program.
1148 * Also some apps change samplerate without reopening /dev/dsp,
1149 * which causes ALSA to reject SNDCTL_DSP_SETFRAGMENT.
1150 */
1151 bsize = 44100 / 250 * 4;
1152
1153 for (frag = 0; bsize; bsize >>= 1, frag++)
1154 ;
1155
1156 frag_cnt = 16;
1157 }
1158
1159 frag |= frag_cnt << 16;
1160 ret = ioctl(fd, SNDCTL_DSP_SETFRAGMENT, &frag);
1161 if (ret != 0) {
1162 err("snd ioctl SETFRAGMENT %08x: ", frag);
1163 perror(NULL);
1164 }
1165 // indicate success even if we fail (because of ALSA mostly),
1166 // things like MikMod will bail out otherwise.
1167 return 0;
1168 }
1169 case SNDCTL_DSP_SYNC:
1170 // Franxis tends to use sync/write loops, bad idea under ALSA
1171 return 0;
1172 default:
1173 break;
1174 }
1175
1176 return ioctl(fd, request, argp);
1177}
1178
1179int emu_do_ioctl(int fd, int request, void *argp)
1180{
1181 if (fd == emu_interesting_fds[IFD_SOUND].fd)
1182 return emu_sound_ioctl(fd, request, argp);
1183
1184 switch (fd) {
1185 /* *********************** */
1186 case FAKEDEV_FB0:
1187 case FAKEDEV_FB1:
1188 if (argp == NULL)
1189 goto fail;
1190
1191 switch (request) {
1192 case FBIOGET_FSCREENINFO: {
1193 struct fb_fix_screeninfo *fix = argp;
1194
1195 memset(fix, 0, sizeof(*fix));
1196 strcpy(fix->id, "mmsp2_RGB0");
1197 fix->type = FB_TYPE_PACKED_PIXELS;
1198 fix->accel = FB_ACCEL_NONE;
1199 fix->visual = FB_VISUAL_TRUECOLOR;
1200 fix->line_length = 320*2;
1201 fix->smem_start = (fd == FAKEDEV_FB0) ? 0x03101000 : 0x03381000;
1202 fix->smem_len = 320*240*2;
1203 return 0;
1204 }
1205 case FBIOGET_VSCREENINFO: {
1206 struct fb_var_screeninfo *var = argp;
1207 static const struct fb_bitfield fbb_red = { offset: 11, length: 5, };
1208 static const struct fb_bitfield fbb_green = { offset: 5, length: 6, };
1209 static const struct fb_bitfield fbb_blue = { offset: 0, length: 5, };
1210
1211 memset(var, 0, sizeof(*var));
1212 var->activate = FB_ACTIVATE_NOW;
1213 var->xres =
1214 var->xres_virtual = 320;
1215 var->yres =
1216 var->yres_virtual = 240;
1217 var->width =
1218 var->height = -1;
1219 var->vmode = FB_VMODE_NONINTERLACED;
1220 var->bits_per_pixel = 16;
1221 var->red = fbb_red;
1222 var->green = fbb_green;
1223 var->blue = fbb_blue;
1224 return 0;
1225 }
1226 case FBIOPUT_VSCREENINFO: {
1227 struct fb_var_screeninfo *var = argp;
1228 dbg(" put vscreen: %dx%d@%d\n", var->xres, var->yres, var->bits_per_pixel);
1229 if (var->xres != 320 || var->yres != 240 || var->bits_per_pixel != 16)
1230 return -1;
1231 return 0;
1232 }
1233 }
1234
1235 /* *********************** */
1236 case FAKEDEV_TTY0:
1237 // fake tty0 to make GPH SDL happy
1238 if (request == 0x4b46) // KDGKBENT
1239 return -1;
1240 return 0;
1241 }
1242
1243fail:
1244 err("bad/ni ioctl(%d, %08x, %p)\n", fd, request, argp);
1245 errno = EINVAL;
1246 return -1;
1247}
1248
/*
 * Real devices whose descriptors are tracked; emu_do_ioctl() compares
 * against the .fd of the IFD_SOUND entry. Each entry is initialized
 * with a device path, an fd of -1 and a hook (emu_sound_open for the
 * sound device). The table ends with a NULL-path entry.
 */
struct dev_fd_t emu_interesting_fds[] = {
  [IFD_SOUND] = { "/dev/dsp", -1, emu_sound_open },
  { NULL, 0, NULL },
};
1253
// path fragments that wrap_path() rewrites: every "from" becomes "to"
static const struct {
  const char *from;
  const char *to;
} path_map[] = {
  { .from = "/mnt/tmp", .to = "./tmp" },
};
1260
1261static const char *wrap_path(const char *path)
1262{
1263 char *buff, *p;
1264 size_t size;
1265 int i, len;
1266
1267 // do only path mapping for now
1268 for (i = 0; i < ARRAY_SIZE(path_map); i++) {
1269 p = strstr(path, path_map[i].from);
1270 if (p != NULL) {
1271 size = strlen(path) + strlen(path_map[i].to) + 1;
1272 buff = malloc(size);
1273 if (buff == NULL)
1274 break;
1275 len = p - path;
1276 strncpy(buff, path, len);
1277 snprintf(buff + len, size - len, "%s%s", path_map[i].to,
1278 path + len + strlen(path_map[i].from));
1279 dbg("mapped path \"%s\" -> \"%s\"\n", path, buff);
1280 return buff;
1281 }
1282 }
1283
1284 return path;
1285}
1286
// release a wrap_path() result; a no-op when it returned old_path itself
static void wrap_path_free(const char *w_path, const char *old_path)
{
  if (w_path == old_path)
    return;

  free((void *)w_path);
}
1292
// fopen() with the path run through wrap_path() first; returns the FILE pointer
void *emu_do_fopen(const char *path, const char *mode)
{
  const char *mapped = wrap_path(path);
  FILE *f = fopen(mapped, mode);

  wrap_path_free(mapped, path);
  return f;
}
1304
1305// FIXME: threads..
/*
 * system() replacement.
 * Commands that start with a relative path, or with an absolute path
 * outside /bin, /lib, /sbin and /usr, are assumed to be GP2X programs
 * and are started through ginge_prep; other commands run unchanged.
 * Paths are remapped by wrap_path(), and the fb thread is paused while
 * the command runs. Returns -1 for a NULL command, else system()'s
 * result. Uses a static buffer, so it is not thread safe.
 */
int emu_do_system(const char *command)
{
  static char tmp_path[512];
  int need_ginge = 0;
  const char *p2;
  char *p;
  int ret;

  if (command == NULL)
    return -1;

  // isspace() needs an unsigned char value
  for (p2 = command; *p2 && isspace((unsigned char)*p2); p2++)
    ;

  if (*p2 == '.') // relative path?
    need_ginge = 1;
  else if (*p2 == '/' && strncmp(p2, "/bin", 4) && strncmp(p2, "/lib", 4)
           && strncmp(p2, "/sbin", 5) && strncmp(p2, "/usr", 4))
    // absolute path, but not a system command
    need_ginge = 1;

  p2 = wrap_path(command);
  if (need_ginge) {
    make_local_path(tmp_path, sizeof(tmp_path), "ginge_prep");
    p = tmp_path + strlen(tmp_path);

    snprintf(p, sizeof(tmp_path) - (p - tmp_path), " --nomenu %s", p2);
  }
  else
    snprintf(tmp_path, sizeof(tmp_path), "%s", p2);
  wrap_path_free(p2, command);

  dbg("system: \"%s\"\n", tmp_path);

  // the app might want the screen too..
  fb_thread_pause();
  ret = system(tmp_path);
  fb_thread_resume();
  return ret;
}
1346
/*
 * execve() replacement: run the target through ginge_prep as
 *   ginge_prep --nomenu <filename> <argv[1]> ...
 * An attempt to exec the GP2X menu ends the process instead.
 * Only returns on failure, with -1 and errno set.
 */
int emu_do_execve(const char *filename, char *const argv[], char *const envp[])
{
  const char **new_argv;
  const char *w_path;
  char *prep_path;
  int i, ret, argc, saved_errno;

  if (filename == NULL)
    return -1;

  if (strstr(filename, "/gp2xmenu") != NULL)
    exit(0);

  // argv may be NULL or empty
  argc = 0;
  if (argv != NULL)
    while (argv[argc] != NULL)
      argc++;

  // 3 leading entries + the caller's arguments + terminating NULL;
  // calloc() provides the terminator
  new_argv = calloc(argc + 4, sizeof(new_argv[0]));
  prep_path = malloc(512);
  if (new_argv == NULL || prep_path == NULL) {
    free(new_argv);
    free(prep_path);
    errno = ENOMEM;
    return -1;
  }

  make_local_path(prep_path, 512, "ginge_prep");
  w_path = wrap_path(filename);
  new_argv[0] = prep_path;
  new_argv[1] = "--nomenu";
  new_argv[2] = w_path;

  // argv[0] is replaced by the three entries above
  for (i = 1; i < argc; i++)
    new_argv[i + 2] = argv[i];

  dbg("execve \"%s\" %s \"%s\"\n", new_argv[0], new_argv[1], new_argv[2]);
  ret = execve(new_argv[0], (char **)new_argv, envp);

  // only reached when execve() failed
  saved_errno = errno;
  perror("execve");
  wrap_path_free(w_path, filename);
  free(prep_path);
  free(new_argv);
  errno = saved_errno;
  return ret;
}
1385
1386// vim:shiftwidth=2:expandtab