11913091 |
1 | // vim:shiftwidth=2:expandtab |
2 | #include <stdio.h> |
3 | #include <stdlib.h> |
3d295a9f |
4 | #include <string.h> |
c1ffd5ba |
5 | #include <alloca.h> |
11913091 |
6 | #include <sys/types.h> |
7 | #include <sys/stat.h> |
8 | #include <fcntl.h> |
9 | #include <sys/mman.h> |
10 | #include <sys/types.h> |
11 | #include <unistd.h> |
12 | #include <signal.h> |
13 | #include <asm/ucontext.h> |
c1ffd5ba |
14 | #include <pthread.h> |
15 | #include <errno.h> |
16 | #include <time.h> |
17 | #include <sys/resource.h> |
7fd42181 |
18 | #include <sys/ioctl.h> |
19 | #include <linux/soundcard.h> |
20 | #include <linux/fb.h> |
11913091 |
21 | |
22 | #include "header.h" |
7fd42181 |
23 | #include "../common/host_fb.h" |
24 | #include "../common/cmn.h" |
86418a84 |
25 | #include "sys_cacheflush.h" |
7fd42181 |
26 | #include "realfuncs.h" |
11913091 |
27 | |
3d3fa63b |
28 | #if (DBG & 2) && !(DBG & 4) |
7fd42181 |
29 | #define LOG_IO_UNK |
30 | #endif |
3d3fa63b |
31 | #if (DBG & 4) |
7fd42181 |
32 | #define LOG_IO |
33 | #endif |
6720e4e4 |
34 | //#define LOG_SEGV |
35 | |
36 | #ifdef LOG_IO |
37 | #define iolog log_io |
38 | #else |
86418a84 |
39 | #define iolog(...) |
6720e4e4 |
40 | #endif |
41 | |
c1ffd5ba |
42 | #ifdef LOG_IO_UNK |
6720e4e4 |
43 | #define iolog_unh log_io |
44 | #else |
45 | #define iolog_unh(...) |
46 | #endif |
47 | |
48 | #ifdef LOG_SEGV |
49 | #define segvlog printf |
50 | #else |
0881206b |
51 | #define segvlog(...) |
6720e4e4 |
52 | #endif |
53 | |
c1ffd5ba |
54 | #if defined(LOG_IO) || defined(LOG_IO_UNK) |
6720e4e4 |
55 | #include "mmsp2-regs.h" |
56 | #endif |
11913091 |
57 | |
3d3fa63b |
58 | typedef unsigned long long u64; |
11913091 |
59 | typedef unsigned int u32; |
60 | typedef unsigned short u16; |
61 | typedef unsigned char u8; |
62 | |
c1ffd5ba |
63 | static pthread_mutex_t fb_mutex = PTHREAD_MUTEX_INITIALIZER; |
64 | static pthread_cond_t fb_cond = PTHREAD_COND_INITIALIZER; |
65 | |
3d295a9f |
66 | static struct { |
67 | u32 dstctrl; |
68 | u32 dstaddr; |
69 | u32 dststride; |
70 | u32 srcctrl; |
71 | u32 srcaddr; // |
72 | u32 srcstride; |
73 | u32 srcforcolor; |
74 | u32 srcbackcolor; |
75 | u32 patctrl; // |
76 | u32 patforcolor; |
77 | u32 patbackcolor; |
78 | u32 size; |
79 | u32 ctrl; // |
80 | u32 run; |
81 | u32 intc; |
82 | u32 srcfifo; |
83 | } blitter; |
84 | |
0881206b |
85 | #define SRCCTRL_INVIDEO (1 << 8) |
86 | #define SRCCTRL_SRCENB (1 << 7) |
87 | #define CTRL_TRANSPARENCYENB (1 << 11) |
88 | |
3d295a9f |
89 | static struct { |
6720e4e4 |
90 | u16 mlc_stl_cntl; |
3d295a9f |
91 | union { |
6720e4e4 |
92 | u32 mlc_stl_adr; |
3d295a9f |
93 | struct { |
6720e4e4 |
94 | u16 mlc_stl_adrl; |
95 | u16 mlc_stl_adrh; |
3d295a9f |
96 | }; |
97 | }; |
6720e4e4 |
98 | u16 mlc_stl_pallt_a; |
99 | union { |
100 | u16 mlc_stl_pallt_d[256*2]; |
101 | u32 mlc_stl_pallt_d32[256]; |
102 | }; |
103 | |
104 | // state |
3d3fa63b |
105 | void *umem; |
6720e4e4 |
106 | u16 host_pal[256]; |
107 | u32 old_mlc_stl_adr; |
108 | u32 btn_state; // as seen through /dev/GPIO |
dc90c02d |
109 | u32 dirty_pal:1; |
3d295a9f |
110 | } mmsp2; |
111 | |
112 | static u16 *host_screen; |
113 | static int host_stride; |
11913091 |
114 | |
115 | |
c1ffd5ba |
116 | #if defined(LOG_IO) || defined(LOG_IO_UNK) |
6720e4e4 |
117 | static void log_io(const char *pfx, u32 a, u32 d, int size) |
118 | { |
119 | const char *fmt, *reg = ""; |
120 | switch (size) { |
c1ffd5ba |
121 | case 8: fmt = "%s %08x %02x %s\n"; d &= 0xff; break; |
122 | case 32: fmt = "%s %08x %08x %s\n"; break; |
123 | default: fmt = "%s %08x %04x %s\n"; d &= 0xffff; break; |
6720e4e4 |
124 | } |
125 | |
126 | if ((a & ~0xffff) == 0x7f000000) |
127 | reg = regnames[a & 0xffff]; |
128 | |
129 | printf(fmt, pfx, a, d, reg); |
130 | } |
131 | #endif |
132 | |
0881206b |
133 | static void memset16(void *dst, u32 pattern, int count) |
134 | { |
135 | u32 *dl; |
136 | u16 *d; |
137 | |
138 | d = (u16 *)((long)dst & ~1); |
139 | if ((long)d & 2) { |
140 | *d++ = pattern; |
141 | count--; |
142 | } |
143 | dl = (void *)d; |
144 | pattern |= pattern << 16; |
145 | |
146 | while (count >= 2) { |
147 | *dl++ = pattern; |
148 | count -= 2; |
149 | } |
150 | if (count) |
151 | *(u16 *)dl = pattern; |
152 | } |
153 | |
154 | static void blt_tr(void *dst, void *src, u32 trc, int w) |
155 | { |
156 | u16 *d = (u16 *)((long)dst & ~1); |
157 | u16 *s = (u16 *)((long)src & ~1); |
158 | |
159 | // XXX: optimize |
160 | for (; w > 0; d++, s++, w--) |
161 | if (*s != trc) |
162 | *d = *s; |
163 | } |
164 | |
165 | #define dump_blitter() \ |
166 | { \ |
167 | u32 *r = &blitter.dstctrl; \ |
168 | int i; \ |
169 | for (i = 0; i < 4*4; i++, r++) { \ |
170 | printf("%08x ", *r); \ |
171 | if ((i & 3) == 3) \ |
172 | printf("\n"); \ |
173 | } \ |
174 | } |
175 | |
6720e4e4 |
176 | static void *uppermem_lookup(u32 addr, u8 **mem_end) |
11913091 |
177 | { |
3d3fa63b |
178 | // XXX: maybe support mirroring? |
179 | if ((addr & 0xfe000000) != 0x02000000) |
180 | return NULL; |
3d295a9f |
181 | |
3d3fa63b |
182 | *mem_end = (u8 *)mmsp2.umem + 0x02000000; |
183 | return (u8 *)mmsp2.umem - 0x02000000 + addr; |
11913091 |
184 | } |
185 | |
3d295a9f |
186 | static void blitter_do(void) |
11913091 |
187 | { |
0881206b |
188 | u8 *dst, *dste, *src = NULL, *srce = NULL; |
3d295a9f |
189 | int w, h, sstrd, dstrd; |
6720e4e4 |
190 | int to_screen = 0; |
dc90c02d |
191 | u32 bpp, addr; |
3d295a9f |
192 | |
193 | w = blitter.size & 0x7ff; |
194 | h = (blitter.size >> 16) & 0x7ff; |
195 | sstrd = blitter.srcstride; |
196 | dstrd = blitter.dststride; |
197 | |
0881206b |
198 | // XXX: need to confirm this.. |
199 | addr = (blitter.dstaddr & ~3) | ((blitter.dstctrl & 0x1f) >> 3); |
c1ffd5ba |
200 | |
dc90c02d |
201 | // use dst bpp.. How does it do blits with different src bpp? |
202 | bpp = (blitter.dstctrl & 0x20) ? 16 : 8; |
203 | |
c1ffd5ba |
204 | // maybe the screen? |
dc90c02d |
205 | if (((w == 320 && h == 240) || // blit whole screen |
206 | (w * h >= 320*240/2)) && // ..or at least half of the area |
207 | mmsp2.mlc_stl_adr <= addr && addr < mmsp2.mlc_stl_adr + 320*240*2) |
c1ffd5ba |
208 | to_screen = 1; |
209 | |
210 | dst = uppermem_lookup(addr, &dste); |
0881206b |
211 | |
212 | // XXX: assume fill if no SRCENB, but it could be pattern blit.. |
213 | if (blitter.srcctrl & SRCCTRL_SRCENB) { |
214 | if (!(blitter.srcctrl & SRCCTRL_INVIDEO)) |
215 | goto bad_blit; |
216 | |
217 | addr = (blitter.srcaddr & ~3) | ((blitter.srcctrl & 0x1f) >> 3); |
c1ffd5ba |
218 | src = uppermem_lookup(addr, &srce); |
0881206b |
219 | if (src == NULL) |
220 | goto bad_blit; |
221 | |
222 | if (src + sstrd * h > srce) { |
6720e4e4 |
223 | err("blit %08x->%08x %dx%d did not fit src\n", |
0881206b |
224 | blitter.srcaddr, blitter.dstaddr, w, h); |
225 | h = (srce - src) / sstrd; |
226 | } |
3d295a9f |
227 | } |
228 | |
dc90c02d |
229 | if (dst == NULL) |
230 | goto bad_blit; |
231 | |
3d295a9f |
232 | if (dst + dstrd * h > dste) { |
6720e4e4 |
233 | err("blit %08x->%08x %dx%d did not fit dst\n", |
3d295a9f |
234 | blitter.srcaddr, blitter.dstaddr, w, h); |
235 | h = (dste - dst) / dstrd; |
236 | } |
237 | |
0881206b |
238 | if (src != NULL) { |
239 | // copy |
dc90c02d |
240 | if (bpp == 16 && (blitter.ctrl & CTRL_TRANSPARENCYENB)) { |
0881206b |
241 | u32 trc = blitter.ctrl >> 16; |
242 | for (; h > 0; h--, dst += dstrd, src += sstrd) |
243 | blt_tr(dst, src, trc, w); |
244 | } |
245 | else { |
246 | for (; h > 0; h--, dst += dstrd, src += sstrd) |
dc90c02d |
247 | memcpy(dst, src, w * bpp / 8); |
0881206b |
248 | } |
3d295a9f |
249 | } |
0881206b |
250 | else { |
251 | // fill. Assume the pattern is cleared and bg color is used |
252 | u32 bgc = blitter.patbackcolor & 0xffff; |
dc90c02d |
253 | if (bpp == 16) { |
254 | for (; h > 0; h--, dst += dstrd) |
255 | memset16(dst, bgc, w); |
256 | } |
257 | else { |
258 | for (; h > 0; h--, dst += dstrd) |
259 | memset(dst, bgc, w); // bgc? |
260 | } |
0881206b |
261 | } |
6720e4e4 |
262 | |
263 | if (to_screen) |
c1ffd5ba |
264 | pthread_cond_signal(&fb_cond); |
0881206b |
265 | return; |
3d295a9f |
266 | |
0881206b |
267 | bad_blit: |
6720e4e4 |
268 | err("blit %08x->%08x %dx%d translated to %p->%p\n", |
0881206b |
269 | blitter.srcaddr, blitter.dstaddr, w, h, src, dst); |
270 | dump_blitter(); |
3d295a9f |
271 | } |
272 | |
6720e4e4 |
273 | // TODO: hw scaler stuff |
c1ffd5ba |
274 | static void mlc_flip(u8 *src, int bpp) |
6720e4e4 |
275 | { |
6720e4e4 |
276 | u16 *dst = host_screen; |
277 | u16 *hpal = mmsp2.host_pal; |
6720e4e4 |
278 | int i, u; |
279 | |
6720e4e4 |
280 | if (bpp <= 8 && mmsp2.dirty_pal) { |
281 | u32 *srcp = mmsp2.mlc_stl_pallt_d32; |
282 | u16 *dstp = hpal; |
283 | |
284 | for (i = 0; i < 256; i++, srcp++, dstp++) { |
285 | u32 t = *srcp; |
286 | *dstp = ((t >> 8) & 0xf800) | ((t >> 5) & 0x07e0) | ((t >> 3) & 0x001f); |
287 | } |
288 | mmsp2.dirty_pal = 0; |
289 | } |
290 | |
291 | switch (bpp) { |
292 | case 4: |
293 | for (i = 0; i < 240; i++, dst += host_stride / 2 - 320) { |
294 | for (u = 320 / 2; u > 0; u--, src++) { |
295 | *dst++ = hpal[*src >> 4]; |
296 | *dst++ = hpal[*src & 0x0f]; |
297 | } |
298 | } |
299 | break; |
300 | |
301 | case 8: |
302 | for (i = 0; i < 240; i++, dst += host_stride / 2 - 320) { |
303 | for (u = 320 / 4; u > 0; u--) { |
304 | *dst++ = hpal[*src++]; |
305 | *dst++ = hpal[*src++]; |
306 | *dst++ = hpal[*src++]; |
307 | *dst++ = hpal[*src++]; |
308 | } |
309 | } |
310 | break; |
311 | |
312 | case 16: |
313 | for (i = 0; i < 240; i++, dst += host_stride / 2, src += 320*2) |
314 | memcpy(dst, src, 320*2); |
315 | break; |
316 | |
317 | case 24: |
318 | // TODO |
319 | break; |
320 | } |
321 | |
322 | host_screen = host_video_flip(); |
323 | } |
324 | |
c1ffd5ba |
325 | #define ts_add_nsec(ts, ns) { \ |
326 | ts.tv_nsec += ns; \ |
327 | if (ts.tv_nsec >= 1000000000) { \ |
328 | ts.tv_sec++; \ |
329 | ts.tv_nsec -= 1000000000; \ |
330 | } \ |
331 | } |
332 | |
333 | static void *fb_sync_thread(void *arg) |
334 | { |
335 | int invalid_fb_addr = 1; |
336 | int manual_refresh = 0; |
337 | struct timespec ts; |
338 | int ret, wait_ret; |
339 | |
340 | //ret = pthread_setschedprio(pthread_self(), -1); |
341 | //log("pthread_setschedprio %d\n", ret); |
342 | //ret = setpriority(PRIO_PROCESS, 0, -1); |
343 | //log("setpriority %d\n", ret); |
344 | |
345 | ret = clock_gettime(CLOCK_REALTIME, &ts); |
346 | if (ret != 0) { |
347 | perror(PFX "clock_gettime"); |
348 | exit(1); |
349 | } |
350 | |
351 | while (1) { |
352 | u8 *gp2x_fb, *gp2x_fb_end; |
353 | int mode, bpp; |
354 | |
355 | ret = pthread_mutex_lock(&fb_mutex); |
356 | wait_ret = pthread_cond_timedwait(&fb_cond, &fb_mutex, &ts); |
357 | ret |= pthread_mutex_unlock(&fb_mutex); |
dc90c02d |
358 | |
c1ffd5ba |
359 | if (ret != 0) { |
360 | err("fb_thread: mutex error: %d\n", ret); |
361 | sleep(1); |
362 | continue; |
363 | } |
364 | if (wait_ret != 0 && wait_ret != ETIMEDOUT) { |
365 | err("fb_thread: cond error: %d\n", wait_ret); |
366 | sleep(1); |
367 | continue; |
368 | } |
369 | |
370 | if (wait_ret != ETIMEDOUT) { |
371 | clock_gettime(CLOCK_REALTIME, &ts); |
372 | ts_add_nsec(ts, 50000000); |
373 | manual_refresh++; |
374 | if (manual_refresh == 2) |
375 | log("fb_thread: switch to manual refresh\n"); |
376 | } else { |
377 | ts_add_nsec(ts, 16666667); |
378 | if (manual_refresh > 1) |
379 | log("fb_thread: switch to auto refresh\n"); |
380 | manual_refresh = 0; |
381 | } |
382 | |
383 | mode = (mmsp2.mlc_stl_cntl >> 9) & 3; |
384 | bpp = mode ? mode * 8 : 4; |
385 | |
386 | gp2x_fb = uppermem_lookup(mmsp2.mlc_stl_adr, &gp2x_fb_end); |
387 | if (gp2x_fb == NULL || gp2x_fb + 320*240 * bpp / 8 > gp2x_fb_end) { |
388 | if (!invalid_fb_addr) { |
389 | err("fb_thread: %08x is out of range\n", mmsp2.mlc_stl_adr); |
390 | invalid_fb_addr = 1; |
391 | } |
392 | continue; |
393 | } |
394 | |
395 | mlc_flip(gp2x_fb, bpp); |
396 | } |
397 | } |
398 | |
3d295a9f |
399 | static u32 xread8(u32 a) |
400 | { |
6720e4e4 |
401 | iolog("r8 ", a, 0, 8); |
402 | iolog_unh("r8 ", a, 0, 8); |
3d295a9f |
403 | return 0; |
11913091 |
404 | } |
405 | |
406 | static u32 xread16(u32 a) |
407 | { |
6720e4e4 |
408 | static u32 fudge, old_a; |
409 | u32 d = 0, t; |
410 | |
411 | if ((a & 0xffff0000) == 0x7f000000) { |
412 | u32 a_ = a & 0xffff; |
413 | switch (a_) { |
414 | case 0x0910: // FPLL |
415 | case 0x0912: |
416 | d = 0x9407; |
417 | break; |
418 | // minilib reads as: |
419 | // 0000 P000 VuVd00 0000 YXBA RLSeSt 0R0D 0L0U |
420 | // | GPIOD |GPIOC[8:15]|GPIOM[0:7]| |
421 | // /dev/GPIO: |
422 | // ... 0PVdVu ... |
423 | case 0x1184: // GPIOC |
424 | d = ~mmsp2.btn_state & 0xff00; |
425 | d |= 0x00ff; |
426 | break; |
427 | case 0x1186: // GPIOD |
428 | t = ~mmsp2.btn_state; |
429 | d = (t >> 9) & 0x0080; |
430 | d |= (t >> 11) & 0x0040; |
431 | d |= (t >> 7) & 0x0800; |
432 | d |= 0x373b; |
433 | break; |
434 | case 0x1198: // GPIOM |
435 | mmsp2.btn_state = host_read_btns(); |
436 | d = ~mmsp2.btn_state & 0xff; |
437 | d |= 0x01aa; |
438 | break; |
c1ffd5ba |
439 | case 0x1836: // reserved |
440 | d = 0x2330; |
441 | break; |
442 | case 0x2816: // DPC_X_MAX |
443 | d = 319; |
444 | break; |
445 | case 0x2818: // DPC_Y_MAX |
446 | d = 239; |
447 | break; |
6720e4e4 |
448 | case 0x28da: |
449 | d = mmsp2.mlc_stl_cntl; |
450 | break; |
c1ffd5ba |
451 | case 0x290e: |
452 | case 0x2912: |
453 | d = mmsp2.mlc_stl_adrl; |
454 | break; |
455 | case 0x2910: |
456 | case 0x2914: |
457 | d = mmsp2.mlc_stl_adrh; |
458 | break; |
6720e4e4 |
459 | case 0x2958: |
460 | d = mmsp2.mlc_stl_pallt_a; |
461 | break; |
462 | default: |
463 | goto unh; |
464 | } |
465 | goto out; |
466 | } |
467 | |
468 | unh: |
469 | if (a == old_a) { |
470 | d = fudge; |
471 | fudge = ~fudge; |
472 | } |
473 | old_a = a; |
474 | iolog_unh("r16", a, d & 0xffff, 16); |
475 | |
476 | out: |
477 | d &= 0xffff; |
478 | iolog("r16", a, d, 16); |
479 | return d; |
11913091 |
480 | } |
481 | |
482 | static u32 xread32(u32 a) |
483 | { |
3d295a9f |
484 | u32 d = 0; |
dc90c02d |
485 | if ((a & 0xfff00000) == 0x7f000000) { |
486 | u32 a_ = a & 0xffff; |
3d3fa63b |
487 | struct timespec ts; |
488 | u64 t64; |
489 | |
dc90c02d |
490 | switch (a_) { |
491 | case 0x0a00: // TCOUNT, 1/7372800s |
3d3fa63b |
492 | clock_gettime(CLOCK_REALTIME, &ts); |
493 | t64 = (u64)ts.tv_sec * 1000000000 + ts.tv_nsec; |
494 | // t * 7372800.0 / 1000000000 * 0x100000000 ~= t * 31665935 |
495 | t64 *= 31665935; |
496 | d = t64 >> 32; |
dc90c02d |
497 | break; |
498 | } |
499 | } |
3d295a9f |
500 | if ((a & 0xfff00000) == 0x7f100000) { |
501 | u32 *bl = &blitter.dstctrl; |
6720e4e4 |
502 | u32 a_ = a & 0xfff; |
503 | if (a_ < 0x40) { |
504 | d = bl[a_ / 4]; |
505 | if (a_ == 0x34) |
506 | d = 0; // not busy |
507 | goto out; |
508 | } |
3d295a9f |
509 | } |
6720e4e4 |
510 | iolog_unh("r32", a, d, 32); |
511 | |
512 | out: |
513 | iolog("r32", a, d, 32); |
3d295a9f |
514 | return d; |
11913091 |
515 | } |
516 | |
517 | static void xwrite8(u32 a, u32 d) |
518 | { |
6720e4e4 |
519 | iolog("w8 ", a, d, 8); |
520 | iolog_unh("w8 ", a, d, 8); |
11913091 |
521 | } |
522 | |
523 | static void xwrite16(u32 a, u32 d) |
524 | { |
6720e4e4 |
525 | iolog("w16", a, d, 16); |
3d295a9f |
526 | if ((a & 0xfff00000) == 0x7f000000) { |
6720e4e4 |
527 | u32 a_ = a & 0xffff; |
528 | switch (a_) { |
529 | case 0x28da: |
530 | mmsp2.mlc_stl_cntl = d | 0xaa; |
531 | break; |
532 | case 0x290e: |
533 | case 0x2910: |
534 | // odd addresses don't affect LCD. What about TV? |
535 | return; |
536 | case 0x2912: |
537 | mmsp2.mlc_stl_adrl = d; |
538 | return; |
539 | case 0x2914: |
540 | mmsp2.mlc_stl_adrh = d; |
541 | if (mmsp2.mlc_stl_adr != mmsp2.old_mlc_stl_adr) |
c1ffd5ba |
542 | // ask for refresh |
543 | pthread_cond_signal(&fb_cond); |
6720e4e4 |
544 | mmsp2.old_mlc_stl_adr = mmsp2.mlc_stl_adr; |
545 | return; |
546 | case 0x2958: |
547 | mmsp2.mlc_stl_pallt_a = d & 0x1ff; |
548 | return; |
549 | case 0x295a: |
550 | mmsp2.mlc_stl_pallt_d[mmsp2.mlc_stl_pallt_a++] = d; |
551 | mmsp2.mlc_stl_pallt_a &= 0x1ff; |
552 | mmsp2.dirty_pal = 1; |
553 | return; |
3d295a9f |
554 | } |
3d295a9f |
555 | } |
6720e4e4 |
556 | iolog_unh("w16", a, d, 16); |
11913091 |
557 | } |
558 | |
559 | static void xwrite32(u32 a, u32 d) |
560 | { |
6720e4e4 |
561 | iolog("w32", a, d, 32); |
562 | |
3d295a9f |
563 | if ((a & 0xfff00000) == 0x7f100000) { |
564 | u32 *bl = &blitter.dstctrl; |
6720e4e4 |
565 | u32 a_ = a & 0xfff; |
566 | if (a_ < 0x40) { |
567 | bl[a_ / 4] = d; |
568 | if (a_ == 0x34 && (d & 1)) |
569 | blitter_do(); |
570 | return; |
571 | } |
3d295a9f |
572 | } |
6720e4e4 |
573 | iolog_unh("w32", a, d, 32); |
11913091 |
574 | } |
575 | |
6720e4e4 |
576 | #define LINKPAGE_SIZE 0x1000 |
577 | #define LINKPAGE_COUNT 4 |
578 | #define LINKPAGE_ALLOC (LINKPAGE_SIZE * LINKPAGE_COUNT) |
579 | |
580 | struct op_context { |
581 | u32 pc; |
582 | u32 op; |
583 | u32 code[0]; |
584 | }; |
585 | |
3d3fa63b |
586 | struct op_linkpage { |
6720e4e4 |
587 | void (*handler)(struct op_context *op_ctx); |
588 | u32 code[0]; |
589 | }; |
590 | |
3d3fa63b |
591 | struct op_stackframe { |
592 | u32 saved_regs[15]; |
593 | u32 cpsr; |
594 | }; |
595 | |
596 | static struct op_linkpage *g_linkpage; |
6720e4e4 |
597 | static u32 *g_code_ptr; |
598 | static int g_linkpage_count; |
599 | |
11913091 |
600 | #define BIT_SET(v, b) (v & (1 << (b))) |
601 | |
3d3fa63b |
602 | void emu_handle_op(struct op_context *op_ctx, struct op_stackframe *sframe) |
11913091 |
603 | { |
3d3fa63b |
604 | u32 *regs = sframe->saved_regs; |
6720e4e4 |
605 | u32 op = op_ctx->op; |
11913091 |
606 | u32 t, shift, ret, addr; |
607 | int rn, rd; |
608 | |
609 | rd = (op & 0x0000f000) >> 12; |
610 | rn = (op & 0x000f0000) >> 16; |
611 | |
612 | if ((op & 0x0f200090) == 0x01000090) { // AM3: LDRH, STRH |
86418a84 |
613 | if (!BIT_SET(op, 5)) // !H |
614 | goto unhandled; |
615 | if (BIT_SET(op, 6) && !BIT_SET(op, 20)) // S && !L |
11913091 |
616 | goto unhandled; |
617 | |
618 | if (BIT_SET(op, 22)) // imm offset |
619 | t = ((op & 0xf00) >> 4) | (op & 0x0f); |
620 | else // reg offset |
621 | t = regs[op & 0x000f]; |
622 | |
623 | if (!BIT_SET(op, 23)) |
624 | t = -t; |
625 | addr = regs[rn] + t; |
626 | |
627 | if (BIT_SET(op, 20)) { // Load |
628 | ret = xread16(addr); |
86418a84 |
629 | if (BIT_SET(op, 6)) { // S |
630 | ret <<= 16; |
631 | ret = (signed int)ret >> 16; |
632 | } |
11913091 |
633 | regs[rd] = ret; |
634 | } |
635 | else |
636 | xwrite16(addr, regs[rd]); |
637 | } |
638 | else if ((op & 0x0d200000) == 0x05000000) { // AM2: LDR[B], STR[B] |
639 | if (BIT_SET(op, 25)) { // reg offs |
640 | if (BIT_SET(op, 4)) |
641 | goto unhandled; |
642 | |
643 | t = regs[op & 0x000f]; |
644 | shift = (op & 0x0f80) >> 7; |
645 | switch ((op & 0x0060) >> 5) { |
646 | case 0: t = t << shift; break; |
647 | case 1: t = t >> (shift + 1); break; |
648 | case 2: t = (signed int)t >> (shift + 1); break; |
649 | case 3: goto unhandled; // I'm just lazy |
650 | } |
651 | } |
652 | else // imm offs |
653 | t = op & 0x0fff; |
654 | |
655 | if (!BIT_SET(op, 23)) |
656 | t = -t; |
657 | addr = regs[rn] + t; |
658 | |
659 | if (BIT_SET(op, 20)) { // Load |
660 | if (BIT_SET(op, 22)) // Byte |
661 | ret = xread8(addr); |
662 | else |
663 | ret = xread32(addr); |
664 | regs[rd] = ret; |
665 | } |
666 | else { |
667 | if (BIT_SET(op, 22)) // Byte |
668 | xwrite8(addr, regs[rd]); |
669 | else |
670 | xwrite32(addr, regs[rd]); |
671 | } |
672 | } |
673 | else |
674 | goto unhandled; |
675 | |
86418a84 |
676 | #if 0 |
11913091 |
677 | if (addr != addr_check) { |
678 | fprintf(stderr, "bad calculated addr: %08x vs %08x\n", addr, addr_check); |
679 | abort(); |
680 | } |
86418a84 |
681 | #endif |
11913091 |
682 | return; |
683 | |
684 | unhandled: |
6720e4e4 |
685 | err("unhandled IO op %08x @ %08x\n", op, op_ctx->pc); |
86418a84 |
686 | } |
687 | |
688 | static u32 make_offset12(u32 *pc, u32 *target) |
689 | { |
690 | int lp_offs, u = 1; |
691 | |
692 | lp_offs = (char *)target - (char *)pc - 2*4; |
693 | if (lp_offs < 0) { |
694 | lp_offs = -lp_offs; |
695 | u = 0; |
696 | } |
697 | if (lp_offs >= LINKPAGE_SIZE) { |
6720e4e4 |
698 | err("linkpage too far: %d\n", lp_offs); |
86418a84 |
699 | abort(); |
700 | } |
701 | |
702 | return (u << 23) | lp_offs; |
703 | } |
704 | |
6720e4e4 |
705 | static u32 make_jmp(u32 *pc, u32 *target, int bl) |
86418a84 |
706 | { |
707 | int jmp_val; |
708 | |
709 | jmp_val = target - pc - 2; |
710 | if (jmp_val < (int)0xff000000 || jmp_val > 0x00ffffff) { |
6720e4e4 |
711 | err("jump out of range (%p -> %p)\n", pc, target); |
86418a84 |
712 | abort(); |
713 | } |
714 | |
6720e4e4 |
715 | return 0xea000000 | (bl << 24) | (jmp_val & 0x00ffffff); |
86418a84 |
716 | } |
717 | |
718 | static void emit_op(u32 op) |
719 | { |
720 | *g_code_ptr++ = op; |
721 | } |
722 | |
723 | static void emit_op_io(u32 op, u32 *target) |
724 | { |
725 | op |= make_offset12(g_code_ptr, target); |
726 | emit_op(op); |
727 | } |
728 | |
6720e4e4 |
729 | static void init_linkpage(void) |
730 | { |
3d3fa63b |
731 | g_linkpage->handler = emu_call_handle_op; |
6720e4e4 |
732 | g_code_ptr = g_linkpage->code; |
6720e4e4 |
733 | } |
734 | |
86418a84 |
735 | static void segv_sigaction(int num, siginfo_t *info, void *ctx) |
736 | { |
737 | struct ucontext *context = ctx; |
738 | u32 *regs = (u32 *)&context->uc_mcontext.arm_r0; |
739 | u32 *pc = (u32 *)regs[15]; |
6720e4e4 |
740 | struct op_context *op_ctx; |
7fd42181 |
741 | int i, lp_size; |
86418a84 |
742 | |
6720e4e4 |
743 | if (((regs[15] ^ (u32)&segv_sigaction) & 0xff000000) == 0 || // PC is in our segment or |
744 | (((regs[15] ^ (u32)g_linkpage) & ~(LINKPAGE_ALLOC - 1)) == 0) || // .. in linkpage |
745 | ((long)info->si_addr & 0xffe00000) != 0x7f000000) // faulting not where expected |
86418a84 |
746 | { |
747 | // real crash - time to die |
6720e4e4 |
748 | err("segv %d %p @ %08x\n", info->si_code, info->si_addr, regs[15]); |
7fd42181 |
749 | for (i = 0; i < 8; i++) |
750 | err(" r%d=%08x r%2d=%08x\n", i, regs[i], i+8, regs[i+8]); |
86418a84 |
751 | signal(num, SIG_DFL); |
752 | raise(num); |
c1ffd5ba |
753 | return; |
86418a84 |
754 | } |
0881206b |
755 | segvlog("segv %d %p @ %08x\n", info->si_code, info->si_addr, regs[15]); |
86418a84 |
756 | |
757 | // spit PC and op |
6720e4e4 |
758 | op_ctx = (void *)g_code_ptr; |
759 | op_ctx->pc = (u32)pc; |
760 | op_ctx->op = *pc; |
761 | g_code_ptr = &op_ctx->code[0]; |
86418a84 |
762 | |
763 | // emit jump to code ptr |
6720e4e4 |
764 | *pc = make_jmp(pc, g_code_ptr, 0); |
86418a84 |
765 | |
766 | // generate code: |
3d3fa63b |
767 | emit_op (0xe50d0000 + 0xf00 - 4 * 0); // str r0, [sp, #(-0xf00 + r0_offs)] |
768 | emit_op (0xe50de000 + 0xf00 - 4 * 14); // str lr, [sp, #(-0xf00 + lr_offs)] |
6720e4e4 |
769 | emit_op (0xe24f0000 + (g_code_ptr - (u32 *)op_ctx + 2) * 4); // sub r0, pc, #op_ctx |
3d3fa63b |
770 | emit_op (0xe1a0e00f); // mov lr, pc |
771 | emit_op_io(0xe51ff000, (u32 *)&g_linkpage->handler); // ldr pc, =handle_op |
772 | emit_op (0xe51de000 + 0xf00 - 4 * 14); // ldr lr, [sp, #(-0xf00 + lr_offs)] |
6720e4e4 |
773 | emit_op (make_jmp(g_code_ptr, pc + 1, 0)); // jmp <back> |
86418a84 |
774 | |
775 | // sync caches |
776 | sys_cacheflush(pc, pc + 1); |
777 | sys_cacheflush(g_linkpage, g_code_ptr); |
778 | |
779 | lp_size = (char *)g_code_ptr - (char *)g_linkpage; |
0881206b |
780 | segvlog("code #%d %d/%d\n", g_linkpage_count, lp_size, LINKPAGE_SIZE); |
86418a84 |
781 | |
782 | if (lp_size + 13*4 > LINKPAGE_SIZE) { |
783 | g_linkpage_count++; |
784 | if (g_linkpage_count >= LINKPAGE_COUNT) { |
6720e4e4 |
785 | err("too many linkpages needed\n"); |
86418a84 |
786 | abort(); |
787 | } |
788 | g_linkpage = (void *)((char *)g_linkpage + LINKPAGE_SIZE); |
789 | init_linkpage(); |
790 | } |
791 | //handle_op(regs[15], op, regs, (u32)info->si_addr); |
792 | //regs[15] += 4; |
793 | } |
11913091 |
794 | |
795 | void emu_init(void *map_bottom) |
796 | { |
7fd42181 |
797 | sigaction_t segv_action = { |
11913091 |
798 | .sa_sigaction = segv_sigaction, |
799 | .sa_flags = SA_SIGINFO, |
800 | }; |
c1ffd5ba |
801 | pthread_t tid; |
6720e4e4 |
802 | void *pret; |
803 | int ret; |
11913091 |
804 | |
86418a84 |
805 | g_linkpage = (void *)(((u32)map_bottom - LINKPAGE_ALLOC) & ~0xfff); |
7fd42181 |
806 | pret = mmap(g_linkpage, LINKPAGE_ALLOC, PROT_READ|PROT_WRITE, |
807 | MAP_PRIVATE|MAP_ANONYMOUS, -1, 0); |
6720e4e4 |
808 | if (pret != g_linkpage) { |
809 | perror(PFX "mmap linkpage"); |
11913091 |
810 | exit(1); |
811 | } |
c1ffd5ba |
812 | log("linkpages @ %p\n", g_linkpage); |
86418a84 |
813 | init_linkpage(); |
11913091 |
814 | |
3d3fa63b |
815 | mmsp2.umem = mmap(NULL, 0x2000000, PROT_READ|PROT_WRITE|PROT_EXEC, |
816 | MAP_PRIVATE|MAP_ANONYMOUS, -1, 0); |
817 | if (mmsp2.umem == MAP_FAILED) { |
818 | perror(PFX "mmap upper mem"); |
819 | exit(1); |
820 | } |
821 | |
3d295a9f |
822 | // host stuff |
2ce69bdf |
823 | ret = host_video_init(&host_stride, 0); |
824 | if (ret != 0) { |
7fd42181 |
825 | err("can't init video\n"); |
3d295a9f |
826 | exit(1); |
827 | } |
2ce69bdf |
828 | host_screen = host_video_flip(); |
c1ffd5ba |
829 | |
830 | ret = pthread_create(&tid, NULL, fb_sync_thread, NULL); |
831 | if (ret != 0) { |
832 | err("failed to create fb_sync_thread: %d\n", ret); |
833 | exit(1); |
834 | } |
835 | pthread_detach(tid); |
836 | |
837 | // mmsp2 defaults |
838 | mmsp2.mlc_stl_adr = 0x03101000; // fb2 is at 0x03381000 |
7fd42181 |
839 | mmsp2.mlc_stl_cntl = 0x4ab; // 16bpp, region 1 active |
c1ffd5ba |
840 | |
841 | sigemptyset(&segv_action.sa_mask); |
842 | sigaction(SIGSEGV, &segv_action, NULL); |
3d295a9f |
843 | } |
844 | |
845 | int emu_read_gpiodev(void *buf, int count) |
846 | { |
847 | unsigned int btns; |
848 | |
849 | if (count < 4) { |
6720e4e4 |
850 | err("gpiodev read %d?\n", count); |
3d295a9f |
851 | return -1; |
852 | } |
853 | |
854 | btns = host_read_btns(); |
855 | memcpy(buf, &btns, 4); |
856 | return 4; |
11913091 |
857 | } |
858 | |
dc90c02d |
859 | struct dev_fd_t emu_interesting_fds[] = { |
860 | [IFD_SOUND] = { "/dev/dsp", -1 }, |
861 | { NULL, 0 }, |
862 | }; |
863 | |
864 | static void *emu_mmap_dev(unsigned int length, int prot, int flags, unsigned int offset) |
11913091 |
865 | { |
3d3fa63b |
866 | u8 *umem, *umem_end; |
11913091 |
867 | |
3d295a9f |
868 | // SoC regs |
11913091 |
869 | if ((offset & ~0xffff) == 0xc0000000) { |
870 | return mmap((void *)0x7f000000, length, PROT_NONE, |
871 | MAP_PRIVATE|MAP_ANONYMOUS|MAP_FIXED|MAP_NORESERVE, -1, 0); |
872 | } |
3d295a9f |
873 | // blitter |
11913091 |
874 | if ((offset & ~0xffff) == 0xe0020000) { |
875 | return mmap((void *)0x7f100000, length, PROT_NONE, |
876 | MAP_PRIVATE|MAP_ANONYMOUS|MAP_FIXED|MAP_NORESERVE, -1, 0); |
877 | } |
3d295a9f |
878 | // upper mem |
3d3fa63b |
879 | if ((offset & 0xfe000000) != 0x02000000) { |
6720e4e4 |
880 | err("unexpected devmem mmap @ %08x\n", offset); |
dc90c02d |
881 | errno = EINVAL; |
3d295a9f |
882 | return MAP_FAILED; |
883 | } |
884 | |
3d3fa63b |
885 | umem = uppermem_lookup(offset, &umem_end); |
886 | if (umem + length > umem_end) |
887 | err("warning: uppermem @ %08x overflows by %d bytes\n", |
888 | offset, umem + length - umem_end); |
889 | |
890 | dbg("upper mem @ %08x %d\n", offset, length); |
891 | return umem; |
11913091 |
892 | } |
893 | |
dc90c02d |
894 | void *emu_do_mmap(unsigned int length, int prot, int flags, int fd, unsigned int offset) |
895 | { |
896 | if (fd == FAKEDEV_MEM) |
897 | return emu_mmap_dev(length, prot, flags, offset); |
898 | |
899 | if (fd == FAKEDEV_FB0) |
900 | return emu_mmap_dev(length, prot, flags, offset + 0x03101000); |
901 | |
902 | if (fd == FAKEDEV_FB1) |
903 | return emu_mmap_dev(length, prot, flags, offset + 0x03381000); |
904 | |
7fd42181 |
905 | err("bad/ni mmap(?, %d, %x, %x, %d, %08x)\n", length, prot, flags, fd, offset); |
dc90c02d |
906 | errno = EINVAL; |
907 | return MAP_FAILED; |
908 | } |
909 | |
dc90c02d |
910 | static int emu_sound_ioctl(int fd, int request, void *argp) |
911 | { |
912 | int *arg = argp; |
913 | |
914 | #if 0 |
915 | dbg("snd ioctl(%d, %08x, %p)", fd, request, argp); |
916 | if (arg != NULL) |
917 | dbg_c(" [%d]", *arg); |
918 | dbg_c("\n"); |
919 | #endif |
920 | |
921 | /* People set strange frag settings on GP2X, which even manage |
922 | * to break audio on pandora (causes writes to fail). |
923 | * Catch this and set to something that works. */ |
924 | if (request == SNDCTL_DSP_SPEED) { |
925 | int ret, bsize, frag; |
926 | |
927 | // ~4ms. gpSP wants small buffers or else it stutters |
928 | // because of it's audio thread sync stuff |
929 | bsize = *arg / 250 * 4; |
930 | for (frag = 0; bsize; bsize >>= 1, frag++) |
931 | ; |
932 | |
933 | frag |= 16 << 16; // fragment count |
934 | ret = ioctl(fd, SNDCTL_DSP_SETFRAGMENT, &frag); |
935 | if (ret != 0) { |
936 | err("snd ioctl SETFRAGMENT %08x: ", frag); |
937 | perror(NULL); |
938 | } |
939 | } |
940 | else if (request == SNDCTL_DSP_SETFRAGMENT) |
941 | return 0; |
942 | |
943 | return ioctl(fd, request, argp); |
944 | } |
945 | |
dc90c02d |
946 | int emu_do_ioctl(int fd, int request, void *argp) |
947 | { |
948 | if (fd == emu_interesting_fds[IFD_SOUND].fd) |
949 | return emu_sound_ioctl(fd, request, argp); |
950 | |
7fd42181 |
951 | switch (fd) { |
952 | /* *********************** */ |
953 | case FAKEDEV_FB0: |
954 | case FAKEDEV_FB1: |
955 | if (argp == NULL) |
956 | goto fail; |
dc90c02d |
957 | |
dc90c02d |
958 | switch (request) { |
959 | case FBIOGET_FSCREENINFO: { |
960 | struct fb_fix_screeninfo *fix = argp; |
961 | |
962 | memset(fix, 0, sizeof(*fix)); |
963 | strcpy(fix->id, "mmsp2_RGB0"); |
964 | fix->type = FB_TYPE_PACKED_PIXELS; |
965 | fix->accel = FB_ACCEL_NONE; |
7fd42181 |
966 | fix->visual = FB_VISUAL_TRUECOLOR; |
967 | fix->line_length = 320*2; |
dc90c02d |
968 | fix->smem_start = (fd == FAKEDEV_FB0) ? 0x03101000 : 0x03381000; |
969 | fix->smem_len = 320*240*2; |
970 | return 0; |
971 | } |
972 | case FBIOGET_VSCREENINFO: { |
973 | struct fb_var_screeninfo *var = argp; |
7fd42181 |
974 | static const struct fb_bitfield fbb_red = { offset: 11, length: 5, }; |
975 | static const struct fb_bitfield fbb_green = { offset: 5, length: 6, }; |
976 | static const struct fb_bitfield fbb_blue = { offset: 0, length: 5, }; |
dc90c02d |
977 | |
978 | memset(var, 0, sizeof(*var)); |
979 | var->activate = FB_ACTIVATE_NOW; |
980 | var->xres = |
981 | var->xres_virtual = 320; |
982 | var->yres = |
983 | var->yres_virtual = 240; |
984 | var->width = |
985 | var->height = -1; |
986 | var->vmode = FB_VMODE_NONINTERLACED; |
987 | var->bits_per_pixel = 16; |
988 | var->red = fbb_red; |
989 | var->green = fbb_green; |
990 | var->blue = fbb_blue; |
991 | return 0; |
992 | } |
7fd42181 |
993 | case FBIOPUT_VSCREENINFO: { |
994 | struct fb_var_screeninfo *var = argp; |
995 | dbg(" put vscreen: %dx%d@%d\n", var->xres, var->yres, var->bits_per_pixel); |
996 | if (var->xres != 320 || var->yres != 240 || var->bits_per_pixel != 16) |
997 | return -1; |
998 | return 0; |
999 | } |
dc90c02d |
1000 | } |
7fd42181 |
1001 | |
1002 | /* *********************** */ |
1003 | case FAKEDEV_TTY0: |
1004 | // fake tty0 to make GPH SDL happy |
1005 | if (request == 0x4b46) // KDGKBENT |
1006 | return -1; |
1007 | return 0; |
dc90c02d |
1008 | } |
1009 | |
1010 | fail: |
7fd42181 |
1011 | err("bad/ni ioctl(%d, %08x, %p)\n", fd, request, argp); |
dc90c02d |
1012 | errno = EINVAL; |
1013 | return -1; |
1014 | } |
1015 | |
7fd42181 |
1016 | static const struct { |
1017 | const char *from; |
1018 | const char *to; |
1019 | } path_map[] = { |
1020 | { "/mnt/tmp/", "/tmp/" }, |
1021 | }; |
1022 | |
7fd42181 |
1023 | static const char *wrap_path(const char *path) |
1024 | { |
3d3fa63b |
1025 | char *buff; |
1026 | size_t size; |
7fd42181 |
1027 | int i, len; |
1028 | |
1029 | // do only path mapping for now |
1030 | for (i = 0; i < ARRAY_SIZE(path_map); i++) { |
1031 | len = strlen(path_map[i].from); |
1032 | if (strncmp(path, path_map[i].from, len) == 0) { |
3d3fa63b |
1033 | size = strlen(path) + strlen(path_map[i].to) + 1; |
1034 | buff = malloc(size); |
1035 | if (buff == NULL) |
1036 | break; |
1037 | snprintf(buff, size, "%s%s", path_map[i].to, path + len); |
1038 | dbg("mapped path \"%s\" -> \"%s\"\n", path, buff); |
1039 | return buff; |
7fd42181 |
1040 | } |
1041 | } |
1042 | |
1043 | return path; |
1044 | } |
1045 | |
1046 | void *emu_do_fopen(const char *path, const char *mode) |
1047 | { |
3d3fa63b |
1048 | const char *w_path = wrap_path(path); |
1049 | FILE *ret; |
1050 | ret = fopen(w_path, mode); |
1051 | if (w_path != path) |
1052 | free((void *)w_path); |
1053 | return ret; |
7fd42181 |
1054 | } |
1055 | |
3d3fa63b |
1056 | // FIXME: threads.. |
7fd42181 |
1057 | int emu_do_system(const char *command) |
1058 | { |
1059 | static char tmp_path[512]; |
3d3fa63b |
1060 | const char *p2; |
1061 | char *p; |
7fd42181 |
1062 | |
1063 | if (command == NULL) |
1064 | return -1; |
1065 | |
1066 | // pass through stuff in PATH |
1067 | p = strchr(command, ' '); |
1068 | p2 = strchr(command, '/'); |
1069 | if (p2 == NULL || (p != NULL && p2 > p)) |
1070 | return system(command); |
1071 | |
1072 | make_local_path(tmp_path, sizeof(tmp_path), "ginge_prep"); |
1073 | p = tmp_path + strlen(tmp_path); |
1074 | |
3d3fa63b |
1075 | p2 = wrap_path(command); |
1076 | snprintf(p, sizeof(tmp_path) - (p - tmp_path), " %s", p2); |
1077 | if (p2 != command) |
1078 | free((void *)p2); |
1079 | |
7fd42181 |
1080 | dbg("system: \"%s\"\n", tmp_path); |
1081 | return system(tmp_path); |
1082 | } |
1083 | |