4 * This work is licensed under the terms of the GNU GPLv2 or later.
5 * See the COPYING file in the top-level directory.
14 #include <sys/types.h>
20 #include "libpicofe/fonts.h"
21 #include "libpicofe/input.h"
22 #include "libpicofe/plat.h"
23 #include "libpicofe/arm/neon_scale2x.h"
24 #include "libpicofe/arm/neon_eagle2x.h"
25 #include "plugin_lib.h"
30 #include "pl_gun_ts.h"
32 #include "psemu_plugin_defs.h"
33 #include "../libpcsxcore/new_dynarec/new_dynarec.h"
34 #include "../libpcsxcore/psxmem_map.h"
35 #include "../plugins/dfinput/externals.h"
/* Analog stick state: 8 entries of two ints each, every value initialised
 * to 127. update_analogs() takes pointers to element 0 of each array. */
42 int in_analog_left[8][2] = {{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 }};
43 int in_analog_right[8][2] = {{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 }};
/* Two analog input devices (initially -1) and the axis pair read from each;
 * update_analogs() passes both to in_update_analog(). */
44 int in_adev[2] = { -1, -1 }, in_adev_axis[2][2] = {{ 0, 1 }, { 0, 1 }};
/* A non-zero entry makes update_analogs() run update_analog_nub_adjust()
 * on that device's values. */
45 int in_adev_is_nublike[2];
/* Key state words; update_input() stores the IN_BINDTYPE_PLAYER12 actions
 * in element 0. */
46 unsigned short in_keystate[8];
49 int in_enable_vibration;
/* Scaler target rectangle, computed by update_layer_size(). */
52 int g_layer_x, g_layer_y, g_layer_w, g_layer_h;
53 static int pl_vout_w, pl_vout_h, pl_vout_bpp; /* output display/layer */
/* Integer scale factors applied to the emulated frame, and the row offset
 * added to pl_vout_buf; all three are set in pl_vout_set_mode(). */
54 static int pl_vout_scale_w, pl_vout_scale_h, pl_vout_yoffset;
/* Emulated frame size/depth; tested by the dispmode_*() switchers. */
55 static int psx_w, psx_h, psx_bpp;
/* frame_interval is in microseconds, frame_interval1024 in 1/1024
 * microsecond units; both are set by pl_timing_prepare(). */
57 static int is_pal, frame_interval, frame_interval1024;
/* Microsecond part of the time sampled in pl_vout_open(), reduced below
 * frame_interval; pl_frame_limit() uses it to align with vsync. */
58 static int vsync_usec_time;
/* Platform hooks. pl_plat_hud_print is tested for NULL before use in
 * hud_print(), and pl_vout_set_mode() compares pl_plat_blit against NULL,
 * so both may be left unset.
 * NOTE(review): no NULL test for pl_plat_clear is visible in this excerpt. */
61 void (*pl_plat_clear)(void);
62 void (*pl_plat_blit)(int doffs, const void *src, int w, int h,
63 int sstride, int bgr24);
64 void (*pl_plat_hud_print)(int x, int y, const char *str, int bpp);
/* Computes how much this process's user-mode CPU time advanced since the
 * previous call, using /proc/self/stat. pl_frame_limit() stores the result
 * in pl_rearmed_cbs.cpu_usage.
 * NOTE(review): braces and several statements (including the return) are
 * not visible in this excerpt. In the lines shown, the results of open(),
 * read() and sscanf() are not checked - confirm against the full source. */
67 static __attribute__((noinline)) int get_cpu_ticks(void)
// value parsed on the previous call; static so it persists between calls
69 static unsigned long last_utime;
71 unsigned long utime, ret;
75 fd = open("/proc/self/stat", O_RDONLY);
// rewind so the read below starts at the beginning of the file
76 lseek(fd, 0, SEEK_SET);
78 read(fd, buf, sizeof(buf));
// force NUL termination before handing the buffer to sscanf
79 buf[sizeof(buf) - 1] = 0;
// skip the first 13 fields and parse the 14th (utime according to proc(5))
81 sscanf(buf, "%*d %*s %*c %*d %*d %*d %*d %*d %*u %*u %*u %*u %*u %lu", &utime);
82 ret = utime - last_utime;
/* Draws `text` at (x, y). If the platform installed pl_plat_hud_print, that
 * hook does the drawing and fb/w are not used; otherwise, for 16bpp output,
 * the text is rendered into `fb` (width `w`) with basic_text_out16_nf().
 * No handling for other depths is visible in this excerpt. */
89 static void hud_print(void *fb, int w, int x, int y, const char *text)
91 if (pl_plat_hud_print)
92 pl_plat_hud_print(x, y, text, pl_vout_bpp);
93 else if (pl_vout_bpp == 16)
94 basic_text_out16_nf(fb, w, x, y, text);
/* printf-style front end for hud_print(): formats `texto` and its variadic
 * arguments into a local buffer, then draws the result at (x, y). */
97 static void hud_printf(void *fb, int w, int x, int y, const char *texto, ...)
102 va_start(args, texto);
// bounded by sizeof(buffer); the buffer declaration is not visible here
103 vsnprintf(buffer, sizeof(buffer), texto, args);
106 hud_print(fb, w, x, y, buffer);
/* Draws hud_msg on the output buffer, 2 pixels right of `border` and
 * HUD_HEIGHT pixels above row `h`. */
109 static void print_msg(int h, int border)
111 hud_print(pl_vout_buf, pl_vout_w, border + 2, h - HUD_HEIGHT, hud_msg);
/* Draws pl_rearmed_cbs.flips_per_sec and pl_rearmed_cbs.vsps_cur (the
 * latter with one decimal) at the same position print_msg() uses. */
114 static void print_fps(int h, int border)
116 hud_printf(pl_vout_buf, pl_vout_w, border + 2, h - HUD_HEIGHT,
117 "%2d %4.1f", pl_rearmed_cbs.flips_per_sec,
118 pl_rearmed_cbs.vsps_cur);
/* Draws pl_rearmed_cbs.cpu_usage as a 3-wide integer, 28 pixels plus
 * `border` in from the right edge of the output (pl_vout_w).
 * The `w` parameter is not used in the lines visible here. */
121 static void print_cpu_usage(int w, int h, int border)
123 hud_printf(pl_vout_buf, pl_vout_w, pl_vout_w - border - 28,
124 h - HUD_HEIGHT, "%3d", pl_rearmed_cbs.cpu_usage);
127 // draw 192x8 status of 24 sound channels
/* One 8x8 cell per channel (24 * 8 = 192 pixels wide), horizontally centred
 * in the HUD strip HUD_HEIGHT rows above the bottom of a vout_w x vout_h
 * frame. Only acts on a 16bpp output buffer.
 * NOTE(review): several lines (braces, the early return, the pixel store and
 * the last colour alternative) are not visible in this excerpt. */
128 static __attribute__((noinline)) void draw_active_chans(int vout_w, int vout_h)
130 extern void spu_get_debug_info(int *chans_out, int *run_chans,
131 int *fmod_chans_out, int *noise_chans_out); // hack
// per-channel bitmasks filled in by spu_get_debug_info()
132 int live_chans, run_chans, fmod_chans, noise_chans;
134 static const unsigned short colors[2] = { 0x1fe3, 0x0700 };
// top-left pixel of the 192-pixel-wide bar
135 unsigned short *dest = (unsigned short *)pl_vout_buf +
136 vout_w * (vout_h - HUD_HEIGHT) + vout_w / 2 - 192/2;
137 unsigned short *d, p;
// NOTE(review): dest is derived from pl_vout_buf by pointer arithmetic, so
// this NULL test only catches a NULL pl_vout_buf when the offset is zero -
// confirm whether pl_vout_buf itself should be tested instead
140 if (dest == NULL || pl_vout_bpp != 16)
143 spu_get_debug_info(&live_chans, &run_chans, &fmod_chans, &noise_chans);
145 for (c = 0; c < 24; c++) {
// colour choice: not live -> 0x01c0 if the run bit is set, else 0;
// live -> 0xf000 if the fmod bit is set, else 0x001f if the noise bit is set
// (the final alternative is on a line not visible here)
147 p = !(live_chans & (1<<c)) ? (run_chans & (1<<c) ? 0x01c0 : 0) :
148 (fmod_chans & (1<<c)) ? 0xf000 :
149 (noise_chans & (1<<c)) ? 0x001f :
// walk the 8 rows of the cell, advancing one output row (vout_w) each time
151 for (y = 0; y < 8; y++, d += vout_w)
152 for (x = 0; x < 8; x++)
/* Draws the HUD elements selected in g_opts over a w x h image: the sound
 * channel bar (OPT_SHOWSPU), either the HUD message or the FPS counters
 * (OPT_SHOWFPS), and the CPU usage (OPT_SHOWCPU).
 * NOTE(review): the condition that selects print_msg() over print_fps() is
 * on a line not visible in this excerpt. */
157 static void print_hud(int w, int h, int xborder)
// add half of the unused output width so text aligns with the centred image
163 xborder += (pl_vout_w - w) / 2;
167 if (g_opts & OPT_SHOWSPU)
168 draw_active_chans(w, h);
171 print_msg(h, xborder);
172 else if (g_opts & OPT_SHOWFPS)
173 print_fps(h, xborder);
175 if (g_opts & OPT_SHOWCPU)
176 print_cpu_usage(w, h, xborder);
179 /* update scaler target size according to user settings */
/* Writes g_layer_x/y/w/h for a w x h source image, relative to the menu
 * screen size (g_menuscreen_w x g_menuscreen_h).
 * NOTE(review): the switch statement, most case labels, braces and the
 * statements guarded by several of the `if`s are not visible in this
 * excerpt; the comments below describe only the visible lines. */
180 static void update_layer_size(int w, int h)
187 g_layer_w = w; g_layer_h = h;
191 g_layer_w = w; g_layer_h = h;
// the next two tests ask whether a doubled width / height still fits the
// menu screen (the guarded statements are not visible here)
192 if (w * 2 <= g_menuscreen_w)
194 if (h * 2 <= g_menuscreen_h)
199 if (h > g_menuscreen_h || (240 < h && h <= 360))
202 // 4:3 that prefers integer scaling
// largest whole multiple of h that fits the menu screen height
203 imult = g_menuscreen_h / h;
204 g_layer_w = w * imult;
205 g_layer_h = h * imult;
// width/height ratio of the integer-scaled layer; outside [1.25, 1.666]
// the width is replaced with 4/3 of the height
206 mult = (float)g_layer_w / (float)g_layer_h;
207 if (mult < 1.25f || mult > 1.666f)
208 g_layer_w = 4.0f/3.0f * (float)g_layer_h;
209 printf(" -> %dx%d %.1f\n", g_layer_w, g_layer_h, mult);
// width factor: 4/3 scaled by 240/h; the layer takes the full screen height
214 mult = 240.0f / (float)h * 4.0f / 3.0f;
217 g_layer_w = mult * (float)g_menuscreen_h;
218 g_layer_h = g_menuscreen_h;
219 printf(" -> %dx%d %.1f\n", g_layer_w, g_layer_h, mult);
222 case SCALE_FULLSCREEN:
223 g_layer_w = g_menuscreen_w;
224 g_layer_h = g_menuscreen_h;
// centre the layer on the menu screen, then clamp position to >= 0 and
// size to the menu screen dimensions
231 g_layer_x = g_menuscreen_w / 2 - g_layer_w / 2;
232 g_layer_y = g_menuscreen_h / 2 - g_layer_h / 2;
233 if (g_layer_x < 0) g_layer_x = 0;
234 if (g_layer_y < 0) g_layer_y = 0;
235 if (g_layer_w > g_menuscreen_w) g_layer_w = g_menuscreen_w;
236 if (g_layer_h > g_menuscreen_h) g_layer_h = g_menuscreen_h;
239 // XXX: this is platform specific really
/* Returns non-zero when a w x h mode is within the 1024x512 limit that the
 * mode-setting and dispmode_*() code use to decide whether 2x output is
 * possible. */
240 static inline int resolution_ok(int w, int h)
242 return w <= 1024 && h <= 512;
/* Configures the output for a w x h emulated frame at `bpp` bits per pixel:
 * picks the software scale factors, asks the platform layer for a matching
 * video mode, stores the resulting geometry in the pl_vout_* statics and
 * notifies the menu code.
 * NOTE(review): many lines (braces, assignments to vout_*, the bodies of
 * most conditionals, uses of raw_w/raw_h) are not visible in this excerpt. */
245 static void pl_vout_set_mode(int w, int h, int raw_w, int raw_h, int bpp)
247 int vout_w, vout_h, vout_bpp;
250 // special h handling, Wipeout likes to change it by 1-6
251 static int vsync_cnt_ms_prev;
// true when fewer than 5*60 vsyncs have passed since the previous call
// recorded in vsync_cnt_ms_prev (unsigned subtraction, so wrap-safe)
252 if ((unsigned int)(vsync_cnt - vsync_cnt_ms_prev) < 5*60)
254 vsync_cnt_ms_prev = vsync_cnt;
262 if (pl_rearmed_cbs.only_16bpp)
265 // don't use very low heights
// centre the image vertically within 192 rows
267 buf_yoffset = (192 - vout_h) / 2;
// default: no software scaling
271 pl_vout_scale_w = pl_vout_scale_h = 1;
// 2x paths need a 16bpp source and a doubled size accepted by resolution_ok()
274 if (resolution_ok(w * 2, h * 2) && bpp == 16) {
279 // filter unavailable
283 else if (scanlines != 0 && scanline_level != 100 && bpp == 16) {
// requested output size is the source size times the chosen scale factors
288 vout_w *= pl_vout_scale_w;
289 vout_h *= pl_vout_scale_h;
291 update_layer_size(vout_w, vout_h);
// size and depth are passed by pointer, so the platform layer can change them
293 pl_vout_buf = plat_gvideo_set_mode(&vout_w, &vout_h, &vout_bpp);
// a NULL buffer is only reported when there is no pl_plat_blit hook either
294 if (pl_vout_buf == NULL && pl_plat_blit == NULL)
295 fprintf(stderr, "failed to set mode %dx%d@%d\n",
296 vout_w, vout_h, vout_bpp);
300 pl_vout_bpp = vout_bpp;
301 pl_vout_yoffset = buf_yoffset;
// skip pl_vout_yoffset rows so drawing starts at the vertically centred row
303 if (pl_vout_buf != NULL)
304 pl_vout_buf = (char *)pl_vout_buf
305 + pl_vout_yoffset * pl_vout_w * pl_vout_bpp / 8;
307 menu_notify_mode_change(pl_vout_w, pl_vout_h, pl_vout_bpp);
/* Converts one emulated frame from `vram` into the output buffer, draws the
 * HUD, and flips the display.
 *   vram   - source pixels; read as 16-bit units here
 *   stride - source row pitch in 16-bit units (src advances by it per row)
 *   bgr24  - passed through to pl_plat_blit; presumably selects the 24-bit
 *            source path - the branch testing it is not visible here
 *   w, h   - source frame size in pixels
 * NOTE(review): braces, several conditions and the NULL-buffer handling are
 * on lines not visible in this excerpt. */
310 static void pl_vout_flip(const void *vram, int stride, int bgr24, int w, int h)
312 static int doffs_old, clear_counter;
313 unsigned char *dest = pl_vout_buf;
314 const unsigned short *src = vram;
// dstride is in pixels; it is multiplied by bytes-per-pixel where used
315 int dstride = pl_vout_w, h1 = h;
// rows from the (offset) buffer start to the bottom of the output
316 int h_full = pl_vout_h - pl_vout_yoffset;
319 pcnt_start(PCNT_BLIT);
// clear everything from pl_vout_buf to the end of the output
326 memset(pl_vout_buf, 0,
327 dstride * h_full * pl_vout_bpp / 8);
// horizontal centring offset in pixels, rounded down to an even value
332 doffs = (dstride - w * pl_vout_scale_w) / 2 & ~1;
334 if (doffs > doffs_old)
338 if (clear_counter > 0) {
342 memset(pl_vout_buf, 0,
343 dstride * h_full * pl_vout_bpp / 8);
// platform-provided blit hook receives the source frame and the offset
349 pl_plat_blit(doffs, src, w, h, stride, bgr24);
// 24-bit source on a 16-bit-only output: convert each row to RGB565
360 if (pl_rearmed_cbs.only_16bpp) {
361 for (; h1-- > 0; dest += dstride * 2, src += stride)
363 bgr888_to_rgb565(dest, src, w * 3);
// 24-bit output: offset in 24-byte steps (8 pixels of 3 bytes each)
368 dest += (doffs / 8) * 24;
370 for (; h1-- > 0; dest += dstride * 3, src += stride)
372 bgr888_to_rgb888(dest, src, w * 3);
// 2x software filters; pitches are passed in bytes (16-bit pixels)
377 else if (soft_filter == SOFT_FILTER_SCALE2X && pl_vout_scale_w == 2)
379 neon_scale2x_16_16(src, (void *)dest, w,
380 stride * 2, dstride * 2, h);
382 else if (soft_filter == SOFT_FILTER_EAGLE2X && pl_vout_scale_w == 2)
384 neon_eagle2x_16_16(src, (void *)dest, w,
385 stride * 2, dstride * 2, h);
387 else if (scanlines != 0 && scanline_level != 100)
// scanline_level percentage rescaled so that 100 maps to 2048
389 int l = scanline_level * 2048 / 100;
// with vertical doubling the source row is not advanced after the first
// output row, so both rows of a pair come from the same source row
390 int stride_0 = pl_vout_scale_h >= 2 ? 0 : stride;
392 h1 *= pl_vout_scale_h;
// output rows are produced in pairs: a plain row, then a row converted
// with bgr555_to_rgb565_b() and the level `l`
393 for (; h1 >= 2; h1 -= 2)
395 bgr555_to_rgb565(dest, src, w * 2);
396 dest += dstride * 2, src += stride_0;
398 bgr555_to_rgb565_b(dest, src, w * 2, l);
399 dest += dstride * 2, src += stride;
// plain 16-bit path: one converted row per source row
405 for (; h1-- > 0; dest += dstride * 2, src += stride)
407 bgr555_to_rgb565(dest, src, w * 2);
412 print_hud(w * pl_vout_scale_w, h * pl_vout_scale_h, 0);
// take the buffer returned by the flip and re-apply the vertical offset
418 pl_vout_buf = plat_gvideo_flip();
419 if (pl_vout_buf != NULL)
420 pl_vout_buf = (char *)pl_vout_buf
421 + pl_vout_yoffset * pl_vout_w * pl_vout_bpp / 8;
// counted here; pl_frame_limit() copies it to flips_per_sec and resets it
423 pl_rearmed_cbs.flip_cnt++;
/* Opens the platform video output for the current is_pal setting and
 * records the sub-frame phase of the current time in vsync_usec_time.
 * The return value is set on a line not visible in this excerpt. */
426 static int pl_vout_open(void)
430 // force mode update on pl_vout_set_mode() call from gpulib/vout_pl
433 plat_gvideo_open(is_pal);
435 gettimeofday(&now, 0);
// reduce the microsecond part of `now` to a value below frame_interval
// NOTE(review): this loop never terminates if frame_interval is still 0;
// presumably pl_timing_prepare() always runs first - confirm
436 vsync_usec_time = now.tv_usec;
437 while (vsync_usec_time >= frame_interval)
438 vsync_usec_time -= frame_interval;
/* Counterpart of pl_vout_open(). NOTE(review): the body is not visible in
 * this excerpt, so its exact effect cannot be documented from here. */
443 static void pl_vout_close(void)
/* Stores the GPU capability flags in pl_rearmed_cbs.gpu_caps, where the
 * display-mode switching code tests them. Installed as the
 * .pl_set_gpu_caps member of pl_rearmed_cbs. */
448 static void pl_set_gpu_caps(int caps)
450 pl_rearmed_cbs.gpu_caps = caps;
/* Starts from the result of plat_prepare_screenshot(), to which w, h and
 * bpp are forwarded.
 * NOTE(review): what happens after this call (e.g. any fallback) is on
 * lines not visible in this excerpt. */
453 void *pl_prepare_screenshot(int *w, int *h, int *bpp)
455 void *ret = plat_prepare_screenshot(w, h, bpp);
466 /* display/rendering mode switcher */
/* Display mode with no extras: turns off the gpu_neon enhancement, selects
 * no software filter and announces "default mode" via hud_msg.
 * The return statement is not visible in this excerpt. */
467 static int dispmode_default(void)
469 pl_rearmed_cbs.gpu_neon.enhancement_enable = 0;
470 soft_filter = SOFT_FILTER_NONE;
471 snprintf(hud_msg, sizeof(hud_msg), "default mode");
475 #ifdef BUILTIN_GPU_NEON
/* Display mode that turns on the gpu_neon enhancement and announces
 * "double resolution". The precondition tested first is that the GPU
 * reports GPU_CAP_SUPPORTS_2X, the doubled frame passes resolution_ok(),
 * and the frame is 16bpp.
 * NOTE(review): the statement taken when the precondition fails, the return
 * values and the matching #endif are not visible in this excerpt. */
476 static int dispmode_doubleres(void)
478 if (!(pl_rearmed_cbs.gpu_caps & GPU_CAP_SUPPORTS_2X)
479 || !resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
483 pl_rearmed_cbs.gpu_neon.enhancement_enable = 1;
484 snprintf(hud_msg, sizeof(hud_msg), "double resolution");
/* Display mode that selects the scale2x software filter and announces it
 * via hud_msg. It first tests that the doubled frame passes
 * resolution_ok() and that the frame is 16bpp; the statement taken on
 * failure and the return values are not visible in this excerpt. */
490 static int dispmode_scale2x(void)
492 if (!resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
496 soft_filter = SOFT_FILTER_SCALE2X;
497 snprintf(hud_msg, sizeof(hud_msg), "scale2x");
/* Display mode that selects the eagle2x software filter and announces it
 * via hud_msg. It applies the same size/depth test as dispmode_scale2x();
 * the statement taken on failure and the return values are not visible in
 * this excerpt. */
501 static int dispmode_eagle2x(void)
503 if (!resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
507 soft_filter = SOFT_FILTER_EAGLE2X;
508 snprintf(hud_msg, sizeof(hud_msg), "eagle2x");
/* Table of display mode switcher functions that pl_switch_dispmode()
 * indexes with dispmode_current. At least one entry is conditional on
 * BUILTIN_GPU_NEON; the entries themselves are not visible in this
 * excerpt. */
513 static int (*dispmode_switchers[])(void) = {
515 #ifdef BUILTIN_GPU_NEON
/* Index into dispmode_switchers of the mode tried by pl_switch_dispmode(). */
524 static int dispmode_current;
/* Switches to another display mode from dispmode_switchers.
 * NOTE(review): the loop structure, the index increment and the action
 * taken when the GPU owns the display are on lines not visible here. */
526 void pl_switch_dispmode(void)
528 if (pl_rearmed_cbs.gpu_caps & GPU_CAP_OWNS_DISPLAY)
// wrap back to the first entry once the index runs past the table
533 if (dispmode_current >=
534 sizeof(dispmode_switchers) / sizeof(dispmode_switchers[0]))
535 dispmode_current = 0;
// invoke the selected switcher and branch on its non-zero result
536 if (dispmode_switchers[dispmode_current]())
542 /* adjust circle-like analog inputs to better match
543 * more square-like analogs in PSX */
/* Adjusts the pair (*x_, *y_) in place. Each axis is boosted by an amount
 * that depends on the magnitude of the OTHER axis, looked up in a 9-entry
 * table indexed in steps of 16.
 * NOTE(review): the definition of `d`, the derivation of the local x/y and
 * the surrounding conditionals/write-back are not visible in this excerpt. */
544 static void update_analog_nub_adjust(int *x_, int *y_)
547 static const int scale[] =
548 { 0 - d*2, 0 - d*2, 0 - d*2, 12 - d*2,
549 30 - d*2, 60 - d*2, 75 - d*2, 60 - d*2, 60 - d*2 };
// note the cross-indexing: x is scaled by a factor chosen from y, and
// y by a factor chosen from x
552 int scale_x = scale[y / 16];
553 int scale_y = scale[x / 16];
// add d plus x * scale_x / 256 (arithmetic shift)
556 x += d + (x * scale_x >> 8);
561 y += d + (y * scale_y >> 8);
/* Polls the two analog devices in in_adev[] and processes the values for
 * the left and right stick of the first pad.
 * NOTE(review): the skip conditions, the offset applied before clamping and
 * the store through nubp are on lines not visible in this excerpt. */
571 static void update_analogs(void)
// destinations: element 0 of the left and right stick arrays
573 int *nubp[2] = { in_analog_left[0], in_analog_right[0] };
577 for (i = 0; i < 2; i++)
// read both axes configured for this device
582 for (a = 0; a < 2; a++) {
585 ret = in_update_analog(in_adev[i], in_adev_axis[i][a], &v);
// rescale the raw reading by 128 / IN_ABS_RANGE
587 vals[a] = 128 * v / IN_ABS_RANGE;
590 if (in_adev_is_nublike[i])
591 update_analog_nub_adjust(&vals[0], &vals[1]);
593 for (a = 0; a < 2; a++) {
// upper clamp to 255 (the matching lower clamp is not visible here)
596 else if (v > 255) v = 255;
/* Collects the current input actions, updates the gun state, dispatches at
 * most one emulator action and stores the pad key state.
 * NOTE(review): the call that fills `actions`, the statement guarded by the
 * analog pad-type test and the declaration of `which` are on lines not
 * visible in this excerpt. */
603 static void update_input(void)
605 int actions[IN_BINDTYPE_COUNT] = { 0, };
606 unsigned int emu_act;
// analog handling applies only when pad 0 is an analog joystick or pad
609 if (in_type[0] == PSE_PAD_TYPE_ANALOGJOY || in_type[0] == PSE_PAD_TYPE_ANALOGPAD)
611 emu_act = actions[IN_BINDTYPE_EMU];
// extract the gun bits, shifted down to start at bit 0
612 in_state_gun = (emu_act & SACTION_GUN_MASK) >> SACTION_GUN_TRIGGER;
// gun bits are handled above; remove them from the emulator action mask
614 emu_act &= ~SACTION_GUN_MASK;
// advance `which` to the index of the lowest set bit; this only terminates
// when emu_act != 0 (any guard for that is not visible here)
617 for (; !(emu_act & 1); emu_act >>= 1, which++)
621 emu_set_action(emu_act);
623 in_keystate[0] = actions[IN_BINDTYPE_PLAYER12];
/* External declaration of update_input(). NOTE(review): a static definition
 * with the same name also appears earlier in this excerpt; presumably the two
 * are selected by a preprocessor conditional that is not visible here - confirm. */
626 extern void update_input(void);
/* Forwards xn, yn and in to pl_gun_ts_update() for the device `tsdev`.
 * NOTE(review): how xres/yres are filled is on lines not visible in this
 * excerpt. */
629 void pl_update_gun(int *xn, int *yn, int *xres, int *yres, int *in)
632 pl_gun_ts_update(tsdev, xn, yn, in);
/* Maximum drift, in frames, between the expected and the actual frame time
 * before pl_frame_limit() resynchronises. */
#define MAX_LAG_FRAMES 3

/* Difference tv - tv_old in microseconds for two struct timeval lvalues.
 * Every use of an argument is parenthesized so that expressions such as
 * `*(p + 1)` or `cond ? a : b` expand correctly; both arguments are
 * evaluated twice, so they must not have side effects. */
#define tvdiff(tv, tv_old) \
	(((tv).tv_sec - (tv_old).tv_sec) * 1000000 + (tv).tv_usec - (tv_old).tv_usec)
643 /* called on every vsync */
/* Per-vsync housekeeping: refreshes the once-per-second statistics shown in
 * the HUD, advances the expected frame time, sleeps when running ahead and
 * sets the frameskip advice when running behind.
 * NOTE(review): braces, local declarations, the input update call and
 * several statements are on lines not visible in this excerpt. */
644 void pl_frame_limit(void)
646 static struct timeval tv_old, tv_expect;
647 static int vsync_cnt_prev, drc_active_vsyncs;
656 /* doing input here because the pad is polled
657 * thousands of times per frame for some reason */
661 gettimeofday(&now, 0);
// statistics are refreshed when the wall-clock second changes
663 if (now.tv_sec != tv_old.tv_sec) {
664 diff = tvdiff(now, tv_old);
// vsyncs per second over the elapsed interval; left at 0 unless the
// interval is positive and shorter than two seconds
665 pl_rearmed_cbs.vsps_cur = 0.0f;
666 if (0 < diff && diff < 2000000)
667 pl_rearmed_cbs.vsps_cur = 1000000.0f * (vsync_cnt - vsync_cnt_prev) / diff;
668 vsync_cnt_prev = vsync_cnt;
// flip_cnt is incremented in pl_vout_flip()
670 if (g_opts & OPT_SHOWFPS)
671 pl_rearmed_cbs.flips_per_sec = pl_rearmed_cbs.flip_cnt;
672 pl_rearmed_cbs.flip_cnt = 0;
673 if (g_opts & OPT_SHOWCPU)
674 pl_rearmed_cbs.cpu_usage = get_cpu_ticks();
676 if (hud_new_msg > 0) {
678 if (hud_new_msg == 0)
682 //new_dynarec_print_stats();
685 static int ya_vsync_count;
686 if (++ya_vsync_count == PCNT_FRAMES) {
687 pcnt_print(pl_rearmed_cbs.vsps_cur);
692 // tv_expect uses usec*1024 units instead of usecs for better accuracy
693 tv_expect.tv_usec += frame_interval1024;
// carry into the seconds field once a full second (in usec*1024) is reached
694 if (tv_expect.tv_usec >= (1000000 << 10)) {
695 tv_expect.tv_usec -= (1000000 << 10);
// microseconds until the expected frame time; negative means running late
698 diff = (tv_expect.tv_sec - now.tv_sec) * 1000000 + (tv_expect.tv_usec >> 10) - now.tv_usec;
// more than MAX_LAG_FRAMES frames off in either direction: resynchronise
700 if (diff > MAX_LAG_FRAMES * frame_interval || diff < -MAX_LAG_FRAMES * frame_interval) {
701 //printf("pl_frame_limit reset, diff=%d, iv %d\n", diff, frame_interval);
704 // try to align with vsync
705 usadj = vsync_usec_time;
706 while (usadj < tv_expect.tv_usec - frame_interval)
707 usadj += frame_interval;
// convert back to the usec*1024 representation
708 tv_expect.tv_usec = usadj << 10;
// sleep only if the limiter is enabled and we are over one frame ahead;
// the sleep leaves one frame_interval of margin
711 if (!(g_opts & OPT_NO_FRAMELIM) && diff > frame_interval) {
712 // yay for working usleep on pandora!
713 //printf("usleep %d\n", diff - frame_interval / 2);
714 usleep(diff - frame_interval);
// with frameskip enabled, advise a skip when over one frame behind
717 if (pl_rearmed_cbs.frameskip) {
718 if (diff < -frame_interval)
719 pl_rearmed_cbs.fskip_advice = 1;
721 pl_rearmed_cbs.fskip_advice = 0;
723 // recompilation is not that fast and may cause frame skip on
724 // loading screens and such, resulting in flicker or glitches
725 if (new_dynarec_did_compile) {
726 if (drc_active_vsyncs < 32)
727 pl_rearmed_cbs.fskip_advice = 0;
731 drc_active_vsyncs = 0;
732 new_dynarec_did_compile = 0;
735 pcnt_start(PCNT_ALL);
/* Resets the timing-related fields of pl_rearmed_cbs and derives the frame
 * interval constants from the video standard.
 * NOTE(review): the assignment of is_pal from is_pal_ is presumably on a
 * line not visible in this excerpt - confirm. */
738 void pl_timing_prepare(int is_pal_)
740 pl_rearmed_cbs.fskip_advice = 0;
741 pl_rearmed_cbs.flips_per_sec = 0;
742 pl_rearmed_cbs.cpu_usage = 0;
// frame period in microseconds: 20000 for PAL, otherwise 16667
745 frame_interval = is_pal ? 20000 : 16667;
// same period in usec*1024 units; 17066667 is 1000000*1024/60 rounded,
// i.e. slightly more precise than 16667*1024
746 frame_interval1024 = is_pal ? 20000*1024 : 17066667;
748 // used by P.E.Op.S. frameskip code
749 pl_rearmed_cbs.gpu_peops.fFrameRateHz = is_pal ? 50.0f : 59.94f;
// 100000 divided by the frame rate, computed in fixed point (both scaled by 100)
750 pl_rearmed_cbs.gpu_peops.dwFrameRateTicks =
751 (100000*100 / (unsigned long)(pl_rearmed_cbs.gpu_peops.fFrameRateHz*100));
/* Reports a layer position and size through x, y, w and h; presumably the
 * g_layer_* values computed by update_layer_size().
 * NOTE(review): the body is not visible in this excerpt - confirm. */
754 static void pl_get_layer_pos(int *x, int *y, int *w, int *h)
/* Forward declarations; both functions are defined later in this file in
 * terms of psxMapHook/psxUnmapHook with MAP_TAG_VRAM. */
762 static void *pl_mmap(unsigned int size);
763 static void pl_munmap(void *ptr, unsigned int size);
/* Callback/state structure shared between this frontend code and the
 * plugins; its fields are read and written throughout this file. Only the
 * .pl_set_gpu_caps initialiser is visible in this excerpt. */
765 struct rearmed_cbs pl_rearmed_cbs = {
774 .pl_set_gpu_caps = pl_set_gpu_caps,
/* Thread body started by pl_start_watchdog(). It watches vsync_cnt for
 * progress and reports a lockup on stderr when progress stops.
 * NOTE(review): the loop, the sleep interval, the seen_dead bookkeeping and
 * the action taken after the "lockup detected" message are on lines not
 * visible in this excerpt. */
778 static void *watchdog_thread(void *unused)
// last observed value of vsync_cnt
780 int vsync_cnt_old = 0;
784 #if !defined(NDEBUG) || defined(DRC_DBG)
785 // don't interfere with debug
// vsync_cnt changed since the last check: record the new value
797 if (vsync_cnt != vsync_cnt_old) {
798 vsync_cnt_old = vsync_cnt;
807 fprintf(stderr, "watchdog: seen_dead %d\n", seen_dead);
809 fprintf(stderr, "watchdog: lockup detected, aborting\n");
810 // we can't do any cleanup here really, the main thread is
811 // likely touching resources and would crash anyway
/* Starts watchdog_thread() as a detached thread, so it is never joined.
 * A failure is reported on stderr together with the value in `ret`; the
 * test that guards that message is not visible in this excerpt. */
817 void pl_start_watchdog(void)
823 pthread_attr_init(&attr);
824 pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
826 ret = pthread_create(&tid, &attr, watchdog_thread, NULL);
828 fprintf(stderr, "could not start watchdog: %d\n", ret);
/* Memory mapping hook installed as psxMapHook: forwards addr, size and
 * is_fixed to plat_mmap(), passing 0 as the third argument. The remaining
 * parameter(s), declared on a line not visible in this excerpt, are not
 * used by the visible call. */
831 static void *pl_emu_mmap(unsigned long addr, size_t size, int is_fixed,
834 return plat_mmap(addr, size, 0, is_fixed);
/* Unmapping hook installed as psxUnmapHook: releases the mapping through
 * plat_munmap(). The `tag` argument is not used by the visible call. */
837 static void pl_emu_munmap(void *ptr, size_t size, enum psxMapTag tag)
839 plat_munmap(ptr, size);
/* Allocates `size` bytes through the current psxMapHook, with address 0,
 * third argument 0 and tag MAP_TAG_VRAM. Returns the hook's result. */
842 static void *pl_mmap(unsigned int size)
844 return psxMapHook(0, size, 0, MAP_TAG_VRAM);
/* Releases a mapping obtained from pl_mmap() through the current
 * psxUnmapHook, using the same MAP_TAG_VRAM tag. */
847 static void pl_munmap(void *ptr, unsigned int size)
849 psxUnmapHook(ptr, size, MAP_TAG_VRAM);
854 extern unsigned int hSyncCount; // from psxcounters
855 extern unsigned int frame_counter;
857 psx_w = psx_h = pl_vout_w = pl_vout_h = 256;
858 psx_bpp = pl_vout_bpp = 16;
860 tsdev = pl_gun_ts_init();
862 pl_rearmed_cbs.gpu_hcnt = &hSyncCount;
863 pl_rearmed_cbs.gpu_frame_count = &frame_counter;
865 psxMapHook = pl_emu_mmap;
866 psxUnmapHook = pl_emu_munmap;