4 * This work is licensed under the terms of the GNU GPLv2 or later.
5 * See the COPYING file in the top-level directory.
14 #include <sys/types.h>
20 #include "libpicofe/fonts.h"
21 #include "libpicofe/input.h"
22 #include "libpicofe/plat.h"
23 #include "libpicofe/arm/neon_scale2x.h"
24 #include "libpicofe/arm/neon_eagle2x.h"
25 #include "plugin_lib.h"
30 #include "pl_gun_ts.h"
32 #include "psemu_plugin_defs.h"
33 #include "../libpcsxcore/new_dynarec/new_dynarec.h"
34 #include "../libpcsxcore/psxmem_map.h"
35 #include "../plugins/dfinput/externals.h"
/* Analog input state: 8 entries of 2 ints each, every value initialised to 127. */
42 int in_analog_left[8][2] = {{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 }};
43 int in_analog_right[8][2] = {{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 }};
/* Analog device ids (both start at -1) and the two axis indices read per device;
 * update_analogs() passes these to in_update_analog(). */
44 int in_adev[2] = { -1, -1 }, in_adev_axis[2][2] = {{ 0, 1 }, { 0, 1 }};
/* Non-zero entries make update_analogs() apply update_analog_nub_adjust(). */
45 int in_adev_is_nublike[2];
46 unsigned short in_keystate[8];
49 int in_enable_vibration;
/* Layer position and size; computed by update_layer_size(). */
52 int g_layer_x, g_layer_y, g_layer_w, g_layer_h;
53 static int pl_vout_w, pl_vout_h, pl_vout_bpp; /* output display/layer */
54 static int pl_vout_scale_w, pl_vout_scale_h, pl_vout_yoffset;
55 static int psx_w, psx_h, psx_bpp;
/* Timing values; frame_interval and frame_interval1024 are set in pl_timing_prepare(). */
57 static int is_pal, frame_interval, frame_interval1024;
58 static int vsync_usec_time;
/* Platform hook function pointers. hud_print() uses pl_plat_hud_print when
 * it is non-NULL; pl_vout_flip() calls pl_plat_blit. */
61 void (*pl_plat_clear)(void);
62 void (*pl_plat_blit)(int doffs, const void *src, int w, int h,
63 int sstride, int bgr24);
64 void (*pl_plat_hud_print)(int x, int y, const char *str, int bpp);
/* Reads /proc/self/stat and computes how much the 14th field (utime in
 * proc(5)) advanced since the previous call, kept in the static last_utime.
 * NOTE(review): in the lines visible here the results of open(), read() and
 * sscanf() are not checked -- confirm against the full function. */
67 static __attribute__((noinline)) int get_cpu_ticks(void)
69 static unsigned long last_utime;
71 unsigned long utime, ret;
75 fd = open("/proc/self/stat", O_RDONLY);
/* rewind so the file can be re-read */
76 lseek(fd, 0, SEEK_SET);
78 read(fd, buf, sizeof(buf));
/* force NUL termination before parsing */
79 buf[sizeof(buf) - 1] = 0;
/* skip the first 13 fields, read the 14th as unsigned long */
81 sscanf(buf, "%*d %*s %*c %*d %*d %*d %*d %*d %*u %*u %*u %*u %*u %lu", &utime);
82 ret = utime - last_utime;
/* Draw text at (x, y): use the platform hook pl_plat_hud_print when one is
 * installed, otherwise fall back to basic_text_out16_nf() on the fb buffer
 * (width w) when the output is 16bpp. */
89 static void hud_print(void *fb, int w, int x, int y, const char *text)
91 if (pl_plat_hud_print)
92 pl_plat_hud_print(x, y, text, pl_vout_bpp);
93 else if (pl_vout_bpp == 16)
94 basic_text_out16_nf(fb, w, x, y, text);
/* printf-style front end for hud_print(): formats the arguments into a
 * local buffer with vsnprintf() (bounded by sizeof(buffer)) and prints it. */
97 static void hud_printf(void *fb, int w, int x, int y, const char *texto, ...)
102 va_start(args, texto);
103 vsnprintf(buffer, sizeof(buffer), texto, args);
106 hud_print(fb, w, x, y, buffer);
/* Print hud_msg into pl_vout_buf at x = border + 2, y = h - HUD_HEIGHT. */
109 static void print_msg(int h, int border)
111 hud_print(pl_vout_buf, pl_vout_w, border + 2, h - HUD_HEIGHT, hud_msg);
/* Print pl_rearmed_cbs.flips_per_sec and pl_rearmed_cbs.vsps_cur at
 * x = border + 2, y = h - HUD_HEIGHT. */
114 static void print_fps(int h, int border)
116 hud_printf(pl_vout_buf, pl_vout_w, border + 2, h - HUD_HEIGHT,
117 "%2d %4.1f", pl_rearmed_cbs.flips_per_sec,
118 pl_rearmed_cbs.vsps_cur);
/* Print pl_rearmed_cbs.cpu_usage ("%3d") near the right edge:
 * x = pl_vout_w - border - 28, y = h - HUD_HEIGHT.
 * The w parameter is not used in the lines visible here. */
121 static void print_cpu_usage(int w, int h, int border)
123 hud_printf(pl_vout_buf, pl_vout_w, pl_vout_w - border - 28,
124 h - HUD_HEIGHT, "%3d", pl_rearmed_cbs.cpu_usage);
127 // draw 192x8 status of 24 sound channels
// Each channel gets an 8x8 cell; the strip starts HUD_HEIGHT rows above
// vout_h and is horizontally centered (vout_w / 2 - 192/2).
// Channel bitmasks come from spu_get_debug_info().
128 static __attribute__((noinline)) void draw_active_chans(int vout_w, int vout_h)
130 extern void spu_get_debug_info(int *chans_out, int *run_chans,
131 int *fmod_chans_out, int *noise_chans_out); // hack
132 int live_chans, run_chans, fmod_chans, noise_chans;
134 static const unsigned short colors[2] = { 0x1fe3, 0x0700 };
135 unsigned short *dest = (unsigned short *)pl_vout_buf +
136 vout_w * (vout_h - HUD_HEIGHT) + vout_w / 2 - 192/2;
137 unsigned short *d, p;
// NOTE(review): dest is pl_vout_buf plus an offset, so this NULL test only
// catches a NULL pl_vout_buf when the offset happens to be 0 -- confirm intent.
140 if (dest == NULL || pl_vout_bpp != 16)
143 spu_get_debug_info(&live_chans, &run_chans, &fmod_chans, &noise_chans);
145 for (c = 0; c < 24; c++) {
// color: not live -> 0x01c0 if still running else 0; fmod -> 0xf000;
// noise -> 0x001f; remaining case is on a line not visible here
147 p = !(live_chans & (1<<c)) ? (run_chans & (1<<c) ? 0x01c0 : 0) :
148 (fmod_chans & (1<<c)) ? 0xf000 :
149 (noise_chans & (1<<c)) ? 0x001f :
151 for (y = 0; y < 8; y++, d += vout_w)
152 for (x = 0; x < 8; x++)
/* Draw the HUD elements selected in g_opts for a w x h picture: the SPU
 * channel strip, then either the message or the FPS line, then CPU usage.
 * The condition that selects print_msg() is on a line not visible here. */
157 static void print_hud(int w, int h, int xborder)
/* account for the picture being centered inside a wider output */
163 xborder += (pl_vout_w - w) / 2;
167 if (g_opts & OPT_SHOWSPU)
168 draw_active_chans(w, h);
171 print_msg(h, xborder);
172 else if (g_opts & OPT_SHOWFPS)
173 print_fps(h, xborder);
175 if (g_opts & OPT_SHOWCPU)
176 print_cpu_usage(w, h, xborder);
179 /* update scaler target size according to user settings */
/* Computes g_layer_w/g_layer_h for a w x h source, then centers the layer
 * on the menu screen (g_menuscreen_w x g_menuscreen_h) and clamps it to the
 * screen. The switch/case labels selecting each branch are mostly on lines
 * not visible here; only SCALE_FULLSCREEN is shown. */
180 static void update_layer_size(int w, int h)
187 g_layer_w = w; g_layer_h = h;
191 g_layer_w = w; g_layer_h = h;
192 if (w * 2 <= g_menuscreen_w)
194 if (h * 2 <= g_menuscreen_h)
199 if (h > g_menuscreen_h || (240 < h && h <= 360))
202 // 4:3 that prefers integer scaling
203 imult = g_menuscreen_h / h;
204 g_layer_w = w * imult;
205 g_layer_h = h * imult;
/* aspect ratio after integer scaling; outside 1.25..1.666 force 4:3 width */
206 mult = (float)g_layer_w / (float)g_layer_h;
207 if (mult < 1.25f || mult > 1.666f)
208 g_layer_w = 4.0f/3.0f * (float)g_layer_h;
209 printf(" -> %dx%d %.1f\n", g_layer_w, g_layer_h, mult);
/* width factor relative to a 240-line 4:3 picture */
214 mult = 240.0f / (float)h * 4.0f / 3.0f;
217 g_layer_w = mult * (float)g_menuscreen_h;
218 g_layer_h = g_menuscreen_h;
219 printf(" -> %dx%d %.1f\n", g_layer_w, g_layer_h, mult);
222 case SCALE_FULLSCREEN:
223 g_layer_w = g_menuscreen_w;
224 g_layer_h = g_menuscreen_h;
/* center on screen, then clamp position to >= 0 and size to the screen */
231 g_layer_x = g_menuscreen_w / 2 - g_layer_w / 2;
232 g_layer_y = g_menuscreen_h / 2 - g_layer_h / 2;
233 if (g_layer_x < 0) g_layer_x = 0;
234 if (g_layer_y < 0) g_layer_y = 0;
235 if (g_layer_w > g_menuscreen_w) g_layer_w = g_menuscreen_w;
236 if (g_layer_h > g_menuscreen_h) g_layer_h = g_menuscreen_h;
239 // XXX: this is platform specific really
// Returns non-zero when w x h fits within the 1024x512 limit.
240 static inline int resolution_ok(int w, int h)
242 return w <= 1024 && h <= 512;
/* Selects the output mode for a w x h, bpp-deep source picture.
 * Visible steps: pick the scale factors (2x filters need resolution_ok() and
 * 16bpp), update the layer size, ask the platform for the mode via
 * plat_gvideo_set_mode(), store the resulting bpp and y offset, offset
 * pl_vout_buf by pl_vout_yoffset rows, and notify the menu code.
 * raw_w/raw_h are not referenced in the lines visible here. */
245 static void pl_vout_set_mode(int w, int h, int raw_w, int raw_h, int bpp)
247 int vout_w, vout_h, vout_bpp;
250 // special h handling, Wipeout likes to change it by 1-6
251 static int vsync_cnt_ms_prev;
/* true when the previous mode set was fewer than 5*60 vsyncs ago */
252 if ((unsigned int)(vsync_cnt - vsync_cnt_ms_prev) < 5*60)
254 vsync_cnt_ms_prev = vsync_cnt;
262 if (pl_rearmed_cbs.only_16bpp)
265 // don't use very low heights
267 buf_yoffset = (192 - vout_h) / 2;
271 pl_vout_scale_w = pl_vout_scale_h = 1;
274 if (resolution_ok(w * 2, h * 2) && bpp == 16) {
279 // filter unavailable
283 else if (scanlines != 0 && scanline_level != 100 && bpp == 16) {
288 vout_w *= pl_vout_scale_w;
289 vout_h *= pl_vout_scale_h;
291 update_layer_size(vout_w, vout_h);
293 pl_vout_buf = plat_gvideo_set_mode(&vout_w, &vout_h, &vout_bpp);
/* a NULL buffer is only reported when no platform blitter is installed */
294 if (pl_vout_buf == NULL && pl_plat_blit == NULL)
295 fprintf(stderr, "failed to set mode %dx%d@%d\n",
296 vout_w, vout_h, vout_bpp);
300 pl_vout_bpp = vout_bpp;
301 pl_vout_yoffset = buf_yoffset;
/* skip pl_vout_yoffset rows (byte offset) at the top of the buffer */
303 if (pl_vout_buf != NULL)
304 pl_vout_buf = (char *)pl_vout_buf
305 + pl_vout_yoffset * pl_vout_w * pl_vout_bpp / 8;
307 menu_notify_mode_change(pl_vout_w, pl_vout_h, pl_vout_bpp);
/* Copies one w x h frame from vram (row pitch `stride`, in 16-bit units as
 * used by the src pointer arithmetic) into the output buffer, converting the
 * pixel format, then draws the HUD and flips via plat_gvideo_flip().
 * Visible conversion paths: 24-bit source (to rgb565 when only_16bpp,
 * otherwise rgb888), scale2x / eagle2x NEON filters, scanlines, and plain
 * bgr555 -> rgb565. Several branch conditions are on lines not visible here. */
310 static void pl_vout_flip(const void *vram, int stride, int bgr24, int w, int h)
312 static int doffs_old, clear_counter;
313 unsigned char *dest = pl_vout_buf;
314 const unsigned short *src = vram;
315 int dstride = pl_vout_w, h1 = h;
318 pcnt_start(PCNT_BLIT);
/* clear the whole output buffer */
325 memset(pl_vout_buf, 0,
326 dstride * pl_vout_h * pl_vout_bpp / 8);
/* horizontal centering offset in pixels, forced even */
331 doffs = (dstride - w * pl_vout_scale_w) / 2 & ~1;
333 if (doffs > doffs_old)
337 if (clear_counter > 0) {
341 memset(pl_vout_buf, 0,
342 dstride * pl_vout_h * pl_vout_bpp / 8);
348 pl_plat_blit(doffs, src, w, h, stride, bgr24);
359 if (pl_rearmed_cbs.only_16bpp) {
360 for (; h1-- > 0; dest += dstride * 2, src += stride)
362 bgr888_to_rgb565(dest, src, w * 3);
367 dest += (doffs / 8) * 24;
369 for (; h1-- > 0; dest += dstride * 3, src += stride)
371 bgr888_to_rgb888(dest, src, w * 3);
376 else if (soft_filter == SOFT_FILTER_SCALE2X && pl_vout_scale_w == 2)
378 neon_scale2x_16_16(src, (void *)dest, w,
379 stride * 2, dstride * 2, h);
381 else if (soft_filter == SOFT_FILTER_EAGLE2X && pl_vout_scale_w == 2)
383 neon_eagle2x_16_16(src, (void *)dest, w,
384 stride * 2, dstride * 2, h);
386 else if (scanlines != 0 && scanline_level != 100)
388 int l = scanline_level * 2048 / 100;
/* with vertical doubling the same source row is used for both output rows */
389 int stride_0 = pl_vout_scale_h >= 2 ? 0 : stride;
391 h1 *= pl_vout_scale_h;
/* rows are written in pairs: a normal row, then a row through the _b variant with level l */
392 for (; h1 >= 2; h1 -= 2)
394 bgr555_to_rgb565(dest, src, w * 2);
395 dest += dstride * 2, src += stride_0;
397 bgr555_to_rgb565_b(dest, src, w * 2, l);
398 dest += dstride * 2, src += stride;
404 src = (void *)((uintptr_t)src & ~3); // align for the blitter
406 for (; h1-- > 0; dest += dstride * 2, src += stride)
408 bgr555_to_rgb565(dest, src, w * 2);
413 print_hud(w * pl_vout_scale_w, h * pl_vout_scale_h, 0);
/* flip, then re-apply the y offset to the new buffer pointer */
419 pl_vout_buf = plat_gvideo_flip();
420 if (pl_vout_buf != NULL)
421 pl_vout_buf = (char *)pl_vout_buf
422 + pl_vout_yoffset * pl_vout_w * pl_vout_bpp / 8;
424 pl_rearmed_cbs.flip_cnt++;
/* Opens the platform video output (plat_gvideo_open) and records the current
 * time-of-day microseconds, reduced below frame_interval, in vsync_usec_time. */
427 static int pl_vout_open(void)
431 // force mode update on pl_vout_set_mode() call from gpulib/vout_pl
434 plat_gvideo_open(is_pal);
436 gettimeofday(&now, 0);
437 vsync_usec_time = now.tv_usec;
/* reduce to the range [0, frame_interval) */
438 while (vsync_usec_time >= frame_interval)
439 vsync_usec_time -= frame_interval;
444 static void pl_vout_close(void)
/* Stores the GPU capability flags in pl_rearmed_cbs.gpu_caps. */
449 static void pl_set_gpu_caps(int caps)
451 pl_rearmed_cbs.gpu_caps = caps;
/* Asks the platform layer for screenshot data via plat_prepare_screenshot(),
 * passing the w/h/bpp out-pointers through. Handling of the result is on
 * lines not visible here. */
454 void *pl_prepare_screenshot(int *w, int *h, int *bpp)
456 void *ret = plat_prepare_screenshot(w, h, bpp);
467 /* display/rendering mode switcher */
/* Display mode: NEON GPU enhancement off, no software filter. Sets the HUD
 * message to "default mode". */
468 static int dispmode_default(void)
470 pl_rearmed_cbs.gpu_neon.enhancement_enable = 0;
471 soft_filter = SOFT_FILTER_NONE;
472 snprintf(hud_msg, sizeof(hud_msg), "default mode");
476 #ifdef BUILTIN_GPU_NEON
/* Display mode: enable the NEON GPU enhancement ("double resolution").
 * Requires GPU_CAP_SUPPORTS_2X, a doubled size accepted by resolution_ok()
 * and a 16bpp PSX picture; what happens when the check fails is on lines
 * not visible here. */
477 static int dispmode_doubleres(void)
479 if (!(pl_rearmed_cbs.gpu_caps & GPU_CAP_SUPPORTS_2X)
480 || !resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
484 pl_rearmed_cbs.gpu_neon.enhancement_enable = 1;
485 snprintf(hud_msg, sizeof(hud_msg), "double resolution");
/* Display mode: select the scale2x software filter. Requires a doubled size
 * accepted by resolution_ok() and a 16bpp PSX picture. */
491 static int dispmode_scale2x(void)
493 if (!resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
497 soft_filter = SOFT_FILTER_SCALE2X;
498 snprintf(hud_msg, sizeof(hud_msg), "scale2x");
/* Display mode: select the eagle2x software filter. Requires a doubled size
 * accepted by resolution_ok() and a 16bpp PSX picture. */
502 static int dispmode_eagle2x(void)
504 if (!resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
508 soft_filter = SOFT_FILTER_EAGLE2X;
509 snprintf(hud_msg, sizeof(hud_msg), "eagle2x");
/* Table of display mode switch functions used by pl_switch_dispmode();
 * some entries are only compiled in with BUILTIN_GPU_NEON. The entries
 * themselves are on lines not visible here. */
514 static int (*dispmode_switchers[])(void) = {
516 #ifdef BUILTIN_GPU_NEON
/* index of the current entry in dispmode_switchers */
525 static int dispmode_current;
/* Switches display mode by calling an entry of dispmode_switchers;
 * dispmode_current wraps to 0 past the end of the table. Checks
 * GPU_CAP_OWNS_DISPLAY first (the action taken is on a line not visible here). */
527 void pl_switch_dispmode(void)
529 if (pl_rearmed_cbs.gpu_caps & GPU_CAP_OWNS_DISPLAY)
534 if (dispmode_current >=
535 sizeof(dispmode_switchers) / sizeof(dispmode_switchers[0]))
536 dispmode_current = 0;
537 if (dispmode_switchers[dispmode_current]())
543 /* adjust circle-like analog inputs to better match
544 * more square-like analogs in PSX */
/* Each axis is scaled by a table entry selected from the OTHER axis'
 * value / 16 (scale_x from y, scale_y from x). The definition of d and the
 * derivation of x/y from *x_/*y_ are on lines not visible here. */
545 static void update_analog_nub_adjust(int *x_, int *y_)
548 static const int scale[] =
549 { 0 - d*2, 0 - d*2, 0 - d*2, 12 - d*2,
550 30 - d*2, 60 - d*2, 75 - d*2, 60 - d*2, 60 - d*2 };
553 int scale_x = scale[y / 16];
554 int scale_y = scale[x / 16];
/* fixed-point scale: the table value is in 1/256 units */
557 x += d + (x * scale_x >> 8);
562 y += d + (y * scale_y >> 8);
/* Polls the two configured analog devices (in_adev[i]) on their two axes,
 * rescales each reading with 128 * v / IN_ABS_RANGE, optionally applies the
 * nub adjustment, and clamps results (upper bound 255 is visible). The
 * store into in_analog_left/right via nubp is on lines not visible here. */
572 static void update_analogs(void)
574 int *nubp[2] = { in_analog_left[0], in_analog_right[0] };
578 for (i = 0; i < 2; i++)
583 for (a = 0; a < 2; a++) {
586 ret = in_update_analog(in_adev[i], in_adev_axis[i][a], &v);
588 vals[a] = 128 * v / IN_ABS_RANGE;
591 if (in_adev_is_nublike[i])
592 update_analog_nub_adjust(&vals[0], &vals[1]);
594 for (a = 0; a < 2; a++) {
597 else if (v > 255) v = 255;
602 //printf("%4d %4d %4d %4d\n", in_a1[0], in_a1[1], in_a2[0], in_a2[1]);
/* Gathers the current input actions. Visible steps: extract the gun bits
 * from the emulator actions into in_state_gun, strip them from emu_act,
 * pass the remaining action on via emu_set_action(), and copy the
 * IN_BINDTYPE_PLAYER12 actions into in_keystate[0]. How `actions` is filled
 * is on lines not visible here. */
605 static void update_input(void)
607 int actions[IN_BINDTYPE_COUNT] = { 0, };
608 unsigned int emu_act;
611 if (in_type[0] == PSE_PAD_TYPE_ANALOGJOY || in_type[0] == PSE_PAD_TYPE_ANALOGPAD)
613 emu_act = actions[IN_BINDTYPE_EMU];
614 in_state_gun = (emu_act & SACTION_GUN_MASK) >> SACTION_GUN_TRIGGER;
616 emu_act &= ~SACTION_GUN_MASK;
/* advance `which` to the position of the lowest set bit of emu_act */
619 for (; !(emu_act & 1); emu_act >>= 1, which++)
623 emu_set_action(emu_act);
625 in_keystate[0] = actions[IN_BINDTYPE_PLAYER12];
628 extern void update_input(void);
/* Updates the gun position/state through pl_gun_ts_update() on tsdev.
 * xres/yres are not referenced in the lines visible here. */
631 void pl_update_gun(int *xn, int *yn, int *xres, int *yres, int *in)
634 pl_gun_ts_update(tsdev, xn, yn, in);
640 #define MAX_LAG_FRAMES 3
/* Difference (tv - tv_old) in microseconds between two struct timeval-like
 * values (anything with tv_sec and tv_usec members). Each argument is
 * parenthesized so that non-trivial expressions such as *ptr expand
 * correctly. Both arguments are evaluated twice. */
#define tvdiff(tv, tv_old) \
	(((tv).tv_sec - (tv_old).tv_sec) * 1000000 + (tv).tv_usec - (tv_old).tv_usec)
645 /* called on every vsync */
/* Frame limiter and once-per-second statistics.
 * Visible behaviour: when the wall-clock second changes, recompute
 * vsps_cur / flips_per_sec / cpu_usage; advance the expected frame time by
 * frame_interval1024; re-synchronize when the drift exceeds MAX_LAG_FRAMES
 * frames; sleep when ahead of schedule (unless OPT_NO_FRAMELIM); and set
 * fskip_advice when frameskip is enabled and the emulation is behind. */
646 void pl_frame_limit(void)
648 static struct timeval tv_old, tv_expect;
649 static int vsync_cnt_prev, drc_active_vsyncs;
658 /* doing input here because the pad is polled
659 * thousands of times per frame for some reason */
663 gettimeofday(&now, 0);
/* once per wall-clock second: refresh the statistics */
665 if (now.tv_sec != tv_old.tv_sec) {
666 diff = tvdiff(now, tv_old);
667 pl_rearmed_cbs.vsps_cur = 0.0f;
/* only compute a rate for a plausible interval (0 < diff < 2s) */
668 if (0 < diff && diff < 2000000)
669 pl_rearmed_cbs.vsps_cur = 1000000.0f * (vsync_cnt - vsync_cnt_prev) / diff;
670 vsync_cnt_prev = vsync_cnt;
672 if (g_opts & OPT_SHOWFPS)
673 pl_rearmed_cbs.flips_per_sec = pl_rearmed_cbs.flip_cnt;
674 pl_rearmed_cbs.flip_cnt = 0;
675 if (g_opts & OPT_SHOWCPU)
676 pl_rearmed_cbs.cpu_usage = get_cpu_ticks();
678 if (hud_new_msg > 0) {
680 if (hud_new_msg == 0)
684 //new_dynarec_print_stats();
687 static int ya_vsync_count;
688 if (++ya_vsync_count == PCNT_FRAMES) {
689 pcnt_print(pl_rearmed_cbs.vsps_cur);
694 // tv_expect uses usec*1024 units instead of usecs for better accuracy
695 tv_expect.tv_usec += frame_interval1024;
696 if (tv_expect.tv_usec >= (1000000 << 10)) {
697 tv_expect.tv_usec -= (1000000 << 10);
/* how far ahead (positive) or behind (negative) of schedule we are, in usec */
700 diff = (tv_expect.tv_sec - now.tv_sec) * 1000000 + (tv_expect.tv_usec >> 10) - now.tv_usec;
/* drift beyond MAX_LAG_FRAMES frames in either direction: re-synchronize */
702 if (diff > MAX_LAG_FRAMES * frame_interval || diff < -MAX_LAG_FRAMES * frame_interval) {
703 //printf("pl_frame_limit reset, diff=%d, iv %d\n", diff, frame_interval);
706 // try to align with vsync
707 usadj = vsync_usec_time;
708 while (usadj < tv_expect.tv_usec - frame_interval)
709 usadj += frame_interval;
710 tv_expect.tv_usec = usadj << 10;
713 if (!(g_opts & OPT_NO_FRAMELIM) && diff > frame_interval) {
714 // yay for working usleep on pandora!
715 //printf("usleep %d\n", diff - frame_interval / 2);
716 usleep(diff - frame_interval);
719 if (pl_rearmed_cbs.frameskip) {
/* more than one frame behind: advise skipping */
720 if (diff < -frame_interval)
721 pl_rearmed_cbs.fskip_advice = 1;
723 pl_rearmed_cbs.fskip_advice = 0;
725 // recompilation is not that fast and may cause frame skip on
726 // loading screens and such, resulting in flicker or glitches
727 if (new_dynarec_did_compile) {
728 if (drc_active_vsyncs < 32)
729 pl_rearmed_cbs.fskip_advice = 0;
733 drc_active_vsyncs = 0;
734 new_dynarec_did_compile = 0;
737 pcnt_start(PCNT_ALL);
/* Resets the timing-related callback fields and selects frame timing for
 * PAL or NTSC. The assignment of is_pal from is_pal_ is on a line not
 * visible here. */
740 void pl_timing_prepare(int is_pal_)
742 pl_rearmed_cbs.fskip_advice = 0;
743 pl_rearmed_cbs.flips_per_sec = 0;
744 pl_rearmed_cbs.cpu_usage = 0;
/* frame period in usec, and in usec*1024 units (used by pl_frame_limit) */
747 frame_interval = is_pal ? 20000 : 16667;
748 frame_interval1024 = is_pal ? 20000*1024 : 17066667;
750 // used by P.E.Op.S. frameskip code
751 pl_rearmed_cbs.gpu_peops.fFrameRateHz = is_pal ? 50.0f : 59.94f;
752 pl_rearmed_cbs.gpu_peops.dwFrameRateTicks =
753 (100000*100 / (unsigned long)(pl_rearmed_cbs.gpu_peops.fFrameRateHz*100));
756 static void pl_get_layer_pos(int *x, int *y, int *w, int *h)
/* forward declarations; both functions are defined further down */
764 static void *pl_mmap(unsigned int size);
765 static void pl_munmap(void *ptr, unsigned int size);
/* Callback/state structure instance; only the pl_set_gpu_caps initializer
 * is visible in this excerpt. */
767 struct rearmed_cbs pl_rearmed_cbs = {
776 .pl_set_gpu_caps = pl_set_gpu_caps,
/* Watchdog thread body: tracks whether vsync_cnt keeps changing and, per
 * the messages below, reports and aborts on a detected lockup. The loop,
 * timing and seen_dead bookkeeping are on lines not visible here. */
780 static void *watchdog_thread(void *unused)
782 int vsync_cnt_old = 0;
786 #if !defined(NDEBUG) || defined(DRC_DBG)
787 // don't interfere with debug
/* vsync counter moved since the last check: remember the new value */
799 if (vsync_cnt != vsync_cnt_old) {
800 vsync_cnt_old = vsync_cnt;
809 fprintf(stderr, "watchdog: seen_dead %d\n", seen_dead);
811 fprintf(stderr, "watchdog: lockup detected, aborting\n");
812 // we can't do any cleanup here really, the main thread is
813 // likely touching resources and would crash anyway
/* Starts watchdog_thread() as a detached pthread and logs to stderr when
 * thread creation fails. */
819 void pl_start_watchdog(void)
825 pthread_attr_init(&attr);
826 pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
828 ret = pthread_create(&tid, &attr, watchdog_thread, NULL);
830 fprintf(stderr, "could not start watchdog: %d\n", ret);
/* Memory-map hook installed as psxMapHook: forwards to plat_mmap() with
 * the third argument fixed to 0. The remaining parameter(s) of the
 * signature are on a line not visible here. */
833 static void *pl_emu_mmap(unsigned long addr, size_t size, int is_fixed,
836 return plat_mmap(addr, size, 0, is_fixed);
/* Unmap hook installed as psxUnmapHook: forwards to plat_munmap(); the tag
 * is not used in the visible line. */
839 static void pl_emu_munmap(void *ptr, size_t size, enum psxMapTag tag)
841 plat_munmap(ptr, size);
/* Maps `size` bytes through psxMapHook with address 0, is_fixed 0 and the
 * MAP_TAG_VRAM tag. */
844 static void *pl_mmap(unsigned int size)
846 return psxMapHook(0, size, 0, MAP_TAG_VRAM);
/* Releases a mapping through psxUnmapHook using the MAP_TAG_VRAM tag. */
849 static void pl_munmap(void *ptr, unsigned int size)
851 psxUnmapHook(ptr, size, MAP_TAG_VRAM);
856 extern unsigned int hSyncCount; // from psxcounters
857 extern unsigned int frame_counter;
859 psx_w = psx_h = pl_vout_w = pl_vout_h = 256;
860 psx_bpp = pl_vout_bpp = 16;
862 tsdev = pl_gun_ts_init();
864 pl_rearmed_cbs.gpu_hcnt = &hSyncCount;
865 pl_rearmed_cbs.gpu_frame_count = &frame_counter;
867 psxMapHook = pl_emu_mmap;
868 psxUnmapHook = pl_emu_munmap;