4 * This work is licensed under the terms of the GNU GPLv2 or later.
5 * See the COPYING file in the top-level directory.
14 #include <sys/types.h>
21 #include "libpicofe/fonts.h"
22 #include "libpicofe/input.h"
23 #include "libpicofe/plat.h"
24 #include "libpicofe/arm/neon_scale2x.h"
25 #include "libpicofe/arm/neon_eagle2x.h"
26 #include "plugin_lib.h"
31 #include "pl_gun_ts.h"
33 #include "psemu_plugin_defs.h"
34 #include "../libpcsxcore/new_dynarec/new_dynarec.h"
35 #include "../libpcsxcore/psxmem_map.h"
36 #include "../libpcsxcore/gpu.h"
/* Analog stick positions as [slot][axis]; every axis starts at 127.
 * NOTE(review): 127 is presumably the centred value and the first index
 * the pad number -- confirm against the pad code. */
43 int in_analog_left[8][2] = {{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 }};
44 int in_analog_right[8][2] = {{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 },{ 127, 127 }};
/* Per stick (0 = left, 1 = right in update_analogs()): input device id,
 * initially -1, and the two axis numbers passed to in_update_analog(). */
45 int in_adev[2] = { -1, -1 }, in_adev_axis[2][2] = {{ 0, 1 }, { 0, 1 }};
/* Per stick: non-zero routes readings through update_analog_nub_adjust(). */
46 int in_adev_is_nublike[2];
/* Button bitmasks; update_input() stores the PLAYER12 bindings in slot 0. */
47 unsigned short in_keystate[8];
50 int in_enable_vibration;
/* Scaler target rectangle, recomputed by update_layer_size(). */
53 int g_layer_x, g_layer_y, g_layer_w, g_layer_h;
54 static int pl_vout_w, pl_vout_h, pl_vout_bpp; /* output display/layer */
/* Integer scale factors applied to the output size, and the number of
 * rows skipped at the top of the output buffer (see pl_vout_set_mode()). */
55 static int pl_vout_scale_w, pl_vout_scale_h, pl_vout_yoffset;
/* Consulted by the dispmode_* switchers before enabling a 2x mode. */
56 static int psx_w, psx_h, psx_bpp;
/* Timing set by pl_timing_prepare(): frame_interval is in microseconds,
 * frame_interval1024 is the same period in usec*1024 units. */
58 static int is_pal, frame_interval, frame_interval1024;
/* Microsecond phase within a frame sampled by pl_vout_open(); used by
 * pl_frame_limit() when it re-aligns its schedule. */
59 static int vsync_usec_time;
/* Platform-supplied hooks. hud_print() and pl_vout_set_mode() test the
 * ones they use for NULL, so they may be left unset. */
62 void (*pl_plat_clear)(void);
63 void (*pl_plat_blit)(int doffs, const void *src, int w, int h,
64 int sstride, int bgr24);
65 void (*pl_plat_hud_print)(int x, int y, const char *str, int bpp);
/*
 * Reads /proc/self/stat and computes how much the 14th field (utime in
 * proc(5)) has grown since the previous call.
 * NOTE(review): presumably that delta is the return value -- confirm.
 * NOTE(review): the results of open()/read()/sscanf() are not checked in
 * the statements shown here; confirm how failures are handled.
 */
68 static __attribute__((noinline)) int get_cpu_ticks(void)
// utime seen by the previous call
70 static unsigned long last_utime;
72 unsigned long utime, ret;
76 fd = open("/proc/self/stat", O_RDONLY);
// rewind so the read below starts at the beginning of the file
77 lseek(fd, 0, SEEK_SET);
79 read(fd, buf, sizeof(buf));
// guarantee NUL termination before parsing
80 buf[sizeof(buf) - 1] = 0;
// skip the first 13 fields, store the 14th
82 sscanf(buf, "%*d %*s %*c %*d %*d %*d %*d %*d %*u %*u %*u %*u %*u %lu", &utime);
83 ret = utime - last_utime;
/*
 * Draws 'text' at (x, y). The platform hook is preferred when set;
 * otherwise, for a 16bpp output, basic_text_out16_nf() draws into 'fb'
 * ('w' is passed to it as the buffer width).
 */
90 static void hud_print(void *fb, int w, int x, int y, const char *text)
92 if (pl_plat_hud_print)
93 pl_plat_hud_print(x, y, text, pl_vout_bpp);
94 else if (pl_vout_bpp == 16)
95 basic_text_out16_nf(fb, w, x, y, text);
/*
 * printf-style front end for hud_print(): formats 'texto' and its
 * arguments into a local buffer (bounded by vsnprintf), then draws it.
 */
98 static void hud_printf(void *fb, int w, int x, int y, const char *texto, ...)
103 va_start(args, texto);
104 vsnprintf(buffer, sizeof(buffer), texto, args);
107 hud_print(fb, w, x, y, buffer);
/* Draws hud_msg on the HUD row (HUD_HEIGHT above 'h'), 2 pixels right of 'border'. */
110 static void print_msg(int h, int border)
112 hud_print(pl_vout_buf, pl_vout_w, border + 2, h - HUD_HEIGHT, hud_msg);
/*
 * Draws the flip rate and the current vsync rate (both maintained by
 * pl_frame_limit()) on the HUD row, 2 pixels right of 'border'.
 */
115 static void print_fps(int h, int border)
117 hud_printf(pl_vout_buf, pl_vout_w, border + 2, h - HUD_HEIGHT,
118 "%2d %4.1f", pl_rearmed_cbs.flips_per_sec,
119 pl_rearmed_cbs.vsps_cur);
/* Draws pl_rearmed_cbs.cpu_usage on the HUD row, starting 28 pixels left of 'x'. */
122 static void print_cpu_usage(int x, int h)
124 hud_printf(pl_vout_buf, pl_vout_w, x - 28,
125 h - HUD_HEIGHT, "%3d", pl_rearmed_cbs.cpu_usage);
128 // draw 192x8 status of 24 sound channels
// One 8x8 cell per channel (24 * 8 = 192 pixels wide), placed on the HUD
// row and centred horizontally. Only drawn into a 16bpp output buffer.
129 static __attribute__((noinline)) void draw_active_chans(int vout_w, int vout_h)
131 extern void spu_get_debug_info(int *chans_out, int *run_chans,
132 int *fmod_chans_out, int *noise_chans_out); // hack
// per-channel bitmasks, bit c describes channel c
133 int live_chans, run_chans, fmod_chans, noise_chans;
135 static const unsigned short colors[2] = { 0x1fe3, 0x0700 };
// NOTE(review): dest is derived from pl_vout_buf before the NULL check below
136 unsigned short *dest = (unsigned short *)pl_vout_buf +
137 pl_vout_w * (vout_h - HUD_HEIGHT) + pl_vout_w / 2 - 192/2;
138 unsigned short *d, p;
// nothing to draw into, or not a 16bpp target
141 if (pl_vout_buf == NULL || pl_vout_bpp != 16)
144 spu_get_debug_info(&live_chans, &run_chans, &fmod_chans, &noise_chans);
146 for (c = 0; c < 24; c++) {
// colour priority: not live (0x01c0 if still in run_chans, else black),
// then fmod (0xf000), then noise (0x001f)
148 p = !(live_chans & (1<<c)) ? (run_chans & (1<<c) ? 0x01c0 : 0) :
149 (fmod_chans & (1<<c)) ? 0xf000 :
150 (noise_chans & (1<<c)) ? 0x001f :
// 8 rows of 8 pixels; d advances one output line per row
152 for (y = 0; y < 8; y++, d += pl_vout_w)
153 for (x = 0; x < 8; x++)
/*
 * Draws the HUD elements selected by g_opts for a picture that starts at
 * column 'x' and is 'w' x 'h' output pixels: the sound channel display
 * (OPT_SHOWSPU), an FPS readout (OPT_SHOWFPS) and, at the right edge
 * x + w, the CPU usage (OPT_SHOWCPU).
 */
158 static void print_hud(int x, int w, int h)
166 if (g_opts & OPT_SHOWSPU)
167 draw_active_chans(w, h);
171 else if (g_opts & OPT_SHOWFPS)
174 if (g_opts & OPT_SHOWCPU)
175 print_cpu_usage(x + w, h);
178 /* update scaler target size according to user settings */
/*
 * Derives g_layer_w/g_layer_h from the source size (w, h) and the menu
 * screen size, then centres the layer and clamps it to the screen.
 */
179 static void update_layer_size(int w, int h)
186 g_layer_w = w; g_layer_h = h;
190 g_layer_w = w; g_layer_h = h;
// room for doubling in each direction?
191 if (w * 2 <= g_menuscreen_w)
193 if (h * 2 <= g_menuscreen_h)
198 if (h > g_menuscreen_h || (240 < h && h <= 360))
201 // 4:3 that prefers integer scaling
// largest whole multiple of h that fits the screen height
202 imult = g_menuscreen_h / h;
203 g_layer_w = w * imult;
204 g_layer_h = h * imult;
// if the resulting aspect ratio is outside 1.25..1.666, force the width to 4:3
205 mult = (float)g_layer_w / (float)g_layer_h;
206 if (mult < 1.25f || mult > 1.666f)
207 g_layer_w = 4.0f/3.0f * (float)g_layer_h;
208 printf(" -> %dx%d %.1f\n", g_layer_w, g_layer_h, mult);
// width-to-height factor for a full-height layer: 4:3 scaled by 240/h
213 mult = 240.0f / (float)h * 4.0f / 3.0f;
216 g_layer_w = mult * (float)g_menuscreen_h;
217 g_layer_h = g_menuscreen_h;
218 printf(" -> %dx%d %.1f\n", g_layer_w, g_layer_h, mult);
221 case SCALE_FULLSCREEN:
222 g_layer_w = g_menuscreen_w;
223 g_layer_h = g_menuscreen_h;
// centre on the menu screen, then keep position and size within it
230 g_layer_x = g_menuscreen_w / 2 - g_layer_w / 2;
231 g_layer_y = g_menuscreen_h / 2 - g_layer_h / 2;
232 if (g_layer_x < 0) g_layer_x = 0;
233 if (g_layer_y < 0) g_layer_y = 0;
234 if (g_layer_w > g_menuscreen_w) g_layer_w = g_menuscreen_w;
235 if (g_layer_h > g_menuscreen_h) g_layer_h = g_menuscreen_h;
238 // XXX: this is platform specific really
// Returns non-zero when a w x h mode is within the 1024x512 limit.
239 static inline int resolution_ok(int w, int h)
241 return w <= 1024 && h <= 512;
/*
 * Selects the output mode for a w x h source at 'bpp': picks the scale
 * factors, updates the scaler layer, asks the platform for a matching
 * buffer and publishes the result in the pl_vout_* variables.
 * NOTE(review): raw_w/raw_h are not used by the statements shown here.
 */
244 static void pl_vout_set_mode(int w, int h, int raw_w, int raw_h, int bpp)
246 int vout_w, vout_h, vout_bpp;
249 // special h handling, Wipeout likes to change it by 1-6
250 static int vsync_cnt_ms_prev;
// true when fewer than 5*60 vsyncs have passed since the recorded count;
// the unsigned subtraction keeps the test valid across counter wrap
251 if ((unsigned int)(vsync_cnt - vsync_cnt_ms_prev) < 5*60)
253 vsync_cnt_ms_prev = vsync_cnt;
261 if (pl_rearmed_cbs.only_16bpp)
264 assert(vout_h >= 192);
// default: no software upscaling
266 pl_vout_scale_w = pl_vout_scale_h = 1;
// a 2x software filter needs a 16bpp source and a doubled size the platform accepts
269 if (resolution_ok(w * 2, h * 2) && bpp == 16) {
274 // filter unavailable
278 else if (scanlines != 0 && scanline_level != 100 && bpp == 16) {
283 vout_w *= pl_vout_scale_w;
284 vout_h *= pl_vout_scale_h;
286 update_layer_size(vout_w, vout_h);
// the platform receives the mode by pointer
// NOTE(review): presumably it may adjust the values -- confirm
288 pl_vout_buf = plat_gvideo_set_mode(&vout_w, &vout_h, &vout_bpp);
// a NULL buffer is only reported as a failure when there is no blit hook either
289 if (pl_vout_buf == NULL && pl_plat_blit == NULL)
290 fprintf(stderr, "failed to set mode %dx%d@%d\n",
291 vout_w, vout_h, vout_bpp);
295 pl_vout_bpp = vout_bpp;
296 pl_vout_yoffset = buf_yoffset;
// skip pl_vout_yoffset rows at the top of the buffer
298 if (pl_vout_buf != NULL)
299 pl_vout_buf = (char *)pl_vout_buf
300 + pl_vout_yoffset * pl_vout_w * pl_vout_bpp / 8;
302 menu_notify_mode_change(pl_vout_w, pl_vout_h, pl_vout_bpp);
/* Number of upcoming flips for which pl_vout_flip() clears the output buffer first. */
305 static int flip_clear_counter;
/* Requests that the output buffer be cleared on the next two flips. */
307 void pl_force_clear(void)
309 flip_clear_counter = 2;
/*
 * Copies one frame from 'vram' into the output buffer, converting or
 * filtering it on the way, draws the HUD and flips buffers.
 * 'stride' is the source line pitch in 16-bit units (src is an unsigned
 * short pointer), 'bgr24' selects the 24-bit source path, and x/y/w/h
 * place the picture inside the output.
 * NOTE(review): dims_changed is presumably what re-arms
 * flip_clear_counter below -- confirm.
 */
312 static void pl_vout_flip(const void *vram, int stride, int bgr24,
313 int x, int y, int w, int h, int dims_changed)
315 unsigned char *dest = pl_vout_buf;
316 const unsigned short *src = vram;
// dstride is the output line pitch in pixels
317 int dstride = pl_vout_w, h1 = h;
318 int h_full = pl_vout_h - pl_vout_yoffset;
319 int xoffs = 0, doffs;
321 pcnt_start(PCNT_BLIT);
// wipe the whole visible part of the output buffer
328 memset(pl_vout_buf, 0,
329 dstride * h_full * pl_vout_bpp / 8);
333 assert(x + w <= pl_vout_w);
334 assert(y + h <= pl_vout_h);
// destination offset of the picture's top-left corner, in pixels
337 xoffs = x * pl_vout_scale_w;
338 doffs = xoffs + y * dstride;
341 flip_clear_counter = 2;
343 if (flip_clear_counter > 0) {
347 memset(pl_vout_buf, 0,
348 dstride * h_full * pl_vout_bpp / 8);
349 flip_clear_counter--;
// platform-provided blit replaces the software paths
354 pl_plat_blit(doffs, src, w, h, stride, bgr24);
// 24-bit source going to a 16bpp output
365 if (pl_rearmed_cbs.only_16bpp) {
366 for (; h1-- > 0; dest += dstride * 2, src += stride)
368 bgr888_to_rgb565(dest, src, w * 3);
// round the pixel offset down to a multiple of 8 pixels (24 bytes at 3 bytes/pixel)
373 dest += (doffs / 8) * 24;
375 for (; h1-- > 0; dest += dstride * 3, src += stride)
377 bgr888_to_rgb888(dest, src, w * 3);
// 2x software filters; pitches are passed in bytes
382 else if (soft_filter == SOFT_FILTER_SCALE2X && pl_vout_scale_w == 2)
384 neon_scale2x_16_16(src, (void *)dest, w,
385 stride * 2, dstride * 2, h);
387 else if (soft_filter == SOFT_FILTER_EAGLE2X && pl_vout_scale_w == 2)
389 neon_eagle2x_16_16(src, (void *)dest, w,
390 stride * 2, dstride * 2, h);
392 else if (scanlines != 0 && scanline_level != 100)
// percentage rescaled to 0..2048 for bgr555_to_rgb565_b()
394 int l = scanline_level * 2048 / 100;
// with 2x vertical scaling both rows of a pair come from the same source line
395 int stride_0 = pl_vout_scale_h >= 2 ? 0 : stride;
397 h1 *= pl_vout_scale_h;
// output rows in pairs: a plain row, then a row converted with level l
398 for (; h1 >= 2; h1 -= 2)
400 bgr555_to_rgb565(dest, src, w * 2);
401 dest += dstride * 2, src += stride_0;
403 bgr555_to_rgb565_b(dest, src, w * 2, l);
404 dest += dstride * 2, src += stride;
// plain 15-bit to 16-bit conversion, one line at a time
410 for (; h1-- > 0; dest += dstride * 2, src += stride)
412 bgr555_to_rgb565(dest, src, w * 2);
417 print_hud(xoffs, w * pl_vout_scale_w, (y + h) * pl_vout_scale_h);
// the platform hands back the next buffer to draw into; re-apply the row offset
423 pl_vout_buf = plat_gvideo_flip();
424 if (pl_vout_buf != NULL)
425 pl_vout_buf = (char *)pl_vout_buf
426 + pl_vout_yoffset * pl_vout_w * pl_vout_bpp / 8;
// counted per second by pl_frame_limit()
428 pl_rearmed_cbs.flip_cnt++;
/*
 * Opens the platform video output for the current PAL/NTSC setting and
 * samples the current microsecond phase for pl_frame_limit().
 */
431 static int pl_vout_open(void)
435 // force mode update on pl_vout_set_mode() call from gpulib/vout_pl
438 plat_gvideo_open(is_pal);
440 gettimeofday(&now, 0);
// reduce tv_usec to a value below frame_interval by repeated subtraction
441 vsync_usec_time = now.tv_usec;
442 while (vsync_usec_time >= frame_interval)
443 vsync_usec_time -= frame_interval;
/* NOTE(review): presumably the counterpart of pl_vout_open() that releases the platform video output -- confirm. */
448 static void pl_vout_close(void)
/* Stores the GPU capability flags; the dispmode code tests them (GPU_CAP_*). */
453 static void pl_set_gpu_caps(int caps)
455 pl_rearmed_cbs.gpu_caps = caps;
/*
 * Asks the platform layer for screenshot data; w, h and bpp are passed
 * straight through to plat_prepare_screenshot().
 * NOTE(review): presumably they are output parameters and a fallback
 * exists when the platform returns NULL -- confirm.
 */
458 void *pl_prepare_screenshot(int *w, int *h, int *bpp)
460 void *ret = plat_prepare_screenshot(w, h, bpp);
471 /* display/rendering mode switcher */
/* Switcher: turns off the enhancement and the software filter and announces "default mode". */
472 static int dispmode_default(void)
474 pl_rearmed_cbs.gpu_neon.enhancement_enable = 0;
475 soft_filter = SOFT_FILTER_NONE;
476 snprintf(hud_msg, sizeof(hud_msg), "default mode");
480 #ifdef BUILTIN_GPU_NEON
/*
 * Switcher: enables the GPU's 2x enhancement. Requires GPU_CAP_SUPPORTS_2X,
 * a doubled size that passes resolution_ok() and a 16bpp PSX mode.
 */
481 static int dispmode_doubleres(void)
483 if (!(pl_rearmed_cbs.gpu_caps & GPU_CAP_SUPPORTS_2X)
484 || !resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
488 pl_rearmed_cbs.gpu_neon.enhancement_enable = 1;
489 snprintf(hud_msg, sizeof(hud_msg), "double resolution");
/* Switcher: selects the scale2x software filter; needs a 16bpp mode whose doubled size passes resolution_ok(). */
495 static int dispmode_scale2x(void)
497 if (!resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
501 soft_filter = SOFT_FILTER_SCALE2X;
502 snprintf(hud_msg, sizeof(hud_msg), "scale2x");
/* Switcher: selects the eagle2x software filter; same preconditions as dispmode_scale2x(). */
506 static int dispmode_eagle2x(void)
508 if (!resolution_ok(psx_w * 2, psx_h * 2) || psx_bpp != 16)
512 soft_filter = SOFT_FILTER_EAGLE2X;
513 snprintf(hud_msg, sizeof(hud_msg), "eagle2x");
/* Table of mode switchers that pl_switch_dispmode() indexes with dispmode_current; some entries depend on BUILTIN_GPU_NEON. */
518 static int (*dispmode_switchers[])(void) = {
520 #ifdef BUILTIN_GPU_NEON
/* Index into dispmode_switchers of the mode being tried or in use. */
529 static int dispmode_current;
/*
 * Selects a display mode from dispmode_switchers, wrapping the index
 * back to 0 past the end of the table.
 * NOTE(review): presumably the index is advanced and failed switchers
 * are skipped -- confirm.
 */
531 void pl_switch_dispmode(void)
// special case: the GPU plugin owns the display
533 if (pl_rearmed_cbs.gpu_caps & GPU_CAP_OWNS_DISPLAY)
538 if (dispmode_current >=
539 sizeof(dispmode_switchers) / sizeof(dispmode_switchers[0]))
540 dispmode_current = 0;
541 if (dispmode_switchers[dispmode_current]())
547 /* adjust circle-like analog inputs to better match
548 * more square-like analogs in PSX */
/*
 * Each axis is boosted by a factor looked up from the other axis'
 * magnitude in 16-unit steps.
 * NOTE(review): x and y are presumably absolute values in 0..128, which
 * keeps the 9-entry table index in range -- confirm.
 */
549 static void update_analog_nub_adjust(int *x_, int *y_)
552 static const int scale[] =
553 { 0 - d*2, 0 - d*2, 0 - d*2, 12 - d*2,
554 30 - d*2, 60 - d*2, 75 - d*2, 60 - d*2, 60 - d*2 };
// the factor for one axis is chosen by the other axis
557 int scale_x = scale[y / 16];
558 int scale_y = scale[x / 16];
// scale factors are in 1/256 units
561 x += d + (x * scale_x >> 8);
566 y += d + (y * scale_y >> 8);
/*
 * Polls both configured analog sticks, rescales each axis reading by
 * 128 / IN_ABS_RANGE, applies the nub correction where enabled and
 * writes the clamped result to slot 0 of in_analog_left/right.
 */
576 static void update_analogs(void)
// destinations: index 0 is the left stick, index 1 the right stick
578 int *nubp[2] = { in_analog_left[0], in_analog_right[0] };
582 for (i = 0; i < 2; i++)
587 for (a = 0; a < 2; a++) {
590 ret = in_update_analog(in_adev[i], in_adev_axis[i][a], &v);
592 vals[a] = 128 * v / IN_ABS_RANGE;
595 if (in_adev_is_nublike[i])
596 update_analog_nub_adjust(&vals[0], &vals[1]);
598 for (a = 0; a < 2; a++) {
// upper clamp
601 else if (v > 255) v = 255;
/*
 * Collects the current input actions: refreshes the analog sticks when
 * pad 0 is an analog type, splits off the gun bits, dispatches an
 * emulator action and stores the pad button state.
 */
608 static void update_input(void)
610 int actions[IN_BINDTYPE_COUNT] = { 0, };
611 unsigned int emu_act;
614 if (in_type[0] == PSE_PAD_TYPE_ANALOGJOY || in_type[0] == PSE_PAD_TYPE_ANALOGPAD)
616 emu_act = actions[IN_BINDTYPE_EMU];
// gun bits are extracted into in_state_gun and removed from emu_act
617 in_state_gun = (emu_act & SACTION_GUN_MASK) >> SACTION_GUN_TRIGGER;
619 emu_act &= ~SACTION_GUN_MASK;
// shift right until bit 0 is set, counting the shifts in 'which'
// NOTE(review): this never terminates for emu_act == 0; presumably guarded -- confirm
622 for (; !(emu_act & 1); emu_act >>= 1, which++)
626 emu_set_action(emu_act);
628 in_keystate[0] = actions[IN_BINDTYPE_PLAYER12];
631 //if (in_type[0] == PSE_PAD_TYPE_GUNCON && tsdev)
632 // pl_gun_ts_update(tsdev, xn, yn, in);
633 // in_analog_left[0][0] = xn
/* NOTE(review): an extern declaration of update_input(), while a static definition also appears in this file; presumably the two sit in alternative preprocessor branches -- confirm. */
636 extern void update_input(void);
/* NOTE(review): presumably receives the second byte of a gun/pad exchange on 'port' -- confirm against the body. */
639 void pl_gun_byte2(int port, unsigned char byte)
/* pl_frame_limit() resets its schedule once it is more than this many frames early or late. */
643 #define MAX_LAG_FRAMES 3
/* Difference tv - tv_old in microseconds. The arguments are not parenthesised, so pass plain struct timeval names only. */
645 #define tvdiff(tv, tv_old) \
646 ((tv.tv_sec - tv_old.tv_sec) * 1000000 + tv.tv_usec - tv_old.tv_usec)
648 /* called on every vsync */
/*
 * Per-vsync housekeeping: refreshes the once-per-second statistics,
 * advances the expected frame time, sleeps when the emulator is ahead of
 * schedule and sets the frame-skip advice when it is behind.
 */
649 void pl_frame_limit(void)
651 static struct timeval tv_old, tv_expect;
652 static int vsync_cnt_prev, drc_active_vsyncs;
661 /* doing input here because the pad is polled
662 * thousands of times per frame for some reason */
666 gettimeofday(&now, 0);
// entered when the wall-clock second has changed
668 if (now.tv_sec != tv_old.tv_sec) {
669 diff = tvdiff(now, tv_old);
// vsyncs per second over the elapsed interval; left at 0 unless the
// interval is positive and shorter than 2 seconds
670 pl_rearmed_cbs.vsps_cur = 0.0f;
671 if (0 < diff && diff < 2000000)
672 pl_rearmed_cbs.vsps_cur = 1000000.0f * (vsync_cnt - vsync_cnt_prev) / diff;
673 vsync_cnt_prev = vsync_cnt;
// the flip counter is latched only when the FPS display is on, but always reset
675 if (g_opts & OPT_SHOWFPS)
676 pl_rearmed_cbs.flips_per_sec = pl_rearmed_cbs.flip_cnt;
677 pl_rearmed_cbs.flip_cnt = 0;
678 if (g_opts & OPT_SHOWCPU)
679 pl_rearmed_cbs.cpu_usage = get_cpu_ticks();
// NOTE(review): hud_new_msg presumably counts down the time a message stays up -- confirm
681 if (hud_new_msg > 0) {
683 if (hud_new_msg == 0)
687 //new_dynarec_print_stats();
690 static int ya_vsync_count;
691 if (++ya_vsync_count == PCNT_FRAMES) {
692 pcnt_print(pl_rearmed_cbs.vsps_cur);
697 // tv_expect uses usec*1024 units instead of usecs for better accuracy
// advance the expected time by one frame, wrapping at one second
698 tv_expect.tv_usec += frame_interval1024;
699 if (tv_expect.tv_usec >= (1000000 << 10)) {
700 tv_expect.tv_usec -= (1000000 << 10);
// microseconds until the expected time; negative when running late
703 diff = (tv_expect.tv_sec - now.tv_sec) * 1000000 + (tv_expect.tv_usec >> 10) - now.tv_usec;
// too far off in either direction: restart the schedule
705 if (diff > MAX_LAG_FRAMES * frame_interval || diff < -MAX_LAG_FRAMES * frame_interval) {
706 //printf("pl_frame_limit reset, diff=%d, iv %d\n", diff, frame_interval);
709 // try to align with vsync
710 usadj = vsync_usec_time;
711 while (usadj < tv_expect.tv_usec - frame_interval)
712 usadj += frame_interval;
713 tv_expect.tv_usec = usadj << 10;
// more than one frame early and limiting enabled: sleep off the surplus
716 if (!(g_opts & OPT_NO_FRAMELIM) && diff > frame_interval) {
717 // yay for working usleep on pandora!
718 //printf("usleep %d\n", diff - frame_interval / 2);
719 usleep(diff - frame_interval);
722 if (pl_rearmed_cbs.frameskip) {
// more than one frame late: advise the GPU plugin to skip
// NOTE(review): the reset to 0 below is presumably the else branch -- confirm
723 if (diff < -frame_interval)
724 pl_rearmed_cbs.fskip_advice = 1;
726 pl_rearmed_cbs.fskip_advice = 0;
728 // recompilation is not that fast and may cause frame skip on
729 // loading screens and such, resulting in flicker or glitches
730 if (new_dynarec_did_compile) {
731 if (drc_active_vsyncs < 32)
732 pl_rearmed_cbs.fskip_advice = 0;
736 drc_active_vsyncs = 0;
737 new_dynarec_did_compile = 0;
740 pcnt_start(PCNT_ALL);
/*
 * Resets the per-second statistics and derives the frame timing from the
 * video standard: 20000 us per frame for PAL, 16667 us otherwise.
 */
743 void pl_timing_prepare(int is_pal_)
745 pl_rearmed_cbs.fskip_advice = 0;
746 pl_rearmed_cbs.flips_per_sec = 0;
747 pl_rearmed_cbs.cpu_usage = 0;
750 frame_interval = is_pal ? 20000 : 16667;
// same period in usec*1024 units; 17066667 is 1000000/60 * 1024 rounded
751 frame_interval1024 = is_pal ? 20000*1024 : 17066667;
753 // used by P.E.Op.S. frameskip code
// NOTE(review): the non-PAL rate here is 59.94 Hz while frame_interval
// above corresponds to 60 Hz -- confirm this is intended
754 pl_rearmed_cbs.gpu_peops.fFrameRateHz = is_pal ? 50.0f : 59.94f;
// works out to 100000 / rate
755 pl_rearmed_cbs.gpu_peops.dwFrameRateTicks =
756 (100000*100 / (unsigned long)(pl_rearmed_cbs.gpu_peops.fFrameRateHz*100));
/* NOTE(review): presumably reports the scaler layer rectangle (g_layer_x/y/w/h) through the four pointers -- confirm against the body. */
759 static void pl_get_layer_pos(int *x, int *y, int *w, int *h)
/* Forward declarations for the VRAM mapping helpers defined later in this file. */
767 static void *pl_mmap(unsigned int size);
768 static void pl_munmap(void *ptr, unsigned int size);
/* Callback and state block shared with the GPU plugin; statically wired to this file's handlers. */
770 struct rearmed_cbs pl_rearmed_cbs = {
779 .pl_set_gpu_caps = pl_set_gpu_caps,
780 .gpu_state_change = gpu_state_change,
/*
 * Watchdog thread body: watches vsync_cnt for progress and reports a
 * lockup on stderr when it stops advancing.
 * NOTE(review): polling interval, the seen_dead threshold and the abort
 * call are not among the statements shown here -- confirm.
 */
784 static void *watchdog_thread(void *unused)
786 int vsync_cnt_old = 0;
790 #if !defined(NDEBUG) || defined(DRC_DBG)
791 // don't interfere with debug
// the emulator made progress since the last check
803 if (vsync_cnt != vsync_cnt_old) {
804 vsync_cnt_old = vsync_cnt;
813 fprintf(stderr, "watchdog: seen_dead %d\n", seen_dead);
815 fprintf(stderr, "watchdog: lockup detected, aborting\n");
816 // we can't do any cleanup here really, the main thread is
817 // likely touching resources and would crash anyway
/* Starts watchdog_thread() as a detached thread; a pthread_create() failure is reported on stderr. */
823 void pl_start_watchdog(void)
829 pthread_attr_init(&attr);
// detached: the thread is never joined
830 pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED);
832 ret = pthread_create(&tid, &attr, watchdog_thread, NULL);
834 fprintf(stderr, "could not start watchdog: %d\n", ret);
/* Emulator mapping hook (installed as psxMapHook): forwards to plat_mmap() with 0 as the third argument. */
837 static void *pl_emu_mmap(unsigned long addr, size_t size, int is_fixed,
840 return plat_mmap(addr, size, 0, is_fixed);
/* Emulator unmapping hook (installed as psxUnmapHook): forwards to plat_munmap(); 'tag' is not used by the call. */
843 static void pl_emu_munmap(void *ptr, size_t size, enum psxMapTag tag)
845 plat_munmap(ptr, size);
/* Maps 'size' bytes through psxMapHook, tagged MAP_TAG_VRAM, with no address hint and is_fixed = 0. */
848 static void *pl_mmap(unsigned int size)
850 return psxMapHook(0, size, 0, MAP_TAG_VRAM);
/* Releases a pl_mmap() mapping through psxUnmapHook with the same MAP_TAG_VRAM tag. */
853 static void pl_munmap(void *ptr, unsigned int size)
855 psxUnmapHook(ptr, size, MAP_TAG_VRAM);
/* Start-up wiring: default 256x256 16bpp mode, touchscreen gun device, GPU counter pointers and the memory mapping hooks. */
860 extern unsigned int hSyncCount; // from psxcounters
861 extern unsigned int frame_counter;
// placeholder mode until the first real mode set
863 psx_w = psx_h = pl_vout_w = pl_vout_h = 256;
864 psx_bpp = pl_vout_bpp = 16;
866 tsdev = pl_gun_ts_init();
// give the GPU plugin direct access to the emulator's counters
868 pl_rearmed_cbs.gpu_hcnt = &hSyncCount;
869 pl_rearmed_cbs.gpu_frame_count = &frame_counter;
// route emulator memory mapping through the platform layer
871 psxMapHook = pl_emu_mmap;
872 psxUnmapHook = pl_emu_munmap;