gpu_unai: redo frameskip
[pcsx_rearmed.git] / plugins / gpu_unai / gpu.cpp
index abe7638..fefc277 100644 (file)
 #include "debug.h"
 
 int skipCount = 2; /* frame skip (0,1,2,3...) */
-int skCount=0; /* internal frame skip */
+int skCount = 0; /* internal frame skip */
 int linesInterlace = 0;  /* internal lines interlace */
 int linesInterlace_user = 0; /* Lines interlace */
 
-bool isSkip=false; /* skip frame (info coming from GPU) */
-bool skipFrame=false; /* skip frame (according to frame skip) */
+bool isSkip = false; /* skip frame (info coming from GPU) */
+bool wasSkip = false; /* previous isSkip: copied from isSkip in GPU_writeStatus right before isSkip is recomputed */
+bool skipFrame = false; /* skip frame (according to frame skip) */
 bool alt_fps = false; /* Alternative FPS algorithm */
 bool show_fps = false; /* Show FPS statistics */
 
-bool isPAL=false; /* PAL video timing */
+bool isPAL = false; /* PAL video timing */
 bool progressInterlace_flag = false; /* Progressive interlace flag */
 bool progressInterlace = false; /* Progressive interlace option*/
 bool frameLimit = false; /* frames to wait */
+
 bool light = true; /* lighting */
 bool blend = true; /* blending */
-
+bool FrameToRead = false; /* load image in progress */
+bool FrameToWrite = false; /* store image in progress */
 bool fb_dirty = false;
 
 bool enableAbbeyHack = false; /* Abe's Odyssey hack */
+
 u8 BLEND_MODE;
 u8 TEXT_MODE;
 u8 Masking;
@@ -60,9 +64,6 @@ s32           px,py;
 s32            x_end,y_end;
 u16*  pvram;
 
-u32 FrameToRead;
-u32 FrameToWrite;
-
 u32 GP0;
 s32 PacketCount;
 s32 PacketIndex;
@@ -184,9 +185,13 @@ long  GPU_freeze(unsigned int bWrite, GPUFreeze_t* p2)
        {
                p2->GPU_gp1 = GPU_GP1;
                memset(p2->Control, 0, sizeof(p2->Control));
-               p2->Control[5] = DisplayArea[0] | (DisplayArea[1] << 10);
-               p2->Control[7] = DisplayArea[4] | (DisplayArea[5] << 10);
-               p2->Control[8] = ((GPU_GP1 >> 17) & 0x3f) | ((GPU_GP1 >> 10) & 0x40);
+               // save resolution and registers for P.E.Op.S. compatibility
+               p2->Control[3] = (3 << 24) | ((GPU_GP1 >> 23) & 1);
+               p2->Control[4] = (4 << 24) | ((GPU_GP1 >> 29) & 3);
+               p2->Control[5] = (5 << 24) | (DisplayArea[0] | (DisplayArea[1] << 10));
+               p2->Control[6] = (6 << 24) | (2560 << 12);
+               p2->Control[7] = (7 << 24) | (DisplayArea[4] | (DisplayArea[5] << 10));
+               p2->Control[8] = (8 << 24) | ((GPU_GP1 >> 17) & 0x3f) | ((GPU_GP1 >> 10) & 0x40);
                memcpy(p2->FrameBuffer, (u16*)GPU_FrameBuffer, FRAME_BUFFER_SIZE);
                return (1);
        }
@@ -280,7 +285,7 @@ void  GPU_writeDataMem(u32* dmaAddress, s32 dmaCount)
                                        pvram += 1024;
                                        if (++py>=y_end) 
                                        {
-                                               FrameToWrite = 0;
+                                               FrameToWrite = false;
                                                GPU_GP1 &= ~0x08000000;
                                                break;
                                        }
@@ -293,7 +298,7 @@ void  GPU_writeDataMem(u32* dmaAddress, s32 dmaCount)
                                        pvram += 1024;
                                        if (++py>=y_end) 
                                        {
-                                               FrameToWrite = 0;
+                                               FrameToWrite = false;
                                                GPU_GP1 &= ~0x08000000;
                                                break;
                                        }
@@ -327,7 +332,7 @@ INLINE int CheckForEndlessLoop(u32 *laddr)
 }
 
 ///////////////////////////////////////////////////////////////////////////////
-void  GPU_dmaChain(u32* baseAddr, u32 dmaVAddr)
+long GPU_dmaChain(u32* baseAddr, u32 dmaVAddr)
 {
 #ifdef DEBUG_ANALYSIS
        dbg_anacnt_GPU_dmaChain++;
@@ -335,6 +340,7 @@ void  GPU_dmaChain(u32* baseAddr, u32 dmaVAddr)
        pcsx4all_prof_start_with_pause(PCSX4ALL_PROF_GPU,PCSX4ALL_PROF_HW_WRITE);
        u32 data, *address, count, offset;
        unsigned int DMACommandCounter = 0;
+       long dma_words = 0;
 
        GPU_GP1 &= ~0x14000000;
        lUsedAddr[0]=lUsedAddr[1]=lUsedAddr[2]=(u32*)0x1fffff;
@@ -351,9 +357,12 @@ void  GPU_dmaChain(u32* baseAddr, u32 dmaVAddr)
                else dmaVAddr = 0x1FFFFF;
 
                if(count>0) GPU_writeDataMem(address,count);
+               dma_words += 1 + count;
        }
        GPU_GP1 = (GPU_GP1 | 0x14000000) & ~0x60000000;
        pcsx4all_prof_end_with_resume(PCSX4ALL_PROF_GPU,PCSX4ALL_PROF_HW_WRITE);
+
+       return dma_words;
 }
 
 ///////////////////////////////////////////////////////////////////////////////
@@ -377,7 +386,7 @@ void  GPU_writeData(u32 data)
                        pvram += 1024;
                        if (++py>=y_end) 
                        {
-                               FrameToWrite = 0;
+                               FrameToWrite = false;
                                GPU_GP1 &= ~0x08000000;
                        }
                }
@@ -391,7 +400,7 @@ void  GPU_writeData(u32 data)
                                pvram += 1024;
                                if (++py>=y_end) 
                                {
-                                       FrameToWrite = 0;
+                                       FrameToWrite = false;
                                        GPU_GP1 &= ~0x08000000;
                                }
                        }
@@ -444,7 +453,7 @@ void  GPU_readDataMem(u32* dmaAddress, s32 dmaCount)
                        pvram += 1024;
                        if (++py>=y_end) 
                        {
-                               FrameToRead = 0;
+                               FrameToRead = false;
                                GPU_GP1 &= ~0x08000000;
                                break;
                        }
@@ -477,7 +486,7 @@ u32  GPU_readData(void)
                        pvram += 1024;
                        if (++py>=y_end) 
                        {
-                               FrameToRead = 0;
+                               FrameToRead = false;
                                GPU_GP1 &= ~0x08000000;
                        }
                }
@@ -489,7 +498,7 @@ u32  GPU_readData(void)
                        pvram +=1024;
                        if (++py>=y_end) 
                        {
-                               FrameToRead = 0;
+                               FrameToRead = false;
                                GPU_GP1 &= ~0x08000000;
                        }
                }
@@ -525,11 +534,11 @@ void  GPU_writeStatus(u32 data)
                break;
        case 0x01:
                GPU_GP1 &= ~0x08000000;
-               PacketCount = FrameToRead = FrameToWrite = 0;
+               PacketCount = 0; FrameToRead = FrameToWrite = false;
                break;
        case 0x02:
                GPU_GP1 &= ~0x08000000;
-               PacketCount = FrameToRead = FrameToWrite = 0;
+               PacketCount = 0; FrameToRead = FrameToWrite = false;
                break;
        case 0x03:
                GPU_GP1 = (GPU_GP1 & ~0x00800000) | ((data & 1) << 23);
@@ -543,6 +552,11 @@ void  GPU_writeStatus(u32 data)
                DisplayArea[0] = (data & 0x000003FF); //(short)(data & 0x3ff);
                DisplayArea[1] = ((data & 0x0007FC00)>>10); //(data & 0x000FFC00) >> 10; //(short)((data>>10)&0x1ff);
                fb_dirty = true;
+               wasSkip = isSkip;
+               if (isSkip)
+                       isSkip = false;
+               else
+                       isSkip = skipFrame;
                break;
        case 0x07:
                DisplayArea[4] = data & 0x000003FF; //(short)(data & 0x3ff);
@@ -630,15 +644,16 @@ INLINE void gpuVideoOutput(void)
        int incY = (h0==480) ? 2 : 1;
        h0=(h0==480 ? 2048 : 1024);
 
-       if (!progressInterlace)
        {
                const int li=linesInterlace;
+               bool pi=progressInterlace;
+               bool pif=progressInterlace_flag;
                switch ( w0 )
                {
                        case 256:
                                for(int y1=y0+h1; y0<y1; y0+=incY)
                                {
-                                       if( 0 == (y0&li) ) GPU_BlitWWDWW(       src_screen16,   dest_screen16, isRGB24);
+                                       if(( 0 == (y0&li) ) && ((!pi) || (pif=!pif))) GPU_BlitWWDWW(    src_screen16,   dest_screen16, isRGB24);
                                        dest_screen16 += VIDEO_WIDTH;
                                        src_screen16  += h0;
                                }
@@ -646,7 +661,7 @@ INLINE void gpuVideoOutput(void)
                        case 368:
                                for(int y1=y0+h1; y0<y1; y0+=incY)
                                {
-                                       if( 0 == (y0&li) ) GPU_BlitWWWWWWWWS(   src_screen16,   dest_screen16, isRGB24, 4);
+                                       if(( 0 == (y0&li) ) && ((!pi) || (pif=!pif))) GPU_BlitWWWWWWWWS(        src_screen16,   dest_screen16, isRGB24, 4);
                                        dest_screen16 += VIDEO_WIDTH;
                                        src_screen16  += h0;
                                }
@@ -654,7 +669,7 @@ INLINE void gpuVideoOutput(void)
                        case 320:
                                for(int y1=y0+h1; y0<y1; y0+=incY)
                                {
-                                       if( 0 == (y0&li) ) GPU_BlitWW(  src_screen16,   dest_screen16, isRGB24);
+                                       if(( 0 == (y0&li) ) && ((!pi) || (pif=!pif))) GPU_BlitWW(       src_screen16,   dest_screen16, isRGB24);
                                        dest_screen16 += VIDEO_WIDTH;
                                        src_screen16  += h0;
                                }
@@ -662,7 +677,7 @@ INLINE void gpuVideoOutput(void)
                        case 384:
                                for(int y1=y0+h1; y0<y1; y0+=incY)
                                {
-                                       if( 0 == (y0&li) ) GPU_BlitWWWWWS(      src_screen16,   dest_screen16, isRGB24);
+                                       if(( 0 == (y0&li) ) && ((!pi) || (pif=!pif))) GPU_BlitWWWWWS(   src_screen16,   dest_screen16, isRGB24);
                                        dest_screen16 += VIDEO_WIDTH;
                                        src_screen16  += h0;
                                }
@@ -670,7 +685,7 @@ INLINE void gpuVideoOutput(void)
                        case 512:
                                for(int y1=y0+h1; y0<y1; y0+=incY)
                                {
-                                       if( 0 == (y0&li) ) GPU_BlitWWSWWSWS(    src_screen16, dest_screen16, isRGB24);
+                                       if(( 0 == (y0&li) ) && ((!pi) || (pif=!pif))) GPU_BlitWWSWWSWS( src_screen16, dest_screen16, isRGB24);
                                        dest_screen16 += VIDEO_WIDTH;
                                        src_screen16  += h0;
                                }
@@ -678,69 +693,13 @@ INLINE void gpuVideoOutput(void)
                        case 640:
                                for(int y1=y0+h1; y0<y1; y0+=incY)
                                {
-                                       if( 0 == (y0&li) ) GPU_BlitWS(  src_screen16, dest_screen16, isRGB24);
+                                       if(( 0 == (y0&li) ) && ((!pi) || (pif=!pif))) GPU_BlitWS(       src_screen16, dest_screen16, isRGB24);
                                        dest_screen16 += VIDEO_WIDTH;
                                        src_screen16  += h0;
                                }
                                break;
                }
-       }
-       else
-       {
-               const int li=linesInterlace;
-               bool flag=progressInterlace_flag; /* progressive interlace */
-               switch ( w0 )
-               {
-                       case 256:
-                               for(int y1=y0+h1; y0<y1; y0+=incY)
-                               {
-                                       if(( 0 == (y0&li) ) && (flag=!flag)) GPU_BlitWWDWW(     src_screen16,   dest_screen16, isRGB24);
-                                       dest_screen16 += VIDEO_WIDTH;
-                                       src_screen16  += h0;
-                               }
-                               break;
-                       case 368:
-                               for(int y1=y0+h1; y0<y1; y0+=incY)
-                               {
-                                       if(( 0 == (y0&li) ) && (flag=!flag)) GPU_BlitWWWWWWWWS( src_screen16,   dest_screen16, isRGB24, 4);
-                                       dest_screen16 += VIDEO_WIDTH;
-                                       src_screen16  += h0;
-                               }
-                               break;
-                       case 320:
-                               for(int y1=y0+h1; y0<y1; y0+=incY)
-                               {
-                                       if(( 0 == (y0&li) ) && (flag=!flag)) GPU_BlitWW(        src_screen16,   dest_screen16, isRGB24);
-                                       dest_screen16 += VIDEO_WIDTH;
-                                       src_screen16  += h0;
-                               }
-                               break;
-                       case 384:
-                               for(int y1=y0+h1; y0<y1; y0+=incY)
-                               {
-                                       if(( 0 == (y0&li) ) && (flag=!flag)) GPU_BlitWWWWWS(    src_screen16,   dest_screen16, isRGB24);
-                                       dest_screen16 += VIDEO_WIDTH;
-                                       src_screen16  += h0;
-                               }
-                               break;
-                       case 512:
-                               for(int y1=y0+h1; y0<y1; y0+=incY)
-                               {
-                                       if(( 0 == (y0&li) ) && (flag=!flag)) GPU_BlitWWSWWSWS(  src_screen16, dest_screen16, isRGB24);
-                                       dest_screen16 += VIDEO_WIDTH;
-                                       src_screen16  += h0;
-                               }
-                               break;
-                       case 640:
-                               for(int y1=y0+h1; y0<y1; y0+=incY)
-                               {
-                                       if(( 0 == (y0&li) ) && (flag=!flag)) GPU_BlitWS(        src_screen16, dest_screen16, isRGB24);
-                                       dest_screen16 += VIDEO_WIDTH;
-                                       src_screen16  += h0;
-                               }
-                               break;
-               }
-               progressInterlace_flag=!flag;
+               progressInterlace_flag=!progressInterlace_flag;
        }
        video_flip();
 }
@@ -789,7 +748,7 @@ void  GPU_updateLace(void)
        GPU_GP1 ^= 0x80000000;
 
        // Update display
-       if ((!skipFrame) && (!isSkip) && (!(((GPU_GP1&0x08000000))||((GPU_GP1&0x00800000)))))
+       if ((!skipFrame) && (!isSkip) && (fb_dirty) && (!(((GPU_GP1&0x08000000))||((GPU_GP1&0x00800000)))))
        {
                gpuVideoOutput(); // Display updated
 
@@ -803,18 +762,18 @@ void  GPU_updateLace(void)
                        linesInterlace = linesInterlace_user; // resolution changed from 480 to lower one
                        video_clear();
                }
+       }
 
-               // Limit FPS
-               if (frameLimit)
+       // Limit FPS
+       if (frameLimit)
+       {
+               static unsigned next=get_ticks();
+               if (!skipFrame)
                {
-                       static unsigned next=get_ticks();
                        unsigned now=get_ticks();
-                       if (!skipFrame)
-                       {
-                               if (now<next) wait_ticks(next-now);
-                       }
-                       next+=(isPAL?(1000000/50):((unsigned)(1000000.0/59.94)));
+                       if (now<next) wait_ticks(next-now);
                }
+               next+=(isPAL?(1000000/50):((unsigned)(1000000.0/59.94)));
        }
 
        // Show FPS statistics
@@ -822,7 +781,7 @@ void  GPU_updateLace(void)
        {
                static u32 real_fps=0;
                static u32 prev=get_ticks();
-               static char msg[24]="FPS=000/00 SPD=000%";
+               static char msg[32]="FPS=000/00 SPD=000%";
                u32 now=get_ticks();
                real_fps++;
                if ((now-prev)>=1000000)
@@ -853,6 +812,7 @@ void  GPU_updateLace(void)
                        isSkip=true;
                }
        }
+       fb_dirty=false;
 
        pcsx4all_prof_end_with_resume(PCSX4ALL_PROF_GPU,PCSX4ALL_PROF_COUNTERS);
 }
@@ -860,11 +820,10 @@ void  GPU_updateLace(void)
 #else
 
 #include "../../frontend/plugin_lib.h"
+#include "../../frontend/arm_utils.h"
 
 extern "C" {
 
-extern void bgr555_to_rgb565(void *dst, void *src, int bytes);
-extern void bgr888_to_rgb888(void *dst, void *src, int bytes);
 static const struct rearmed_cbs *cbs;
 static void *screen_buf;
 
@@ -876,7 +835,7 @@ static void blit(void)
        u16 *srcs;
        u8  *dest;
 
-       x0 = DisplayArea[0] & ~3; // alignment needed by blitter
+       x0 = DisplayArea[0] & ~1; // alignment needed by blitter
        y0 = DisplayArea[1];
        srcs = &((u16*)GPU_FrameBuffer)[FRAME_OFFSET(x0,y0)];
 
@@ -894,16 +853,23 @@ static void blit(void)
                old_res_horz = w0;
                old_res_vert = h1;
                old_rgb24 = (s16)isRGB24;
-               screen_buf = cbs->pl_fbdev_set_mode(w0, h1, isRGB24 ? 24 : 16);
+               screen_buf = cbs->pl_vout_set_mode(w0, h1, isRGB24 ? 24 : 16);
        }
        dest = (u8 *)screen_buf;
 
        if (isRGB24)
        {
+#ifndef MAEMO
                for (; h1-- > 0; dest += w0 * 3, srcs += 1024)
                {
                        bgr888_to_rgb888(dest, srcs, w0 * 3);
                }
+#else
+               for (; h1-- > 0; dest += w0 * 2, srcs += 1024)
+               {
+                       bgr888_to_rgb565(dest, srcs, w0 * 3);
+               }
+#endif
        }
        else
        {
@@ -913,7 +879,7 @@ static void blit(void)
                }
        }
 
-       screen_buf = cbs->pl_fbdev_flip();
+       screen_buf = cbs->pl_vout_flip();
 }
 
 void GPU_updateLace(void)
@@ -924,27 +890,30 @@ void GPU_updateLace(void)
        if (!fb_dirty || (GPU_GP1&0x08800000))
                return;
 
-       if (!isSkip) {
+       if (!wasSkip) {
                blit();
-
                fb_dirty = false;
-               if (*cbs->fskip_option)
-                       isSkip = true;
+               skCount = 0;
        }
-       else
-               isSkip = false;
+       else {
+               skCount++;
+               if (skCount >= 8)
+                       wasSkip = isSkip = 0;
+       }
+
+       skipFrame = cbs->fskip_advice;
 }
 
 long GPUopen(unsigned long *, char *, char *)
 {
-       cbs->pl_fbdev_open();
-       screen_buf = cbs->pl_fbdev_flip();
+       cbs->pl_vout_open(); /* plugin open entry point: invoke the pl_vout_open callback from the registered callback table (all three arguments are unused) */
+       screen_buf = cbs->pl_vout_flip(); /* keep the pointer returned by the flip callback; blit() uses screen_buf as its destination */
        return 0;
 }
 
 long GPUclose(void)
 {
-       cbs->pl_fbdev_close();
+       cbs->pl_vout_close(); /* plugin close entry point: invoke the pl_vout_close callback; the function then unconditionally returns 0 */
        return 0;
 }
 
@@ -958,6 +927,10 @@ long GPUfreeze(unsigned int ulGetFreezeData, GPUFreeze_t* p2)
 
 void GPUrearmedCallbacks(const struct rearmed_cbs *cbs_)
 {
+       enableAbbeyHack = cbs_->gpu_unai.abe_hack; /* copy the gpu_unai options out of the callback struct into the plugin globals; cbs_ is dereferenced without a NULL check */
+       light = !cbs_->gpu_unai.no_light; /* option is stored negated: lighting stays on unless no_light is set */
+       blend = !cbs_->gpu_unai.no_blend; /* same negation: blending stays on unless no_blend is set */
+
        cbs = cbs_;
 }