+ unsigned int *dpal=(void *)localPal;
+ int i;
+
+ //for (i = 0x3f/2; i >= 0; i--)
+ // dpal[i] = ((spal[i]&0x000f000f)<< 1)|((spal[i]&0x00f000f0)<<3)|((spal[i]&0x0f000f00)<<4);
+ do_pal_convert(localPal, Pico.cram, currentConfig.gamma, currentConfig.gamma2);
+
+ Pico.m.dirtyPal = 0;
+ need_pal_upload = 1;
+
+ if (allow_sh && (Pico.video.reg[0xC]&8)) // shadow/hilight?
+ {
+ // shadowed pixels
+ for (i = 0x3f/2; i >= 0; i--)
+ dpal[0x20|i] = dpal[0x60|i] = (dpal[i]>>1)&0x7bcf7bcf;
+ // hilighted pixels
+ for (i = 0x3f; i >= 0; i--) {
+ int t=localPal[i]&0xf79e;t+=0x4208;
+ if (t&0x20) t|=0x1e;
+ if (t&0x800) t|=0x780;
+ if (t&0x10000) t|=0xf000;
+ t&=0xf79e;
+ localPal[0x80|i]=(unsigned short)t;
+ }
+ localPal[0xe0] = 0;
+ localPal[0xf0] = 0x001f;
+ }
+ else if (allow_as && (rendstatus & PDRAW_SPR_LO_ON_HI))
+ {
+ memcpy32((int *)dpal+0x80/2, (void *)localPal, 0x40*2/4);
+ }
+}
+
+ /*
+  * Convert already-rendered 8-bit lines to 16-bit through localPal.
+  *
+  * Every line from the first visible one up to (not including) line_to is
+  * passed to the current amips_clut_f converter. Source rows are 512 bytes
+  * apart starting at VRAM_CACHED_STUFF + 16; destination rows are 512
+  * 16-bit pixels apart starting 512*240 bytes into VRAM_STUFF.
+  */
+ static void do_slowmode_lines(int line_to)
+ {
+     /* reg[12] bit 0 selects a 320 pixel wide line, otherwise 256 */
+     const int width = (Pico.video.reg[12] & 1) ? 320 : 256;
+     /* when reg[1] bit 3 is clear the first 8 lines are skipped */
+     const int first = (Pico.video.reg[1] & 8) ? 0 : 8;
+     unsigned short *out = (unsigned short *)VRAM_STUFF + 512*240/2 + 512*first;
+     unsigned char *in = (unsigned char *)VRAM_CACHED_STUFF + 16 + 512*first;
+     int y;
+
+     for (y = first; y < line_to; y++) {
+         amips_clut_f(out, in, localPal, width);
+         out += 512;
+         in += 512;
+     }
+ }
+
+ /*
+  * Per-frame setup for the line renderer: resets HighCol, counts down the
+  * dynamic_palette timer, refreshes the palette if it is dirty and selects
+  * the colour-lookup routine used for 8-bit to 16-bit conversion.
+  */
+ static void EmuScanPrepare(void)
+ {
+     unsigned char *line_buf = (unsigned char *)VRAM_CACHED_STUFF + 8;
+
+     /* start 8 lines further down when reg[1] bit 3 is clear */
+     if (!(Pico.video.reg[1] & 8))
+         line_buf += 8*512;
+     HighCol = line_buf;
+
+     if (dynamic_palette > 0)
+         dynamic_palette--;
+
+     if (Pico.m.dirtyPal)
+         do_pal_update(1, 1);
+
+     /* the 6bit variant is only used with PDRAW_SPR_LO_ON_HI set and reg[0xC] bit 3 clear */
+     if (!(rendstatus & PDRAW_SPR_LO_ON_HI) || (Pico.video.reg[0xC] & 8))
+         amips_clut_f = amips_clut;
+     else
+         amips_clut_f = amips_clut_6bit;
+ }
+
+ /*
+  * Line-begin callback (installed via PicoDrawSetCallbacks).
+  *
+  * While dynamic_palette is zero, HighCol is pointed at row `num` of the
+  * 8-bit buffer (512 bytes per row, 8 bytes in). Otherwise HighCol is left
+  * untouched. Always returns 0.
+  */
+ static int EmuScanSlowBegin(unsigned int num)
+ {
+     if (dynamic_palette == 0) {
+         unsigned char *base = (unsigned char *)VRAM_CACHED_STUFF;
+
+         HighCol = base + num * 512 + 8;
+     }
+
+     return 0;
+ }
+
+ /*
+  * Line-end callback (installed via PicoDrawSetCallbacks).
+  *
+  * If the palette changed during the frame, the lines rendered so far are
+  * first converted to 16-bit with the old palette and dynamic_palette mode
+  * is entered; only then is the palette refreshed. While dynamic_palette
+  * is active, the line just rendered is converted to 16-bit as well.
+  * Always returns 0.
+  */
+ static int EmuScanSlowEnd(unsigned int num)
+ {
+     if (Pico.m.dirtyPal) {
+         if (dynamic_palette == 0) {
+             /* must run before do_pal_update() so earlier lines keep their colours */
+             do_slowmode_lines(num);
+             dynamic_palette = 3; // last for 2 more frames
+         }
+         do_pal_update(1, 1);
+     }
+
+     if (dynamic_palette != 0) {
+         const int width = (Pico.video.reg[12] & 1) ? 320 : 256;
+         /* row `num` of the 16-bit image: 512 pixels * 2 bytes per row */
+         void *out = (char *)VRAM_STUFF + 512*240 + 512*2*num;
+
+         amips_clut_f(out, HighCol + 8, localPal, width);
+     }
+
+     return 0;
+ }
+
+ /* Build and finish a GU display list that draws the emulated frame into the
+  * framebuffer selected by psp_screen (plus fbimg_offs).
+  *
+  * The texture source depends on dynamic_palette:
+  *  - non-zero: the 16-bit (GU_PSM_5650) image at VRAM_STUFF + 512*240, which
+  *    the scanline callbacks fill through amips_clut_f;
+  *  - zero: the 8-bit indexed (GU_PSM_T8) image at VRAM_STUFF + 16, coloured
+  *    by the CLUT that is loaded from localPal.
+  * blit_16bit_mode remembers which of the two is currently bound, so the
+  * texture state is only re-sent when the mode actually changes.
+  */ static void blitscreen_clut(void)
+ {
+ int offs = fbimg_offs;
+ offs += (psp_screen == VRAM_FB0) ? VRAMOFFS_FB0 : VRAMOFFS_FB1; // pick the offset matching the buffer psp_screen points at
+
+ sceGuSync(0,0); // sync with prev
+ sceGuStart(GU_DIRECT, guCmdList);
+ sceGuDrawBuffer(GU_PSM_5650, (void *)offs, 512); // point to back buffer
+
+ if (dynamic_palette)
+ {
+ if (!blit_16bit_mode) { // the current mode is not 16bit
+ sceGuTexMode(GU_PSM_5650, 0, 0, 0);
+ sceGuTexImage(0,512,512,512,(char *)VRAM_STUFF + 512*240);
+
+ blit_16bit_mode = 1;
+ }
+ }
+ else
+ {
+ if (blit_16bit_mode) { // coming back from 16-bit mode: restore CLUT + 8-bit texture state
+ sceGuClutMode(GU_PSM_5650,0,0xff,0);
+ sceGuTexMode(GU_PSM_T8,0,0,0); // 8-bit image
+ sceGuTexImage(0,512,512,512,(char *)VRAM_STUFF + 16);
+ blit_16bit_mode = 0;
+ }
+
+ if ((PicoOpt&0x10) && Pico.m.dirtyPal) // with PicoOpt bit 0x10 set the palette is refreshed here instead of in the scanline callbacks
+ do_pal_update(0, 0);
+
+ sceKernelDcacheWritebackAll(); // flush CPU-side writes (image, localPal) before the GU reads them
+
+ if (need_pal_upload) {
+ need_pal_upload = 0;
+ sceGuClutLoad((256/8), localPal); // upload 32*8 entries (256)
+ }
+ }
+
+ #if 1 // sliced drawing enabled; set to 0 to always draw one big sprite
+ if (g_vertices[0].u == 0 && g_vertices[1].u == g_vertices[1].x) // texture width equals on-screen width starting at u=0
+ {
+ struct Vertex* vertices;
+ int x;
+
+ #define SLICE_WIDTH 32 // width of each vertical strip; note: the macro stays defined for the rest of the file
+ for (x = 0; x < g_vertices[1].x; x += SLICE_WIDTH)
+ {
+ // render sprite
+ vertices = (struct Vertex*)sceGuGetMemory(2 * sizeof(struct Vertex)); // per-slice vertex pair allocated from the display list
+ memcpy(vertices, g_vertices, 2 * sizeof(struct Vertex)); // keep y/v (and any other fields) from g_vertices
+ vertices[0].u = vertices[0].x = x;
+ vertices[1].u = vertices[1].x = x + SLICE_WIDTH; // NOTE(review): the last slice overshoots if the width is not a multiple of SLICE_WIDTH
+ sceGuDrawArray(GU_SPRITES,GU_TEXTURE_16BIT|GU_VERTEX_16BIT|GU_TRANSFORM_2D,2,0,vertices);
+ }
+ // lprintf("listlen: %iB\n", sceGuCheckList()); // ~480 only
+ }
+ else
+ #endif
+ sceGuDrawArray(GU_SPRITES,GU_TEXTURE_16BIT|GU_VERTEX_16BIT|GU_TRANSFORM_2D,2,0,g_vertices); // single sprite covering the whole image
+
+ sceGuFinish(); // list is closed here; callers sync later (sceGuSync at the top of the next call)
+ }
+
+
+ /*
+  * Draw two small indicators into the current screen buffer.
+  *
+  * Bit 1 of s68k_regs[0] lights the first one (col_g in the original
+  * naming), bit 0 the second (col_r). Each indicator is 4 pixels wide and
+  * 3 rows tall; every 32-bit store writes two 16-bit pixels.
+  */
+ static void cd_leds(void)
+ {
+     unsigned int status = Pico_mcd->s68k_regs[0];
+     unsigned int green = (status & 2) ? 0x06000600 : 0;
+     unsigned int red = (status & 1) ? 0x00180018 : 0;
+     /* start at row 2, pixel 6 of the 512 pixel wide 16-bit buffer */
+     unsigned int *row = (unsigned int *)((short *)psp_screen + 512*2+4+2);
+     int y;
+
+     /* one screen row is 512/2 32-bit words */
+     for (y = 0; y < 3; y++, row += 512/2) {
+         row[0] = green;
+         row[1] = green;
+         /* words 2 and 3 are left untouched as a gap */
+         row[4] = red;
+         row[5] = red;
+     }
+ }
+
+ /*
+  * Stamp a 3x3 pen marker into the 8-bit image at the Pico pen position.
+  *
+  * Does nothing when the pen is disabled (pico_inp_mode == 0) or when the
+  * blitter is in 16-bit mode. The marker uses palette indices 0xe0 for the
+  * corners and 0xf0 for the cross.
+  */
+ static void draw_pico_ptr(void)
+ {
+     static const unsigned char marker[3][3] = {
+         { 0xe0, 0xf0, 0xe0 },
+         { 0xf0, 0xf0, 0xf0 },
+         { 0xe0, 0xf0, 0xe0 },
+     };
+     unsigned char *p = (unsigned char *)VRAM_STUFF + 16;
+     int r, c;
+
+     // only if pen enabled and for 8bit mode
+     if (pico_inp_mode == 0 || blit_16bit_mode)
+         return;
+
+     p += 512 * (pico_pen_y + PICO_PEN_ADJUST_Y);
+     p += pico_pen_x + PICO_PEN_ADJUST_X;
+
+     /* rows are 512 bytes apart; columns run from -1 to +1 around p */
+     for (r = 0; r < 3; r++)
+         for (c = 0; c < 3; c++)
+             p[512 * r + c - 1] = marker[r][c];
+ }
+
+
+ #if 0 // debug overlay, compiled out; the matching call in blit2() is commented out as well
+ static void dbg_text(void) // prints whether sliced drawing and 16-bit blit mode are active, at (2, 256)
+ {
+ int *p, h, len;
+ char text[128];
+
+ sprintf(text, "sl: %i, 16b: %i", g_vertices[0].u == 0 && g_vertices[1].u == g_vertices[1].x, blit_16bit_mode); // "sl" is the same condition blitscreen_clut() tests before drawing in slices
+ len = strlen(text) * 8 / 2; // presumably 8 pixels per glyph * 2 bytes per pixel / 4 bytes per word -- TODO confirm glyph width
+ for (h = 0; h < 8; h++) { // clear 8 rows behind the text
+ p = (int *) ((unsigned short *) psp_screen+2+512*(256+h));
+ p = (int *) ((int)p & ~3); // align (NOTE(review): the (int) cast assumes pointers fit in an int)
+ memset32_uncached(p, 0, len);
+ }
+ emu_text_out16(2, 256, text);
+ }
+ #endif
+
+ /*
+  * Called after rendering is done, but before frame emulation has finished.
+  *
+  * With PicoOpt bit 0x10 set, the top 8 and bottom 8 rows of PicoDraw2FB
+  * are filled with palette index 0xe0 first. The Pico pen marker is drawn
+  * when running Pico hardware, then the frame is queued for blitting.
+  */
+ void blit1(void)
+ {
+     if (PicoOpt & 0x10)
+     {
+         // clear top and bottom trash
+         unsigned char *top = PicoDraw2FB + 8;
+         unsigned char *bottom = PicoDraw2FB + 512*232 + 8;
+         int row;
+
+         for (row = 0; row < 8; row++)
+             memset32((int *)(top + 512 * row), 0xe0e0e0e0, 320/4);
+         for (row = 0; row < 8; row++)
+             memset32((int *)(bottom + 512 * row), 0xe0e0e0e0, 320/4);
+     }
+
+     if (PicoAHW & PAHW_PICO) {
+         draw_pico_ptr();
+     }
+
+     blitscreen_clut();
+ }
+
+
+ /*
+  * Draw the on-screen overlays and present the frame.
+  *
+  * fps            - text shown at OSD_FPS_X when EmuOpt bit 2 is set
+  * notice         - optional message shown at x = 4; NULL for none
+  * lagging_behind - non-zero suppresses vsync when EmuOpt bit 0x10000 is set
+  */
+ static void blit2(const char *fps, const char *notice, int lagging_behind)
+ {
+     int emu_opt = currentConfig.EmuOpt;
+     int vsync;
+
+     if (notice)
+         osd_text(4, notice, 0, 0);
+     if (emu_opt & 2)
+         osd_text(OSD_FPS_X, fps, 0, 0);
+
+     //dbg_text();
+
+     if ((emu_opt & 0x400) && (PicoAHW & PAHW_MCD))
+         cd_leds();
+
+     /* vsync is wanted with bit 0x2000; bit 0x10000 drops it while lagging */
+     vsync = (currentConfig.EmuOpt & 0x2000) &&
+             (!(currentConfig.EmuOpt & 0x10000) || !lagging_behind);
+
+     psp_video_flip(vsync);
+ }
+
+ /*
+  * Clears the whole screen or just the notice area (in all buffers).
+  *
+  * full != 0: both framebuffers are zeroed (with a flip in between), the
+  *            8-bit image is filled with palette index 0xe0 and the 16-bit
+  *            image that follows it is zeroed.
+  * full == 0: only the 8 rows starting at row 264 are zeroed, in psp_screen
+  *            and in the active framebuffer.
+  */
+ static void clearArea(int full)
+ {
+     if (!full) {
+         void *fb = psp_video_get_active_fb();
+
+         memset32_uncached((int *)((char *)psp_screen + 512*264*2), 0, 512*8*2/4);
+         memset32_uncached((int *)((char *)fb + 512*264*2), 0, 512*8*2/4);
+         return;
+     }
+
+     memset32_uncached(psp_screen, 0, 512*272*2/4);
+     psp_video_flip(0);
+     /* psp_screen is cleared again after the flip to cover the other buffer */
+     memset32_uncached(psp_screen, 0, 512*272*2/4);
+     memset32(VRAM_CACHED_STUFF, 0xe0e0e0e0, 512*240/4);
+     memset32((int *)VRAM_CACHED_STUFF+512*240/4, 0, 512*240*2/4);
+ }
+
+ /* Reset the GU texture state and the renderer hooks to the default
+  * "hardware CLUT" configuration: 8-bit indexed texture at VRAM_STUFF + 16,
+  * 16-bit (5650) CLUT entries, slow-renderer scanline callbacks installed,
+  * palette marked dirty and both blit_16bit_mode and dynamic_palette cleared.
+  */ static void vidResetMode(void)
+ {
+ // setup GU
+ sceGuSync(0,0); // sync with prev
+ sceGuStart(GU_DIRECT, guCmdList);
+
+ sceGuClutMode(GU_PSM_5650,0,0xff,0); // same CLUT settings blitscreen_clut() restores when leaving 16-bit mode
+ sceGuTexMode(GU_PSM_T8,0,0,0); // 8-bit image
+ sceGuTexFunc(GU_TFX_REPLACE,GU_TCC_RGB);
+ if (currentConfig.scaling) // any non-zero scaling setting gets linear filtering
+ sceGuTexFilter(GU_LINEAR, GU_LINEAR);
+ else sceGuTexFilter(GU_NEAREST, GU_NEAREST);
+ sceGuTexScale(1.0f,1.0f);
+ sceGuTexOffset(0.0f,0.0f);
+
+ sceGuTexImage(0,512,512,512,(char *)VRAM_STUFF + 16);
+
+ // slow rend.
+ PicoDrawSetOutFormat(PDF_NONE, 0);
+ PicoDrawSetCallbacks(EmuScanSlowBegin, EmuScanSlowEnd);
+
+ localPal[0xe0] = 0; // index 0xe0 is the fill value used for border clearing and the pen marker corners
+ localPal[0xf0] = 0x001f; // index 0xf0 is the pen marker colour (see draw_pico_ptr)
+ Pico.m.dirtyPal = 1; // force a palette conversion and CLUT upload on the next frame
+ blit_16bit_mode = dynamic_palette = 0;
+
+ sceGuFinish();
+ set_scaling_params();
+ sceGuSync(0,0); // wait for the list to complete before returning
+ }
+
+ /*
+  * Append a line naming the current blit mode to str: "soft clut" while the
+  * 16-bit (software lookup) path is active, "hard clut" otherwise.
+  * The caller must provide enough room in str for the appended text.
+  */
+ void plat_debug_cat(char *str)
+ {
+     const char *mode = blit_16bit_mode ? "soft clut\n" : "hard clut\n";
+
+     strcat(str, mode);
+ }
+
+
+ /* sound stuff
+  *
+  * sndBuffer is used as a ring of 16-bit samples. sound_thread() plays it in
+  * chunks of samples_block shorts starting at snd_playptr and wraps back to
+  * sndBuffer once snd_playptr reaches sndBuffer_endptr. samples_made and
+  * samples_done are running counters; their difference is the amount of
+  * queued data the thread compares against samples_block.
+  */
+ #define SOUND_BLOCK_SIZE_NTSC (1470*2) // 1024 // 1152 (presumably earlier values that were tried); 1470 = 44100/30
+ #define SOUND_BLOCK_SIZE_PAL (1764*2) // 1764 = 44100/25; TODO confirm the *2 is for stereo
+ #define SOUND_BLOCK_COUNT 8 // number of PAL-sized blocks the buffer is dimensioned for
+
+ static short __attribute__((aligned(4))) sndBuffer[SOUND_BLOCK_SIZE_PAL*SOUND_BLOCK_COUNT + 44100/50*2]; // block storage plus 44100/50*2 extra shorts of slack
+ static short *snd_playptr = NULL, *sndBuffer_endptr = NULL; // playback position and wrap-around limit; both are set up outside this excerpt
+ static int samples_made = 0, samples_done = 0, samples_block = 0; // produced / played counters and the per-output chunk size
+ static int sound_thread_exit = 0; // set non-zero to make sound_thread() leave its loop
+ static SceUID sound_sem = -1; // semaphore sound_thread() waits on for more data; -1 until created
+
+ static void writeSound(int len); // forward declaration; defined later in the file
+
+static int sound_thread(SceSize args, void *argp)
+{
+ int ret = 0;
+
+ lprintf("sthr: started, priority %i\n", sceKernelGetThreadCurrentPriority());
+
+ while (!sound_thread_exit)
+ {
+ if (samples_made - samples_done < samples_block) {
+ // wait for data (use at least 2 blocks)
+ //lprintf("sthr: wait... (%i)\n", samples_made - samples_done);
+ while (samples_made - samples_done <= samples_block*2 && !sound_thread_exit)
+ ret = sceKernelWaitSema(sound_sem, 1, 0);
+ if (ret < 0) lprintf("sthr: sceKernelWaitSema: %i\n", ret);
+ continue;
+ }
+
+ // lprintf("sthr: got data: %i\n", samples_made - samples_done);
+
+ ret = sceAudio_E0727056(PSP_AUDIO_VOLUME_MAX, snd_playptr);
+
+ samples_done += samples_block;
+ snd_playptr += samples_block;
+ if (snd_playptr >= sndBuffer_endptr)
+ snd_playptr = sndBuffer;
+ // 1.5 kernel returns 0, newer ones return # of samples queued
+ if (ret < 0)
+ lprintf("sthr: sceAudio_E0727056: %08x; pos %i/%i\n", ret, samples_done, samples_made);
+
+ // shouldn't happen, but just in case
+ if (samples_made - samples_done >= samples_block*3) {
+ //lprintf("sthr: block skip (%i)\n", samples_made - samples_done);
+ samples_done += samples_block; // skip
+ snd_playptr += samples_block;
+ }
+