--- /dev/null
+/* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * *
+ * Mupen64plus-rsp-hle - ucode1.cpp *
+ * Mupen64Plus homepage: http://code.google.com/p/mupen64plus/ *
+ * Copyright (C) 2009 Richard Goedeken *
+ * Copyright (C) 2002 Hacktarux *
+ * *
+ * This program is free software; you can redistribute it and/or modify *
+ * it under the terms of the GNU General Public License as published by *
+ * the Free Software Foundation; either version 2 of the License, or *
+ * (at your option) any later version. *
+ * *
+ * This program is distributed in the hope that it will be useful, *
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of *
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
+ * GNU General Public License for more details. *
+ * *
+ * You should have received a copy of the GNU General Public License *
+ * along with this program; if not, write to the *
+ * Free Software Foundation, Inc., *
+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. *
+ * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
+
+# include <string.h>
+
+extern "C" {
+ #include "hle.h"
+ #include "alist_internal.h"
+}
+
+//#include "rsp.h"
+//#define SAFE_MEMORY
+/*
+#ifndef SAFE_MEMORY
+# define wr8 (src , address);
+# define rd8 (dest, address);
+# define wr16 (src, address);
+# define rd16 (dest, address);
+# define wr32 (src, address);
+# define rd32 (dest, address);
+# define wr64 (src, address);
+# define rd64 (dest, address);
+# define dmamem (dest, src, size) memcpy (dest, src, size);
+# define clrmem (dest, size) memset (dest, 0, size);
+#else
+ void wr8 (u8 src, void *address);
+ void rd8 (u8 dest, void *address);
+ void wr16 (u16 src, void *address);
+ void rd16 (u16 dest, void *address);
+ void wr32 (u16 src, void *address);
+ void rd32 (u16 dest, void *address);
+ void wr64 (u16 src, void *address);
+ void rd64 (u16 dest, void *address);
+ void dmamem (void *dest, void *src, int size);
+ void clrmem (void *dest, int size);
+#endif
+*/
+/******** DMEM Memory Map for ABI 1 ***************
+Address/Range Description
+------------- -------------------------------
+0x000..0x2BF UCodeData
+ 0x000-0x00F Constants - 0000 0001 0002 FFFF 0020 0800 7FFF 4000
+ 0x010-0x02F Function Jump Table (16 Functions * 2 bytes each = 32) 0x20
+ 0x030-0x03F Constants - F000 0F00 00F0 000F 0001 0010 0100 1000
+ 0x040-0x03F Used by the Envelope Mixer (But what for?)
+ 0x070-0x07F Used by the Envelope Mixer (But what for?)
+0x2C0..0x31F <Unknown>
+0x320..0x35F Segments
+0x360 Audio In Buffer (Location)
+0x362 Audio Out Buffer (Location)
+0x364 Audio Buffer Size (Location)
+0x366 Initial Volume for Left Channel
+0x368 Initial Volume for Right Channel
+0x36A Auxillary Buffer #1 (Location)
+0x36C Auxillary Buffer #2 (Location)
+0x36E Auxillary Buffer #3 (Location)
+0x370 Loop Value (shared location)
+0x370 Target Volume (Left)
+0x372 Ramp?? (Left)
+0x374 Rate?? (Left)
+0x376 Target Volume (Right)
+0x378 Ramp?? (Right)
+0x37A Rate?? (Right)
+0x37C Dry??
+0x37E Wet??
+0x380..0x4BF Alist data
+0x4C0..0x4FF ADPCM CodeBook
+0x500..0x5BF <Unknown>
+0x5C0..0xF7F Buffers...
+0xF80..0xFFF <Unknown>
+***************************************************/
+#ifdef USE_EXPANSION
+ #define MEMMASK 0x7FFFFF
+#else
+ #define MEMMASK 0x3FFFFF
+#endif
+
+static void SPNOOP (u32 inst1, u32 inst2) {
+ //MessageBox (NULL, "Unknown Audio Command in ABI 1", "Audio HLE Error", MB_OK);
+}
+
+u32 SEGMENTS[0x10]; // 0x0320
+// T8 = 0x360
+u16 AudioInBuffer; // 0x0000(T8)
+u16 AudioOutBuffer; // 0x0002(T8)
+u16 AudioCount; // 0x0004(T8)
+s16 Vol_Left; // 0x0006(T8)
+s16 Vol_Right; // 0x0008(T8)
+u16 AudioAuxA; // 0x000A(T8)
+u16 AudioAuxC; // 0x000C(T8)
+u16 AudioAuxE; // 0x000E(T8)
+u32 loopval; // 0x0010(T8) // Value set by A_SETLOOP : Possible conflict with SETVOLUME???
+s16 VolTrg_Left; // 0x0010(T8)
+s32 VolRamp_Left; // m_LeftVolTarget
+//u16 VolRate_Left; // m_LeftVolRate
+s16 VolTrg_Right; // m_RightVol
+s32 VolRamp_Right; // m_RightVolTarget
+//u16 VolRate_Right; // m_RightVolRate
+s16 Env_Dry; // 0x001C(T8)
+s16 Env_Wet; // 0x001E(T8)
+
+u8 BufferSpace[0x10000];
+
+short hleMixerWorkArea[256];
+u16 adpcmtable[0x88];
+
+extern const u16 ResampleLUT [0x200] = {
+ 0x0C39, 0x66AD, 0x0D46, 0xFFDF, 0x0B39, 0x6696, 0x0E5F, 0xFFD8,
+ 0x0A44, 0x6669, 0x0F83, 0xFFD0, 0x095A, 0x6626, 0x10B4, 0xFFC8,
+ 0x087D, 0x65CD, 0x11F0, 0xFFBF, 0x07AB, 0x655E, 0x1338, 0xFFB6,
+ 0x06E4, 0x64D9, 0x148C, 0xFFAC, 0x0628, 0x643F, 0x15EB, 0xFFA1,
+ 0x0577, 0x638F, 0x1756, 0xFF96, 0x04D1, 0x62CB, 0x18CB, 0xFF8A,
+ 0x0435, 0x61F3, 0x1A4C, 0xFF7E, 0x03A4, 0x6106, 0x1BD7, 0xFF71,
+ 0x031C, 0x6007, 0x1D6C, 0xFF64, 0x029F, 0x5EF5, 0x1F0B, 0xFF56,
+ 0x022A, 0x5DD0, 0x20B3, 0xFF48, 0x01BE, 0x5C9A, 0x2264, 0xFF3A,
+ 0x015B, 0x5B53, 0x241E, 0xFF2C, 0x0101, 0x59FC, 0x25E0, 0xFF1E,
+ 0x00AE, 0x5896, 0x27A9, 0xFF10, 0x0063, 0x5720, 0x297A, 0xFF02,
+ 0x001F, 0x559D, 0x2B50, 0xFEF4, 0xFFE2, 0x540D, 0x2D2C, 0xFEE8,
+ 0xFFAC, 0x5270, 0x2F0D, 0xFEDB, 0xFF7C, 0x50C7, 0x30F3, 0xFED0,
+ 0xFF53, 0x4F14, 0x32DC, 0xFEC6, 0xFF2E, 0x4D57, 0x34C8, 0xFEBD,
+ 0xFF0F, 0x4B91, 0x36B6, 0xFEB6, 0xFEF5, 0x49C2, 0x38A5, 0xFEB0,
+ 0xFEDF, 0x47ED, 0x3A95, 0xFEAC, 0xFECE, 0x4611, 0x3C85, 0xFEAB,
+ 0xFEC0, 0x4430, 0x3E74, 0xFEAC, 0xFEB6, 0x424A, 0x4060, 0xFEAF,
+ 0xFEAF, 0x4060, 0x424A, 0xFEB6, 0xFEAC, 0x3E74, 0x4430, 0xFEC0,
+ 0xFEAB, 0x3C85, 0x4611, 0xFECE, 0xFEAC, 0x3A95, 0x47ED, 0xFEDF,
+ 0xFEB0, 0x38A5, 0x49C2, 0xFEF5, 0xFEB6, 0x36B6, 0x4B91, 0xFF0F,
+ 0xFEBD, 0x34C8, 0x4D57, 0xFF2E, 0xFEC6, 0x32DC, 0x4F14, 0xFF53,
+ 0xFED0, 0x30F3, 0x50C7, 0xFF7C, 0xFEDB, 0x2F0D, 0x5270, 0xFFAC,
+ 0xFEE8, 0x2D2C, 0x540D, 0xFFE2, 0xFEF4, 0x2B50, 0x559D, 0x001F,
+ 0xFF02, 0x297A, 0x5720, 0x0063, 0xFF10, 0x27A9, 0x5896, 0x00AE,
+ 0xFF1E, 0x25E0, 0x59FC, 0x0101, 0xFF2C, 0x241E, 0x5B53, 0x015B,
+ 0xFF3A, 0x2264, 0x5C9A, 0x01BE, 0xFF48, 0x20B3, 0x5DD0, 0x022A,
+ 0xFF56, 0x1F0B, 0x5EF5, 0x029F, 0xFF64, 0x1D6C, 0x6007, 0x031C,
+ 0xFF71, 0x1BD7, 0x6106, 0x03A4, 0xFF7E, 0x1A4C, 0x61F3, 0x0435,
+ 0xFF8A, 0x18CB, 0x62CB, 0x04D1, 0xFF96, 0x1756, 0x638F, 0x0577,
+ 0xFFA1, 0x15EB, 0x643F, 0x0628, 0xFFAC, 0x148C, 0x64D9, 0x06E4,
+ 0xFFB6, 0x1338, 0x655E, 0x07AB, 0xFFBF, 0x11F0, 0x65CD, 0x087D,
+ 0xFFC8, 0x10B4, 0x6626, 0x095A, 0xFFD0, 0x0F83, 0x6669, 0x0A44,
+ 0xFFD8, 0x0E5F, 0x6696, 0x0B39, 0xFFDF, 0x0D46, 0x66AD, 0x0C39
+};
+
+static void CLEARBUFF (u32 inst1, u32 inst2) {
+ u32 addr = (u32)(inst1 & 0xffff);
+ u32 count = (u32)(inst2 & 0xffff);
+ addr &= 0xFFFC;
+ memset(BufferSpace+addr, 0, (count+3)&0xFFFC);
+}
+
+//FILE *dfile = fopen ("d:\\envmix.txt", "wt");
+
+static void ENVMIXER (u32 inst1, u32 inst2) {
+ //static int envmixcnt = 0;
+ u8 flags = (u8)((inst1 >> 16) & 0xff);
+ u32 addy = (inst2 & 0xFFFFFF);// + SEGMENTS[(inst2>>24)&0xf];
+ //static
+// ********* Make sure these conditions are met... ***********
+ /*if ((AudioInBuffer | AudioOutBuffer | AudioAuxA | AudioAuxC | AudioAuxE | AudioCount) & 0x3) {
+ MessageBox (NULL, "Unaligned EnvMixer... please report this to Azimer with the following information: RomTitle, Place in the rom it occurred, and any save state just before the error", "AudioHLE Error", MB_OK);
+ }*/
+// ------------------------------------------------------------
+ short *inp=(short *)(BufferSpace+AudioInBuffer);
+ short *out=(short *)(BufferSpace+AudioOutBuffer);
+ short *aux1=(short *)(BufferSpace+AudioAuxA);
+ short *aux2=(short *)(BufferSpace+AudioAuxC);
+ short *aux3=(short *)(BufferSpace+AudioAuxE);
+ s32 MainR;
+ s32 MainL;
+ s32 AuxR;
+ s32 AuxL;
+ int i1,o1,a1,a2=0,a3=0;
+ unsigned short AuxIncRate=1;
+ short zero[8];
+ memset(zero,0,16);
+ s32 LVol, RVol;
+ s32 LAcc, RAcc;
+ s32 LTrg, RTrg;
+ s16 Wet, Dry;
+ u32 ptr = 0;
+ s32 RRamp, LRamp;
+ s32 LAdderStart, RAdderStart, LAdderEnd, RAdderEnd;
+ s32 oMainR, oMainL, oAuxR, oAuxL;
+
+ //envmixcnt++;
+
+ //fprintf (dfile, "\n----------------------------------------------------\n");
+ if (flags & A_INIT) {
+ LVol = ((Vol_Left * (s32)VolRamp_Left));
+ RVol = ((Vol_Right * (s32)VolRamp_Right));
+ Wet = (s16)Env_Wet; Dry = (s16)Env_Dry; // Save Wet/Dry values
+ LTrg = (VolTrg_Left << 16); RTrg = (VolTrg_Right << 16); // Save Current Left/Right Targets
+ LAdderStart = Vol_Left << 16;
+ RAdderStart = Vol_Right << 16;
+ LAdderEnd = LVol;
+ RAdderEnd = RVol;
+ RRamp = VolRamp_Right;
+ LRamp = VolRamp_Left;
+ } else {
+ // Load LVol, RVol, LAcc, and RAcc (all 32bit)
+ // Load Wet, Dry, LTrg, RTrg
+ memcpy((u8 *)hleMixerWorkArea, (rsp.RDRAM+addy), 80);
+ Wet = *(s16 *)(hleMixerWorkArea + 0); // 0-1
+ Dry = *(s16 *)(hleMixerWorkArea + 2); // 2-3
+ LTrg = *(s32 *)(hleMixerWorkArea + 4); // 4-5
+ RTrg = *(s32 *)(hleMixerWorkArea + 6); // 6-7
+ LRamp= *(s32 *)(hleMixerWorkArea + 8); // 8-9 (hleMixerWorkArea is a 16bit pointer)
+ RRamp= *(s32 *)(hleMixerWorkArea + 10); // 10-11
+ LAdderEnd = *(s32 *)(hleMixerWorkArea + 12); // 12-13
+ RAdderEnd = *(s32 *)(hleMixerWorkArea + 14); // 14-15
+ LAdderStart = *(s32 *)(hleMixerWorkArea + 16); // 12-13
+ RAdderStart = *(s32 *)(hleMixerWorkArea + 18); // 14-15
+ }
+
+ if(!(flags&A_AUX)) {
+ AuxIncRate=0;
+ aux2=aux3=zero;
+ }
+
+ oMainL = (Dry * (LTrg>>16) + 0x4000) >> 15;
+ oAuxL = (Wet * (LTrg>>16) + 0x4000) >> 15;
+ oMainR = (Dry * (RTrg>>16) + 0x4000) >> 15;
+ oAuxR = (Wet * (RTrg>>16) + 0x4000) >> 15;
+
+ for (int y = 0; y < AudioCount; y += 0x10) {
+
+ if (LAdderStart != LTrg) {
+ LAcc = LAdderStart;
+ LVol = (LAdderEnd - LAdderStart) >> 3;
+ LAdderEnd = (s32) (((s64)LAdderEnd * (s64)LRamp) >> 16);
+ LAdderStart = (s32) (((s64)LAcc * (s64)LRamp) >> 16);
+ } else {
+ LAcc = LTrg;
+ LVol = 0;
+ }
+
+ if (RAdderStart != RTrg) {
+ RAcc = RAdderStart;
+ RVol = (RAdderEnd - RAdderStart) >> 3;
+ RAdderEnd = (s32) (((s64)RAdderEnd * (s64)RRamp) >> 16);
+ RAdderStart = (s32) (((s64)RAcc * (s64)RRamp) >> 16);
+ } else {
+ RAcc = RTrg;
+ RVol = 0;
+ }
+
+ for (int x = 0; x < 8; x++) {
+ i1=(int)inp[ptr^S];
+ o1=(int)out[ptr^S];
+ a1=(int)aux1[ptr^S];
+ if (AuxIncRate) {
+ a2=(int)aux2[ptr^S];
+ a3=(int)aux3[ptr^S];
+ }
+ // TODO: here...
+ //LAcc = LTrg;
+ //RAcc = RTrg;
+
+ LAcc += LVol;
+ RAcc += RVol;
+
+ if (LVol <= 0) { // Decrementing
+ if (LAcc < LTrg) {
+ LAcc = LTrg;
+ LAdderStart = LTrg;
+ MainL = oMainL;
+ AuxL = oAuxL;
+ } else {
+ MainL = (Dry * ((s32)LAcc>>16) + 0x4000) >> 15;
+ AuxL = (Wet * ((s32)LAcc>>16) + 0x4000) >> 15;
+ }
+ } else {
+ if (LAcc > LTrg) {
+ LAcc = LTrg;
+ LAdderStart = LTrg;
+ MainL = oMainL;
+ AuxL = oAuxL;
+ } else {
+ MainL = (Dry * ((s32)LAcc>>16) + 0x4000) >> 15;
+ AuxL = (Wet * ((s32)LAcc>>16) + 0x4000) >> 15;
+ }
+ }
+
+ if (RVol <= 0) { // Decrementing
+ if (RAcc < RTrg) {
+ RAcc = RTrg;
+ RAdderStart = RTrg;
+ MainR = oMainR;
+ AuxR = oAuxR;
+ } else {
+ MainR = (Dry * ((s32)RAcc>>16) + 0x4000) >> 15;
+ AuxR = (Wet * ((s32)RAcc>>16) + 0x4000) >> 15;
+ }
+ } else {
+ if (RAcc > RTrg) {
+ RAcc = RTrg;
+ RAdderStart = RTrg;
+ MainR = oMainR;
+ AuxR = oAuxR;
+ } else {
+ MainR = (Dry * ((s32)RAcc>>16) + 0x4000) >> 15;
+ AuxR = (Wet * ((s32)RAcc>>16) + 0x4000) >> 15;
+ }
+ }
+
+ //fprintf (dfile, "%04X ", (LAcc>>16));
+
+ /*MainL = (((s64)Dry*2 * (s64)(LAcc>>16)) + 0x8000) >> 16;
+ MainR = (((s64)Dry*2 * (s64)(RAcc>>16)) + 0x8000) >> 16;
+ AuxL = (((s64)Wet*2 * (s64)(LAcc>>16)) + 0x8000) >> 16;
+ AuxR = (((s64)Wet*2 * (s64)(RAcc>>16)) + 0x8000) >> 16;*/
+/*
+ if (MainL>32767) MainL = 32767;
+ else if (MainL<-32768) MainL = -32768;
+ if (MainR>32767) MainR = 32767;
+ else if (MainR<-32768) MainR = -32768;
+ if (AuxL>32767) AuxL = 32767;
+ else if (AuxL<-32768) AuxR = -32768;
+ if (AuxR>32767) AuxR = 32767;
+ else if (AuxR<-32768) AuxR = -32768;*/
+ /*
+ MainR = (Dry * RTrg + 0x10000) >> 15;
+ MainL = (Dry * LTrg + 0x10000) >> 15;
+ AuxR = (Wet * RTrg + 0x8000) >> 16;
+ AuxL = (Wet * LTrg + 0x8000) >> 16;*/
+
+ o1+=(/*(o1*0x7fff)+*/(i1*MainR)+0x4000)>>15;
+ a1+=(/*(a1*0x7fff)+*/(i1*MainL)+0x4000)>>15;
+
+/* o1=((s64)(((s64)o1*0xfffe)+((s64)i1*MainR*2)+0x8000)>>16);
+
+ a1=((s64)(((s64)a1*0xfffe)+((s64)i1*MainL*2)+0x8000)>>16);*/
+
+ if(o1>32767) o1=32767;
+ else if(o1<-32768) o1=-32768;
+
+ if(a1>32767) a1=32767;
+ else if(a1<-32768) a1=-32768;
+
+ out[ptr^S]=o1;
+ aux1[ptr^S]=a1;
+ if (AuxIncRate) {
+ //a2=((s64)(((s64)a2*0xfffe)+((s64)i1*AuxR*2)+0x8000)>>16);
+
+ //a3=((s64)(((s64)a3*0xfffe)+((s64)i1*AuxL*2)+0x8000)>>16);
+ a2+=(/*(a2*0x7fff)+*/(i1*AuxR)+0x4000)>>15;
+ a3+=(/*(a3*0x7fff)+*/(i1*AuxL)+0x4000)>>15;
+
+ if(a2>32767) a2=32767;
+ else if(a2<-32768) a2=-32768;
+
+ if(a3>32767) a3=32767;
+ else if(a3<-32768) a3=-32768;
+
+ aux2[ptr^S]=a2;
+ aux3[ptr^S]=a3;
+ }
+ ptr++;
+ }
+ }
+
+ /*LAcc = LAdderEnd;
+ RAcc = RAdderEnd;*/
+
+ *(s16 *)(hleMixerWorkArea + 0) = Wet; // 0-1
+ *(s16 *)(hleMixerWorkArea + 2) = Dry; // 2-3
+ *(s32 *)(hleMixerWorkArea + 4) = LTrg; // 4-5
+ *(s32 *)(hleMixerWorkArea + 6) = RTrg; // 6-7
+ *(s32 *)(hleMixerWorkArea + 8) = LRamp; // 8-9 (hleMixerWorkArea is a 16bit pointer)
+ *(s32 *)(hleMixerWorkArea + 10) = RRamp; // 10-11
+ *(s32 *)(hleMixerWorkArea + 12) = LAdderEnd; // 12-13
+ *(s32 *)(hleMixerWorkArea + 14) = RAdderEnd; // 14-15
+ *(s32 *)(hleMixerWorkArea + 16) = LAdderStart; // 12-13
+ *(s32 *)(hleMixerWorkArea + 18) = RAdderStart; // 14-15
+ memcpy(rsp.RDRAM+addy, (u8 *)hleMixerWorkArea,80);
+}
+
+static void RESAMPLE (u32 inst1, u32 inst2) {
+ unsigned char Flags=(u8)((inst1>>16)&0xff);
+ unsigned int Pitch=((inst1&0xffff))<<1;
+ u32 addy = (inst2 & 0xffffff);// + SEGMENTS[(inst2>>24)&0xf];
+ unsigned int Accum=0;
+ unsigned int location;
+ s16 *lut/*, *lut2*/;
+ short *dst;
+ s16 *src;
+ dst=(short *)(BufferSpace);
+ src=(s16 *)(BufferSpace);
+ u32 srcPtr=(AudioInBuffer/2);
+ u32 dstPtr=(AudioOutBuffer/2);
+ s32 temp;
+ s32 accum;
+/*
+ if (addy > (1024*1024*8))
+ addy = (inst2 & 0xffffff);
+*/
+ srcPtr -= 4;
+
+ if ((Flags & 0x1) == 0) {
+ //memcpy (src+srcPtr, rsp.RDRAM+addy, 0x8);
+ for (int x=0; x < 4; x++)
+ src[(srcPtr+x)^S] = ((u16 *)rsp.RDRAM)[((addy/2)+x)^S];
+ Accum = *(u16 *)(rsp.RDRAM+addy+10);
+ } else {
+ for (int x=0; x < 4; x++)
+ src[(srcPtr+x)^S] = 0;//*(u16 *)(rsp.RDRAM+((addy+x)^2));
+ }
+
+ for(int i=0;i < ((AudioCount+0xf)&0xFFF0)/2;i++) {
+ //location = (((Accum * 0x40) >> 0x10) * 8);
+ // location is the fractional position between two samples
+ location = (Accum >> 0xa) * 4;
+ lut = (s16*)ResampleLUT + location;
+
+ // mov eax, dword ptr [src+srcPtr];
+ // movsx edx, word ptr [lut];
+ // shl edx, 1
+ // imul edx
+ // test eax, 08000h
+ // setz ecx
+ // shl ecx, 16
+ // xor eax, 08000h
+ // add eax, ecx
+ // and edx, 0f000h
+
+ // imul
+ temp = ((s32)*(s16*)(src+((srcPtr+0)^S))*((s32)((s16)lut[0])));
+ accum = (s32)(temp >> 15);
+
+ temp = ((s32)*(s16*)(src+((srcPtr+1)^S))*((s32)((s16)lut[1])));
+ accum += (s32)(temp >> 15);
+
+ temp = ((s32)*(s16*)(src+((srcPtr+2)^S))*((s32)((s16)lut[2])));
+ accum += (s32)(temp >> 15);
+
+ temp = ((s32)*(s16*)(src+((srcPtr+3)^S))*((s32)((s16)lut[3])));
+ accum += (s32)(temp >> 15);
+
+ if (accum > 32767) accum = 32767;
+ if (accum < -32768) accum = -32768;
+
+ dst[dstPtr^S] = (accum);
+ dstPtr++;
+ Accum += Pitch;
+ srcPtr += (Accum>>16);
+ Accum&=0xffff;
+ }
+ for (int x=0; x < 4; x++)
+ ((u16 *)rsp.RDRAM)[((addy/2)+x)^S] = src[(srcPtr+x)^S];
+ //memcpy (RSWORK, src+srcPtr, 0x8);
+ *(u16 *)(rsp.RDRAM+addy+10) = Accum;
+}
+
+static void SETVOL (u32 inst1, u32 inst2) {
+// Might be better to unpack these depending on the flags...
+ u8 flags = (u8)((inst1 >> 16) & 0xff);
+ u16 vol = (s16)(inst1 & 0xffff);
+ //u16 voltarg =(u16)((inst2 >> 16)&0xffff);
+ u16 volrate = (u16)((inst2 & 0xffff));
+
+ if (flags & A_AUX) {
+ Env_Dry = (s16)vol; // m_MainVol
+ Env_Wet = (s16)volrate; // m_AuxVol
+ return;
+ }
+
+ if(flags & A_VOL) { // Set the Source(start) Volumes
+ if(flags & A_LEFT) {
+ Vol_Left = (s16)vol; // m_LeftVolume
+ } else { // A_RIGHT
+ Vol_Right = (s16)vol; // m_RightVolume
+ }
+ return;
+ }
+
+//0x370 Loop Value (shared location)
+//0x370 Target Volume (Left)
+//u16 VolRamp_Left; // 0x0012(T8)
+ if(flags & A_LEFT) { // Set the Ramping values Target, Ramp
+ //loopval = (((u32)vol << 0x10) | (u32)voltarg);
+ VolTrg_Left = (s16)inst1; // m_LeftVol
+ //VolRamp_Left = (s32)inst2;
+ VolRamp_Left = (s32)inst2;//(u16)(inst2) | (s32)(s16)(inst2 << 0x10);
+ //fprintf (dfile, "Ramp Left: %f\n", (float)VolRamp_Left/65536.0);
+ //fprintf (dfile, "Ramp Left: %08X\n", inst2);
+ //VolRamp_Left = (s16)voltarg; // m_LeftVolTarget
+ //VolRate_Left = (s16)volrate; // m_LeftVolRate
+ } else { // A_RIGHT
+ VolTrg_Right = (s16)inst1; // m_RightVol
+ //VolRamp_Right = (s32)inst2;
+ VolRamp_Right = (s32)inst2;//(u16)(inst2 >> 0x10) | (s32)(s16)(inst2 << 0x10);
+ //fprintf (dfile, "Ramp Right: %f\n", (float)VolRamp_Right/65536.0);
+ //fprintf (dfile, "Ramp Right: %08X\n", inst2);
+ //VolRamp_Right = (s16)voltarg; // m_RightVolTarget
+ //VolRate_Right = (s16)volrate; // m_RightVolRate
+ }
+}
+
+static void UNKNOWN (u32 inst1, u32 inst2) {}
+
+static void SETLOOP (u32 inst1, u32 inst2) {
+ loopval = (inst2 & 0xffffff);// + SEGMENTS[(inst2>>24)&0xf];
+ //VolTrg_Left = (s16)(loopval>>16); // m_LeftVol
+ //VolRamp_Left = (s16)(loopval); // m_LeftVolTarget
+}
+
+static void ADPCM (u32 inst1, u32 inst2) { // Work in progress! :)
+ unsigned char Flags=(u8)(inst1>>16)&0xff;
+ //unsigned short Gain=(u16)(inst1&0xffff);
+ unsigned int Address=(inst2 & 0xffffff);// + SEGMENTS[(inst2>>24)&0xf];
+ unsigned short inPtr=0;
+ //short *out=(s16 *)(testbuff+(AudioOutBuffer>>2));
+ short *out=(short *)(BufferSpace+AudioOutBuffer);
+ //unsigned char *in=(unsigned char *)(BufferSpace+AudioInBuffer);
+ short count=(short)AudioCount;
+ unsigned char icode;
+ unsigned char code;
+ int vscale;
+ unsigned short index;
+ unsigned short j;
+ int a[8];
+ short *book1,*book2;
+/*
+ if (Address > (1024*1024*8))
+ Address = (inst2 & 0xffffff);
+*/
+ memset(out,0,32);
+
+ if(!(Flags&0x1))
+ {
+ if(Flags&0x2) {
+ memcpy(out,&rsp.RDRAM[loopval&MEMMASK],32);
+ } else {
+ memcpy(out,&rsp.RDRAM[Address],32);
+ }
+ }
+
+ int l1=out[14^S];
+ int l2=out[15^S];
+ int inp1[8];
+ int inp2[8];
+ out+=16;
+ while(count>0)
+ {
+ // the first interation through, these values are
+ // either 0 in the case of A_INIT, from a special
+ // area of memory in the case of A_LOOP or just
+ // the values we calculated the last time
+
+ code=BufferSpace[(AudioInBuffer+inPtr)^S8];
+ index=code&0xf;
+ index<<=4; // index into the adpcm code table
+ book1=(short *)&adpcmtable[index];
+ book2=book1+8;
+ code>>=4; // upper nibble is scale
+ vscale=(0x8000>>((12-code)-1)); // very strange. 0x8000 would be .5 in 16:16 format
+ // so this appears to be a fractional scale based
+ // on the 12 based inverse of the scale value. note
+ // that this could be negative, in which case we do
+ // not use the calculated vscale value... see the
+ // if(code>12) check below
+
+ inPtr++; // coded adpcm data lies next
+ j=0;
+ while(j<8) // loop of 8, for 8 coded nibbles from 4 bytes
+ // which yields 8 short pcm values
+ {
+ icode=BufferSpace[(AudioInBuffer+inPtr)^S8];
+ inPtr++;
+
+ inp1[j]=(s16)((icode&0xf0)<<8); // this will in effect be signed
+ if(code<12)
+ inp1[j]=((int)((int)inp1[j]*(int)vscale)>>16);
+ /*else
+ int catchme=1;*/
+ j++;
+
+ inp1[j]=(s16)((icode&0xf)<<12);
+ if(code<12)
+ inp1[j]=((int)((int)inp1[j]*(int)vscale)>>16);
+ /*else
+ int catchme=1;*/
+ j++;
+ }
+ j=0;
+ while(j<8)
+ {
+ icode=BufferSpace[(AudioInBuffer+inPtr)^S8];
+ inPtr++;
+
+ inp2[j]=(short)((icode&0xf0)<<8); // this will in effect be signed
+ if(code<12)
+ inp2[j]=((int)((int)inp2[j]*(int)vscale)>>16);
+ /*else
+ int catchme=1;*/
+ j++;
+
+ inp2[j]=(short)((icode&0xf)<<12);
+ if(code<12)
+ inp2[j]=((int)((int)inp2[j]*(int)vscale)>>16);
+ /*else
+ int catchme=1;*/
+ j++;
+ }
+
+ a[0]= (int)book1[0]*(int)l1;
+ a[0]+=(int)book2[0]*(int)l2;
+ a[0]+=(int)inp1[0]*(int)2048;
+
+ a[1] =(int)book1[1]*(int)l1;
+ a[1]+=(int)book2[1]*(int)l2;
+ a[1]+=(int)book2[0]*inp1[0];
+ a[1]+=(int)inp1[1]*(int)2048;
+
+ a[2] =(int)book1[2]*(int)l1;
+ a[2]+=(int)book2[2]*(int)l2;
+ a[2]+=(int)book2[1]*inp1[0];
+ a[2]+=(int)book2[0]*inp1[1];
+ a[2]+=(int)inp1[2]*(int)2048;
+
+ a[3] =(int)book1[3]*(int)l1;
+ a[3]+=(int)book2[3]*(int)l2;
+ a[3]+=(int)book2[2]*inp1[0];
+ a[3]+=(int)book2[1]*inp1[1];
+ a[3]+=(int)book2[0]*inp1[2];
+ a[3]+=(int)inp1[3]*(int)2048;
+
+ a[4] =(int)book1[4]*(int)l1;
+ a[4]+=(int)book2[4]*(int)l2;
+ a[4]+=(int)book2[3]*inp1[0];
+ a[4]+=(int)book2[2]*inp1[1];
+ a[4]+=(int)book2[1]*inp1[2];
+ a[4]+=(int)book2[0]*inp1[3];
+ a[4]+=(int)inp1[4]*(int)2048;
+
+ a[5] =(int)book1[5]*(int)l1;
+ a[5]+=(int)book2[5]*(int)l2;
+ a[5]+=(int)book2[4]*inp1[0];
+ a[5]+=(int)book2[3]*inp1[1];
+ a[5]+=(int)book2[2]*inp1[2];
+ a[5]+=(int)book2[1]*inp1[3];
+ a[5]+=(int)book2[0]*inp1[4];
+ a[5]+=(int)inp1[5]*(int)2048;
+
+ a[6] =(int)book1[6]*(int)l1;
+ a[6]+=(int)book2[6]*(int)l2;
+ a[6]+=(int)book2[5]*inp1[0];
+ a[6]+=(int)book2[4]*inp1[1];
+ a[6]+=(int)book2[3]*inp1[2];
+ a[6]+=(int)book2[2]*inp1[3];
+ a[6]+=(int)book2[1]*inp1[4];
+ a[6]+=(int)book2[0]*inp1[5];
+ a[6]+=(int)inp1[6]*(int)2048;
+
+ a[7] =(int)book1[7]*(int)l1;
+ a[7]+=(int)book2[7]*(int)l2;
+ a[7]+=(int)book2[6]*inp1[0];
+ a[7]+=(int)book2[5]*inp1[1];
+ a[7]+=(int)book2[4]*inp1[2];
+ a[7]+=(int)book2[3]*inp1[3];
+ a[7]+=(int)book2[2]*inp1[4];
+ a[7]+=(int)book2[1]*inp1[5];
+ a[7]+=(int)book2[0]*inp1[6];
+ a[7]+=(int)inp1[7]*(int)2048;
+
+ for(j=0;j<8;j++)
+ {
+ a[j^S]>>=11;
+ if(a[j^S]>32767) a[j^S]=32767;
+ else if(a[j^S]<-32768) a[j^S]=-32768;
+ *(out++)=a[j^S];
+ }
+ l1=a[6];
+ l2=a[7];
+
+ a[0]= (int)book1[0]*(int)l1;
+ a[0]+=(int)book2[0]*(int)l2;
+ a[0]+=(int)inp2[0]*(int)2048;
+
+ a[1] =(int)book1[1]*(int)l1;
+ a[1]+=(int)book2[1]*(int)l2;
+ a[1]+=(int)book2[0]*inp2[0];
+ a[1]+=(int)inp2[1]*(int)2048;
+
+ a[2] =(int)book1[2]*(int)l1;
+ a[2]+=(int)book2[2]*(int)l2;
+ a[2]+=(int)book2[1]*inp2[0];
+ a[2]+=(int)book2[0]*inp2[1];
+ a[2]+=(int)inp2[2]*(int)2048;
+
+ a[3] =(int)book1[3]*(int)l1;
+ a[3]+=(int)book2[3]*(int)l2;
+ a[3]+=(int)book2[2]*inp2[0];
+ a[3]+=(int)book2[1]*inp2[1];
+ a[3]+=(int)book2[0]*inp2[2];
+ a[3]+=(int)inp2[3]*(int)2048;
+
+ a[4] =(int)book1[4]*(int)l1;
+ a[4]+=(int)book2[4]*(int)l2;
+ a[4]+=(int)book2[3]*inp2[0];
+ a[4]+=(int)book2[2]*inp2[1];
+ a[4]+=(int)book2[1]*inp2[2];
+ a[4]+=(int)book2[0]*inp2[3];
+ a[4]+=(int)inp2[4]*(int)2048;
+
+ a[5] =(int)book1[5]*(int)l1;
+ a[5]+=(int)book2[5]*(int)l2;
+ a[5]+=(int)book2[4]*inp2[0];
+ a[5]+=(int)book2[3]*inp2[1];
+ a[5]+=(int)book2[2]*inp2[2];
+ a[5]+=(int)book2[1]*inp2[3];
+ a[5]+=(int)book2[0]*inp2[4];
+ a[5]+=(int)inp2[5]*(int)2048;
+
+ a[6] =(int)book1[6]*(int)l1;
+ a[6]+=(int)book2[6]*(int)l2;
+ a[6]+=(int)book2[5]*inp2[0];
+ a[6]+=(int)book2[4]*inp2[1];
+ a[6]+=(int)book2[3]*inp2[2];
+ a[6]+=(int)book2[2]*inp2[3];
+ a[6]+=(int)book2[1]*inp2[4];
+ a[6]+=(int)book2[0]*inp2[5];
+ a[6]+=(int)inp2[6]*(int)2048;
+
+ a[7] =(int)book1[7]*(int)l1;
+ a[7]+=(int)book2[7]*(int)l2;
+ a[7]+=(int)book2[6]*inp2[0];
+ a[7]+=(int)book2[5]*inp2[1];
+ a[7]+=(int)book2[4]*inp2[2];
+ a[7]+=(int)book2[3]*inp2[3];
+ a[7]+=(int)book2[2]*inp2[4];
+ a[7]+=(int)book2[1]*inp2[5];
+ a[7]+=(int)book2[0]*inp2[6];
+ a[7]+=(int)inp2[7]*(int)2048;
+
+ for(j=0;j<8;j++)
+ {
+ a[j^S]>>=11;
+ if(a[j^S]>32767) a[j^S]=32767;
+ else if(a[j^S]<-32768) a[j^S]=-32768;
+ *(out++)=a[j^S];
+ }
+ l1=a[6];
+ l2=a[7];
+
+ count-=32;
+ }
+ out-=16;
+ memcpy(&rsp.RDRAM[Address],out,32);
+}
+
+static void LOADBUFF (u32 inst1, u32 inst2) { // memcpy causes static... endianess issue :(
+ u32 v0;
+ //u32 cnt;
+ if (AudioCount == 0)
+ return;
+ v0 = (inst2 & 0xfffffc);// + SEGMENTS[(inst2>>24)&0xf];
+ memcpy (BufferSpace+(AudioInBuffer&0xFFFC), rsp.RDRAM+v0, (AudioCount+3)&0xFFFC);
+}
+
+static void SAVEBUFF (u32 inst1, u32 inst2) { // memcpy causes static... endianess issue :(
+ u32 v0;
+ //u32 cnt;
+ if (AudioCount == 0)
+ return;
+ v0 = (inst2 & 0xfffffc);// + SEGMENTS[(inst2>>24)&0xf];
+ memcpy (rsp.RDRAM+v0, BufferSpace+(AudioOutBuffer&0xFFFC), (AudioCount+3)&0xFFFC);
+}
+
+static void SETBUFF (u32 inst1, u32 inst2) { // Should work ;-)
+ if ((inst1 >> 0x10) & 0x8) { // A_AUX - Auxillary Sound Buffer Settings
+ AudioAuxA = u16(inst1);
+ AudioAuxC = u16((inst2 >> 0x10));
+ AudioAuxE = u16(inst2);
+ } else { // A_MAIN - Main Sound Buffer Settings
+ AudioInBuffer = u16(inst1); // 0x00
+ AudioOutBuffer = u16((inst2 >> 0x10)); // 0x02
+ AudioCount = u16(inst2); // 0x04
+ }
+}
+
+static void DMEMMOVE (u32 inst1, u32 inst2) { // Doesn't sound just right?... will fix when HLE is ready - 03-11-01
+ u32 v0, v1;
+ u32 cnt;
+ if ((inst2 & 0xffff)==0)
+ return;
+ v0 = (inst1 & 0xFFFF);
+ v1 = (inst2 >> 0x10);
+ //assert ((v1 & 0x3) == 0);
+ //assert ((v0 & 0x3) == 0);
+ u32 count = ((inst2+3) & 0xfffc);
+ //v0 = (v0) & 0xfffc;
+ //v1 = (v1) & 0xfffc;
+
+ //memcpy (BufferSpace+v1, BufferSpace+v0, count-1);
+ for (cnt = 0; cnt < count; cnt++) {
+ *(u8 *)(BufferSpace+((cnt+v1)^S8)) = *(u8 *)(BufferSpace+((cnt+v0)^S8));
+ }
+}
+
+static void LOADADPCM (u32 inst1, u32 inst2) { // Loads an ADPCM table - Works 100% Now 03-13-01
+ u32 v0;
+ v0 = (inst2 & 0xffffff);// + SEGMENTS[(inst2>>24)&0xf];
+/* if (v0 > (1024*1024*8))
+ v0 = (inst2 & 0xffffff);*/
+ //memcpy (dmem+0x4c0, rsp.RDRAM+v0, inst1&0xffff); // Could prolly get away with not putting this in dmem
+ //assert ((inst1&0xffff) <= 0x80);
+ u16 *table = (u16 *)(rsp.RDRAM+v0);
+ for (u32 x = 0; x < ((inst1&0xffff)>>0x4); x++) {
+ adpcmtable[(0x0+(x<<3))^S] = table[0];
+ adpcmtable[(0x1+(x<<3))^S] = table[1];
+
+ adpcmtable[(0x2+(x<<3))^S] = table[2];
+ adpcmtable[(0x3+(x<<3))^S] = table[3];
+
+ adpcmtable[(0x4+(x<<3))^S] = table[4];
+ adpcmtable[(0x5+(x<<3))^S] = table[5];
+
+ adpcmtable[(0x6+(x<<3))^S] = table[6];
+ adpcmtable[(0x7+(x<<3))^S] = table[7];
+ table += 8;
+ }
+}
+
+
+static void INTERLEAVE (u32 inst1, u32 inst2) { // Works... - 3-11-01
+ u32 inL, inR;
+ u16 *outbuff = (u16 *)(AudioOutBuffer+BufferSpace);
+ u16 *inSrcR;
+ u16 *inSrcL;
+ u16 Left, Right, Left2, Right2;
+
+ inL = inst2 & 0xFFFF;
+ inR = (inst2 >> 16) & 0xFFFF;
+
+ inSrcR = (u16 *)(BufferSpace+inR);
+ inSrcL = (u16 *)(BufferSpace+inL);
+
+ for (int x = 0; x < (AudioCount/4); x++) {
+ Left=*(inSrcL++);
+ Right=*(inSrcR++);
+ Left2=*(inSrcL++);
+ Right2=*(inSrcR++);
+
+#ifdef M64P_BIG_ENDIAN
+ *(outbuff++)=Right;
+ *(outbuff++)=Left;
+ *(outbuff++)=Right2;
+ *(outbuff++)=Left2;
+#else
+ *(outbuff++)=Right2;
+ *(outbuff++)=Left2;
+ *(outbuff++)=Right;
+ *(outbuff++)=Left;
+#endif
+ }
+}
+
+
+static void MIXER (u32 inst1, u32 inst2) { // Fixed a sign issue... 03-14-01
+ u32 dmemin = (u16)(inst2 >> 0x10);
+ u32 dmemout = (u16)(inst2 & 0xFFFF);
+ //u8 flags = (u8)((inst1 >> 16) & 0xff);
+ s32 gain = (s16)(inst1 & 0xFFFF);
+ s32 temp;
+
+ if (AudioCount == 0)
+ return;
+
+ for (int x=0; x < AudioCount; x+=2) { // I think I can do this a lot easier
+ temp = (*(s16 *)(BufferSpace+dmemin+x) * gain) >> 15;
+ temp += *(s16 *)(BufferSpace+dmemout+x);
+
+ if ((s32)temp > 32767)
+ temp = 32767;
+ if ((s32)temp < -32768)
+ temp = -32768;
+
+ *(u16 *)(BufferSpace+dmemout+x) = (u16)(temp & 0xFFFF);
+ }
+}
+
+// TOP Performance Hogs:
+//Command: ADPCM - Calls: 48 - Total Time: 331226 - Avg Time: 6900.54 - Percent: 31.53%
+//Command: ENVMIXER - Calls: 48 - Total Time: 408563 - Avg Time: 8511.73 - Percent: 38.90%
+//Command: LOADBUFF - Calls: 56 - Total Time: 21551 - Avg Time: 384.84 - Percent: 2.05%
+//Command: RESAMPLE - Calls: 48 - Total Time: 225922 - Avg Time: 4706.71 - Percent: 21.51%
+
+//Command: ADPCM - Calls: 48 - Total Time: 391600 - Avg Time: 8158.33 - Percent: 32.52%
+//Command: ENVMIXER - Calls: 48 - Total Time: 444091 - Avg Time: 9251.90 - Percent: 36.88%
+//Command: LOADBUFF - Calls: 58 - Total Time: 29945 - Avg Time: 516.29 - Percent: 2.49%
+//Command: RESAMPLE - Calls: 48 - Total Time: 276354 - Avg Time: 5757.38 - Percent: 22.95%
+
+
+extern "C" const acmd_callback_t ABI1[0x10] = { // TOP Performace Hogs: MIXER, RESAMPLE, ENVMIXER
+ SPNOOP , ADPCM , CLEARBUFF, ENVMIXER , LOADBUFF, RESAMPLE , SAVEBUFF, UNKNOWN,
+ SETBUFF, SETVOL, DMEMMOVE , LOADADPCM , MIXER , INTERLEAVE, UNKNOWN , SETLOOP
+};
+
+/* BACKUPS
+void MIXER (u32 inst1, u32 inst2) { // Fixed a sign issue... 03-14-01
+ u16 dmemin = (u16)(inst2 >> 0x10);
+ u16 dmemout = (u16)(inst2 & 0xFFFF);
+ u16 gain = (u16)(inst1 & 0xFFFF);
+ u8 flags = (u8)((inst1 >> 16) & 0xff);
+ u64 temp;
+
+ if (AudioCount == 0)
+ return;
+
+ for (int x=0; x < AudioCount; x+=2) { // I think I can do this a lot easier
+ temp = (s64)(*(s16 *)(BufferSpace+dmemout+x)) * (s64)((s16)(0x7FFF)*2);
+
+ if (temp & 0x8000)
+ temp = (temp^0x8000) + 0x10000;
+ else
+ temp = (temp^0x8000);
+
+ temp = (temp & 0xFFFFFFFFFFFF);
+
+ temp += ((*(s16 *)(BufferSpace+dmemin+x) * (s64)((s16)gain*2))) & 0xFFFFFFFFFFFF;
+
+ temp = (s32)(temp >> 16);
+ if ((s32)temp > 32767)
+ temp = 32767;
+ if ((s32)temp < -32768)
+ temp = -32768;
+
+ *(u16 *)(BufferSpace+dmemout+x) = (u16)(temp & 0xFFFF);
+ }
+}
+*/
+
+