d->spos = s->spos;\r
  d->sinc = s->sinc;\r
  memcpy(d->SB, s->SB, sizeof(d->SB));\r
- d->pStart = s->pStart;\r
- d->pCurr = s->pCurr;\r
- d->pLoop = s->pLoop;\r
+ d->pStart = (void *)((long)s->pStart & 0x7fff0);\r
+ d->pCurr = (void *)((long)s->pCurr & 0x7fff0);\r
+ d->pLoop = (void *)((long)s->pLoop & 0x7fff0);\r
  if (s->bOn) dwChannelOn |= 1<<ch;\r
  d->bStop = s->bStop;\r
  d->bReverb = s->bReverb;\r
    pFO->spuAddr=spuAddr;\r
    if(pFO->spuAddr==0) pFO->spuAddr=0xbaadf00d;\r
 \r
+   dwChannelOn&=~dwPendingChanOff;\r
+   dwPendingChanOff=0;\r
+\r
    for(i=0;i<MAXCHAN;i++)\r
     {\r
      save_channel(&pFO->s_chan[i],&s_chan[i],i);\r
   SPUplayADPCMchannel(&pF->xaS);\r
 \r
  xapGlobal=0;\r
+ dwPendingChanOff=0;\r
 \r
  if(!strcmp(pF->szSPUName,"PBOSS") && pF->ulFreezeVersion==5)\r
    LoadStateV5(pF);\r
  pFO=(SPUOSSFreeze_t *)(pF+1);\r
 \r
  spuIrq = pFO->spuIrq;\r
- if(pFO->pSpuIrq) pSpuIrq = pFO->pSpuIrq+spuMemC; else pSpuIrq=NULL;\r
+ if(pFO->pSpuIrq) pSpuIrq = spuMemC+((long)pFO->pSpuIrq&0x7fff0); else pSpuIrq=NULL;\r
 \r
  if(pFO->spuAddr)\r
   {\r
 
 #define _IN_SPU
 
 #include "externals.h"
+#include "registers.h"
 #include "cfg.h"
 #include "dsoundoss.h"
 #include "regs.h"
 
 unsigned long dwNewChannel=0;                          // flags for faster testing, if new channel starts
 unsigned long dwChannelOn=0;
+unsigned long dwPendingChanOff=0;                      // per-channel bit flags: set when a block has the stop flag without the loop bit, channel is switched off at its next decode_block()
 
 void (CALLBACK *irqCallback)(void)=0;                  // func of main emu, called on spu irq
 void (CALLBACK *cddavCallback)(unsigned short,unsigned short)=0;
  return fa;
 }
 
+static void do_irq(void)                  // raise the spu irq: set STAT_IRQ in spuStat and notify the main emu, at most once while the flag stays set
+{
+ if(!(spuStat & STAT_IRQ))                // irq flag not set yet? (otherwise: nothing to do)
+ {
+  spuStat |= STAT_IRQ;                    // -> set the flag first, so repeated calls don't fire the callback again
+  if(irqCallback) irqCallback();          // -> call main emu, if it has registered a callback
+ }
+}
+
 static int decode_block(int ch)
 {
  unsigned char *start;
  s_chan[ch].iSBPos=0;
 
  start=s_chan[ch].pCurr;                   // set up the current pos
- if (start == (unsigned char*)-1)          // special "stop" sign
+ if(start == (unsigned char*)-1 ||         // special "stop" sign
+    (dwPendingChanOff&(1<<ch)))
  {
   dwChannelOn&=~(1<<ch);                   // -> turn everything off
+  dwPendingChanOff&=~(1<<ch);
   s_chan[ch].bStop=1;
   s_chan[ch].ADSRX.EnvelopeVol=0;
   return 0;                                // -> and done for this channel
  }
 
- //////////////////////////////////////////// spu irq handler here? mmm... do it later
+ //////////////////////////////////////////// irq check
+
+ if(spuCtrl&CTRL_IRQ)
+ {
+  if(pSpuIrq == start)                     // irq address reached?
+  {
+   do_irq();                               // -> call main emu
+   ret = 1;
+  }
+ }
 
  s_1=s_chan[ch].s_1;
  s_2=s_chan[ch].s_2;
   s_chan[ch].SB[nSample++]=fa;
  }
 
- //////////////////////////////////////////// irq check
-
- if(irqCallback && (spuCtrl&0x40))         // some callback and irq active?
- {
-  if((pSpuIrq >  start-16 &&              // irq address reached?
-     pSpuIrq <= start) ||
-    ((flags&1) &&                        // special: irq on looping addr, when stop/loop flag is set 
-     (pSpuIrq >  s_chan[ch].pLoop-16 &&
-      pSpuIrq <= s_chan[ch].pLoop)))
-  {
-   irqCallback();                        // -> call main emu
-   ret = 1;
-  }
- }
-
  //////////////////////////////////////////// flag handler
 
  if((flags&4) && (!s_chan[ch].bIgnoreLoop))
 
  if(flags&1)                               // 1: stop/loop
  {
-  // We play this block out first...
-  //if(!(flags&2))                         // 1+2: do loop... otherwise: stop
-  if(flags!=3 && flags!=7)                 // PETE: if we don't check exactly for 3, loop hang ups will happen (DQ4, for example)
-  {
-   start = (unsigned char*)-1;
-  }
-  else
-  {
-   start = s_chan[ch].pLoop;
-  }
+  if(!(flags&2))
+   dwPendingChanOff|=1<<ch;
+
+  start = s_chan[ch].pLoop;
  }
 
  if (start - spuMemC >= 0x80000)
   // an IRQ. Only problem: the "wait for cpu" option is kinda hard to do here
   // in some of Peops timer modes. So: we ignore this option here (for now).
 
-  if(pMixIrq && irqCallback)
+  if(pMixIrq)
    {
     for(ns=0;ns<NSSIZE;ns++)
      {
         for(ch=0;ch<4;ch++)
          {
           if(pSpuIrq>=pMixIrq+(ch*0x400) && pSpuIrq<pMixIrq+(ch*0x400)+2)
-           irqCallback();
+           do_irq();
          }
        }
       pMixIrq+=2;if(pMixIrq>spuMemC+0x3ff) pMixIrq=spuMemC;