X-Git-Url: https://notaz.gp2x.de/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=source%2Fgles2glide64%2Fsrc%2FGlideHQ%2FTextureFilters.cpp;fp=source%2Fgles2glide64%2Fsrc%2FGlideHQ%2FTextureFilters.cpp;h=b46dcb566b707affaf46b6e2911a5e5a9d4aab2e;hb=98e75f2d18c02c233da543560f76282f04fc796c;hp=0000000000000000000000000000000000000000;hpb=0ced54f867d36e8b324155bef49e8abfebfc3237;p=mupen64plus-pandora.git diff --git a/source/gles2glide64/src/GlideHQ/TextureFilters.cpp b/source/gles2glide64/src/GlideHQ/TextureFilters.cpp new file mode 100644 index 0000000..b46dcb5 --- /dev/null +++ b/source/gles2glide64/src/GlideHQ/TextureFilters.cpp @@ -0,0 +1,702 @@ +/* +Copyright (C) 2003 Rice1964 + +This program is free software; you can redistribute it and/or +modify it under the terms of the GNU General Public License +as published by the Free Software Foundation; either version 2 +of the License, or (at your option) any later version. + +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with this program; if not, write to the Free Software +Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. + +*/ + +/* Copyright (C) 2007 Hiroshi Morii + * Modified for the Texture Filtering library + */ + +#include +#include "TextureFilters.h" + +/************************************************************************/ +/* 2X filters */ +/************************************************************************/ + +#define DWORD_MAKE(r, g, b, a) ((uint32) (((a) << 24) | ((r) << 16) | ((g) << 8) | (b))) +#define WORD_MAKE(r, g, b, a) ((uint16) (((a) << 12) | ((r) << 8) | ((g) << 4) | (b))) + +// Basic 2x R8G8B8A8 filter with interpolation + +void Texture2x_32(uint8 *srcPtr, uint32 srcPitch, uint8 *dstPtr, uint32 dstPitch, int width, int height) +{ + uint32 *pDst1, *pDst2; + uint32 *pSrc, *pSrc2; + uint32 nWidth = width; + uint32 nHeight = height; + + uint32 b1; + uint32 g1; + uint32 r1; + uint32 a1; + uint32 b2; + uint32 g2; + uint32 r2; + uint32 a2; + uint32 b3; + uint32 g3; + uint32 r3; + uint32 a3; + uint32 b4; + uint32 g4; + uint32 r4; + uint32 a4; + + uint32 xSrc; + uint32 ySrc; + + for (ySrc = 0; ySrc < nHeight; ySrc++) + { + pSrc = (uint32*)(((uint8*)srcPtr)+ySrc*srcPitch); + pSrc2 = (uint32*)(((uint8*)srcPtr)+(ySrc+1)*srcPitch); + pDst1 = (uint32*)(((uint8*)dstPtr)+(ySrc*2)*dstPitch); + pDst2 = (uint32*)(((uint8*)dstPtr)+(ySrc*2+1)*dstPitch); + + for (xSrc = 0; xSrc < nWidth; xSrc++) + { + b1 = (pSrc[xSrc]>>0)&0xFF; + g1 = (pSrc[xSrc]>>8)&0xFF; + r1 = (pSrc[xSrc]>>16)&0xFF; + a1 = (pSrc[xSrc]>>24)&0xFF; + + // Pixel 1 + pDst1[xSrc*2] = pSrc[xSrc]; + + // Pixel 2 + if( xSrc>0)&0xFF; + g2 = (pSrc[xSrc+1]>>8)&0xFF; + r2 = (pSrc[xSrc+1]>>16)&0xFF; + a2 = (pSrc[xSrc+1]>>24)&0xFF; + pDst1[xSrc*2+1] = DWORD_MAKE((r1+r2)/2, (g1+g2)/2, (b1+b2)/2, (a1+a2)/2); + } + else + pDst1[xSrc*2+1] = pSrc[xSrc]; + + // Pixel 3 + if( ySrc>0)&0xFF; + g3 = (pSrc2[xSrc]>>8)&0xFF; + r3 = (pSrc2[xSrc]>>16)&0xFF; + a3 = (pSrc2[xSrc]>>24)&0xFF; + pDst2[xSrc*2] = DWORD_MAKE((r1+r3)/2, (g1+g3)/2, (b1+b3)/2, (a1+a3)/2); + if( xSrc>0)&0xFF; + g4 = (pSrc2[xSrc+1]>>8)&0xFF; + r4 = (pSrc2[xSrc+1]>>16)&0xFF; + a4 = (pSrc2[xSrc+1]>>24)&0xFF; + // Pixel 4 + pDst2[xSrc*2+1] = DWORD_MAKE((r1+r2+r3+r4)/4, (g1+g2+g3+g4)/4, (b1+b2+b3+b4)/4, (a1+a2+a3+a4)/4); + } + else + { + // Pixel 4 + pDst2[xSrc*2+1] = DWORD_MAKE((r1+r3)/2, (g1+g3)/2, (b1+b3)/2, (a1+a3)/2); + } + } + else + { + // Pixel 3 + pDst2[xSrc*2] = pSrc[xSrc]; + // Pixel 4 + if( xSrc> 0)&0xF; + g1 = (pSrc[xSrc]>> 4)&0xF; + r1 = (pSrc[xSrc]>> 8)&0xF; + a1 = (pSrc[xSrc]>>12)&0xF; + + if( xSrc> 0)&0xF; + g2 = (pSrc[xSrc+1]>> 4)&0xF; + r2 = (pSrc[xSrc+1]>> 8)&0xF; + a2 = (pSrc[xSrc+1]>>12)&0xF; + } + + if( ySrc> 0)&0xF; + g3 = (pSrc2[xSrc]>> 4)&0xF; + r3 = (pSrc2[xSrc]>> 8)&0xF; + a3 = (pSrc2[xSrc]>>12)&0xF; + if( xSrc> 0)&0xF; + g4 = (pSrc2[xSrc+1]>> 4)&0xF; + r4 = (pSrc2[xSrc+1]>> 8)&0xF; + a4 = (pSrc2[xSrc+1]>>12)&0xF; + } + } + + // Pixel 1 + pDst1[xSrc*2] = pSrc[xSrc]; + + // Pixel 2 + if( xSrc + */ +void SharpFilter_8888(uint32 *src, uint32 srcwidth, uint32 srcheight, uint32 *dest, uint32 filter) +{ + // NOTE: for now we get away with copying the boundaries + // filter the boundaries if we face problems + + uint32 mul1, mul2, mul3, shift4; + + uint32 x,y,z; + uint32 *_src1, *_src2, *_src3, *_dest; + uint32 val[4]; + uint32 t1,t2,t3,t4,t5,t6,t7,t8,t9; + + switch( filter ) + { + case SHARP_FILTER_2: + mul1=1; + mul2=8; + mul3=12; + shift4=2; + break; + case SHARP_FILTER_1: + default: + mul1=1; + mul2=8; + mul3=16; + shift4=3; + break; + } + + // setup rows + _src1 = src; + _src2 = _src1 + srcwidth; + _src3 = _src2 + srcwidth; + _dest = dest; + + // copy the first row + memcpy(_dest, _src1, (srcwidth << 2)); + _dest += srcwidth; + // filter 2nd row to 1 row before the last + for (y = 1; y < srcheight-1; y++) { + // copy the first pixel + _dest[0] = *_src2; + // filter 2nd pixel to 1 pixel before last + for (x = 1; x < srcwidth-1; x++) { + for (z=0; z<4; z++) { + t1 = *((uint8*)(_src1+x-1)+z); + t2 = *((uint8*)(_src1+x )+z); + t3 = *((uint8*)(_src1+x+1)+z); + t4 = *((uint8*)(_src2+x-1)+z); + t5 = *((uint8*)(_src2+x )+z); + t6 = *((uint8*)(_src2+x+1)+z); + t7 = *((uint8*)(_src3+x-1)+z); + t8 = *((uint8*)(_src3+x )+z); + t9 = *((uint8*)(_src3+x+1)+z); + + if( (t5*mul2) > (t1+t3+t7+t9+t2+t4+t6+t8)*mul1 ) { + val[z]= ((t5*mul3) - (t1+t3+t7+t9+t2+t4+t6+t8)*mul1)>>shift4; + if (val[z] > 0xFF) val[z] = 0xFF; + } else { + val[z] = t5; + } + } + _dest[x] = val[0]|(val[1]<<8)|(val[2]<<16)|(val[3]<<24); + } + // copy the ending pixel + _dest[srcwidth-1] = *(_src3 - 1); + // next row + _src1 += srcwidth; + _src2 += srcwidth; + _src3 += srcwidth; + _dest += srcwidth; + } + // copy the last row + memcpy(_dest, _src2, (srcwidth << 2)); +} + +#if !_16BPP_HACK +void SharpFilter_4444(uint16 *src, uint32 srcwidth, uint32 srcheight, uint16 *dest, uint32 filter) +{ + // NOTE: for now we get away with copying the boundaries + // filter the boundaries if we face problems + + uint16 mul1, mul2, mul3, shift4; + + uint32 x,y,z; + uint16 *_src1, *_src2, *_src3, *_dest; + uint16 val[4]; + uint16 t1,t2,t3,t4,t5,t6,t7,t8,t9; + + switch( filter ) { + case SHARP_FILTER_2: + mul1=1; + mul2=8; + mul3=12; + shift4=2; + break; + case SHARP_FILTER_1: + default: + mul1=1; + mul2=8; + mul3=16; + shift4=3; + break; + } + + // setup rows + _src1 = src; + _src2 = _src1 + srcwidth; + _src3 = _src2 + srcwidth; + _dest = dest; + + // copy the first row + memcpy(_dest, _src1, (srcwidth << 1)); + _dest += srcwidth; + // filter 2nd row to 1 row before the last + for( y = 1; y < srcheight - 1; y++) { + // copy the first pixel + _dest[0] = *_src2; + // filter 2nd pixel to 1 pixel before last + for( x = 1; x < srcwidth - 1; x++) { + for( z = 0; z < 4; z++ ) { + /* Hiroshi Morii + * Read the entire 16bit pixel and then extract the A,R,G,B components. + */ + uint32 shift = z << 2; + t1 = ((*((uint16*)(_src1+x-1))) >> shift) & 0xF; + t2 = ((*((uint16*)(_src1+x ))) >> shift) & 0xF; + t3 = ((*((uint16*)(_src1+x+1))) >> shift) & 0xF; + t4 = ((*((uint16*)(_src2+x-1))) >> shift) & 0xF; + t5 = ((*((uint16*)(_src2+x ))) >> shift) & 0xF; + t6 = ((*((uint16*)(_src2+x+1))) >> shift) & 0xF; + t7 = ((*((uint16*)(_src3+x-1))) >> shift) & 0xF; + t8 = ((*((uint16*)(_src3+x ))) >> shift) & 0xF; + t9 = ((*((uint16*)(_src3+x+1))) >> shift) & 0xF; + + if( (t5*mul2) > (t1+t3+t7+t9+t2+t4+t6+t8)*mul1 ) { + val[z] = ((t5*mul3) - (t1+t3+t7+t9+t2+t4+t6+t8)*mul1)>>shift4; + if (val[z] > 0xF) val[z] = 0xF; + } else { + val[z] = t5; + } + } + _dest[x] = val[0]|(val[1]<<4)|(val[2]<<8)|(val[3]<<12); + } + // copy the ending pixel + _dest[srcwidth-1] = *(_src3 - 1); + // next row + _src1 += srcwidth; + _src2 += srcwidth; + _src3 += srcwidth; + _dest += srcwidth; + } + // copy the last row + memcpy(_dest, _src2, (srcwidth << 1)); +} +#endif /* !_16BPP_HACK */ + +/* + * Smooth filters + * Hiroshi Morii + */ +void SmoothFilter_8888(uint32 *src, uint32 srcwidth, uint32 srcheight, uint32 *dest, uint32 filter) +{ + // NOTE: for now we get away with copying the boundaries + // filter the boundaries if we face problems + + uint32 mul1, mul2, mul3, shift4; + + uint32 x,y,z; + uint32 *_src1, *_src2, *_src3, *_dest; + uint32 val[4]; + uint32 t1,t2,t3,t4,t5,t6,t7,t8,t9; + + switch( filter ) { + case SMOOTH_FILTER_4: + mul1=1; + mul2=2; + mul3=4; + shift4=4; + break; + case SMOOTH_FILTER_3: + mul1=1; + mul2=1; + mul3=8; + shift4=4; + break; + case SMOOTH_FILTER_2: + mul1=1; + mul2=1; + mul3=2; + shift4=2; + break; + case SMOOTH_FILTER_1: + default: + mul1=1; + mul2=1; + mul3=6; + shift4=3; + break; + } + + switch (filter) { + case SMOOTH_FILTER_3: + case SMOOTH_FILTER_4: + // setup rows + _src1 = src; + _src2 = _src1 + srcwidth; + _src3 = _src2 + srcwidth; + _dest = dest; + // copy the first row + memcpy(_dest, _src1, (srcwidth << 2)); + _dest += srcwidth; + // filter 2nd row to 1 row before the last + for (y = 1; y < srcheight - 1; y++){ + // copy the first pixel + _dest[0] = _src2[0]; + // filter 2nd pixel to 1 pixel before last + for (x = 1; x < srcwidth - 1; x++) { + for (z = 0; z < 4; z++ ) { + t1 = *((uint8*)(_src1+x-1)+z); + t2 = *((uint8*)(_src1+x )+z); + t3 = *((uint8*)(_src1+x+1)+z); + t4 = *((uint8*)(_src2+x-1)+z); + t5 = *((uint8*)(_src2+x )+z); + t6 = *((uint8*)(_src2+x+1)+z); + t7 = *((uint8*)(_src3+x-1)+z); + t8 = *((uint8*)(_src3+x )+z); + t9 = *((uint8*)(_src3+x+1)+z); + /* the component value must not overflow 0xFF */ + val[z] = ((t1+t3+t7+t9)*mul1+((t2+t4+t6+t8)*mul2)+(t5*mul3))>>shift4; + if (val[z] > 0xFF) val[z] = 0xFF; + } + _dest[x] = val[0]|(val[1]<<8)|(val[2]<<16)|(val[3]<<24); + } + // copy the ending pixel + _dest[srcwidth-1] = *(_src3 - 1); + // next row + _src1 += srcwidth; + _src2 += srcwidth; + _src3 += srcwidth; + _dest += srcwidth; + } + // copy the last row + memcpy(_dest, _src2, (srcwidth << 2)); + break; + case SMOOTH_FILTER_1: + case SMOOTH_FILTER_2: + default: + // setup rows + _src1 = src; + _src2 = _src1 + srcwidth; + _src3 = _src2 + srcwidth; + _dest = dest; + // copy the first row + memcpy(_dest, _src1, (srcwidth << 2)); + _dest += srcwidth; + // filter 2nd row to 1 row before the last + for (y = 1; y < srcheight - 1; y++) { + // filter 1st pixel to the last + if (y & 1) { + for( x = 0; x < srcwidth; x++) { + for( z = 0; z < 4; z++ ) { + t2 = *((uint8*)(_src1+x )+z); + t5 = *((uint8*)(_src2+x )+z); + t8 = *((uint8*)(_src3+x )+z); + /* the component value must not overflow 0xFF */ + val[z] = ((t2+t8)*mul2+(t5*mul3))>>shift4; + if (val[z] > 0xFF) val[z] = 0xFF; + } + _dest[x] = val[0]|(val[1]<<8)|(val[2]<<16)|(val[3]<<24); + } + } else { + memcpy(_dest, _src2, (srcwidth << 2)); + } + // next row + _src1 += srcwidth; + _src2 += srcwidth; + _src3 += srcwidth; + _dest += srcwidth; + } + // copy the last row + memcpy(_dest, _src2, (srcwidth << 2)); + break; + } +} + +#if !_16BPP_HACK +void SmoothFilter_4444(uint16 *src, uint32 srcwidth, uint32 srcheight, uint16 *dest, uint32 filter) +{ + // NOTE: for now we get away with copying the boundaries + // filter the boundaries if we face problems + + uint16 mul1, mul2, mul3, shift4; + + uint32 x,y,z; + uint16 *_src1, *_src2, *_src3, *_dest; + uint16 val[4]; + uint16 t1,t2,t3,t4,t5,t6,t7,t8,t9; + + switch( filter ) { + case SMOOTH_FILTER_4: + mul1=1; + mul2=2; + mul3=4; + shift4=4; + break; + case SMOOTH_FILTER_3: + mul1=1; + mul2=1; + mul3=8; + shift4=4; + break; + case SMOOTH_FILTER_2: + mul1=1; + mul2=1; + mul3=2; + shift4=2; + break; + case SMOOTH_FILTER_1: + default: + mul1=1; + mul2=1; + mul3=6; + shift4=3; + break; + } + + switch (filter) { + case SMOOTH_FILTER_3: + case SMOOTH_FILTER_4: + // setup rows + _src1 = src; + _src2 = _src1 + srcwidth; + _src3 = _src2 + srcwidth; + _dest = dest; + // copy the first row + memcpy(_dest, _src1, (srcwidth << 1)); + _dest += srcwidth; + // filter 2nd row to 1 row before the last + for (y = 1; y < srcheight - 1; y++) { + // copy the first pixel + _dest[0] = *_src2; + // filter 2nd pixel to 1 pixel before last + for (x = 1; x < srcwidth - 1; x++) { + for (z = 0; z < 4; z++ ) { + /* Read the entire 16bit pixel and then extract the A,R,G,B components. */ + uint32 shift = z << 2; + t1 = ((*(uint16*)(_src1+x-1)) >> shift) & 0xF; + t2 = ((*(uint16*)(_src1+x )) >> shift) & 0xF; + t3 = ((*(uint16*)(_src1+x+1)) >> shift) & 0xF; + t4 = ((*(uint16*)(_src2+x-1)) >> shift) & 0xF; + t5 = ((*(uint16*)(_src2+x )) >> shift) & 0xF; + t6 = ((*(uint16*)(_src2+x+1)) >> shift) & 0xF; + t7 = ((*(uint16*)(_src3+x-1)) >> shift) & 0xF; + t8 = ((*(uint16*)(_src3+x )) >> shift) & 0xF; + t9 = ((*(uint16*)(_src3+x+1)) >> shift) & 0xF; + /* the component value must not overflow 0xF */ + val[z] = ((t1+t3+t7+t9)*mul1+((t2+t4+t6+t8)*mul2)+(t5*mul3))>>shift4; + if (val[z] > 0xF) val[z] = 0xF; + } + _dest[x] = val[0]|(val[1]<<4)|(val[2]<<8)|(val[3]<<12); + } + // copy the ending pixel + _dest[srcwidth-1] = *(_src3 - 1); + // next row + _src1 += srcwidth; + _src2 += srcwidth; + _src3 += srcwidth; + _dest += srcwidth; + } + // copy the last row + memcpy(_dest, _src2, (srcwidth << 1)); + break; + case SMOOTH_FILTER_1: + case SMOOTH_FILTER_2: + default: + // setup rows + _src1 = src; + _src2 = _src1 + srcwidth; + _src3 = _src2 + srcwidth; + _dest = dest; + // copy the first row + memcpy(_dest, _src1, (srcwidth << 1)); + _dest += srcwidth; + // filter 2nd row to 1 row before the last + for( y = 1; y < srcheight - 1; y++) { + if (y & 1) { + for( x = 0; x < srcwidth; x++) { + for( z = 0; z < 4; z++ ) { + /* Read the entire 16bit pixel and then extract the A,R,G,B components. */ + uint32 shift = z << 2; + t2 = ((*(uint16*)(_src1+x)) >> shift) & 0xF; + t5 = ((*(uint16*)(_src2+x)) >> shift) & 0xF; + t8 = ((*(uint16*)(_src3+x)) >> shift) & 0xF; + /* the component value must not overflow 0xF */ + val[z] = ((t2+t8)*mul2+(t5*mul3))>>shift4; + if (val[z] > 0xF) val[z] = 0xF; + } + _dest[x] = val[0]|(val[1]<<4)|(val[2]<<8)|(val[3]<<12); + } + } else { + memcpy(_dest, _src2, (srcwidth << 1)); + } + // next row + _src1 += srcwidth; + _src2 += srcwidth; + _src3 += srcwidth; + _dest += srcwidth; + } + // copy the last row + memcpy(_dest, _src2, (srcwidth << 1)); + break; + } +} +#endif /* !_16BPP_HACK */ + +void filter_8888(uint32 *src, uint32 srcwidth, uint32 srcheight, uint32 *dest, uint32 filter) { + switch (filter & ENHANCEMENT_MASK) { + case HQ4X_ENHANCEMENT: + hq4x_8888((uint8*)src, (uint8*)dest, srcwidth, srcheight, srcwidth, (srcwidth << 4)); + return; + case HQ2X_ENHANCEMENT: + hq2x_32((uint8*)src, (srcwidth << 2), (uint8*)dest, (srcwidth << 3), srcwidth, srcheight); + return; + case HQ2XS_ENHANCEMENT: + hq2xS_32((uint8*)src, (srcwidth << 2), (uint8*)dest, (srcwidth << 3), srcwidth, srcheight); + return; + case LQ2X_ENHANCEMENT: + lq2x_32((uint8*)src, (srcwidth << 2), (uint8*)dest, (srcwidth << 3), srcwidth, srcheight); + return; + case LQ2XS_ENHANCEMENT: + lq2xS_32((uint8*)src, (srcwidth << 2), (uint8*)dest, (srcwidth << 3), srcwidth, srcheight); + return; + case X2SAI_ENHANCEMENT: + Super2xSaI_8888((uint32*)src, (uint32*)dest, srcwidth, srcheight, srcwidth); + return; + case X2_ENHANCEMENT: + Texture2x_32((uint8*)src, (srcwidth << 2), (uint8*)dest, (srcwidth << 3), srcwidth, srcheight); + return; + } + + switch (filter & (SMOOTH_FILTER_MASK|SHARP_FILTER_MASK)) { + case SMOOTH_FILTER_1: + case SMOOTH_FILTER_2: + case SMOOTH_FILTER_3: + case SMOOTH_FILTER_4: + SmoothFilter_8888((uint32*)src, srcwidth, srcheight, (uint32*)dest, (filter & SMOOTH_FILTER_MASK)); + return; + case SHARP_FILTER_1: + case SHARP_FILTER_2: + SharpFilter_8888((uint32*)src, srcwidth, srcheight, (uint32*)dest, (filter & SHARP_FILTER_MASK)); + return; + } +}