X-Git-Url: https://notaz.gp2x.de/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=src%2Fvideo%2FSDL_blit_A.c;h=565879d550ad42b878bcaa103d4004498ef4c9da;hb=bdfa698900e2b6c8601b77004a8ba91f5b30dbb6;hp=2c52209e647908f98e967b13466a1bbaecaa5783;hpb=211e4bff4e12acc0da1a752980c484604975c396;p=sdl_omap.git diff --git a/src/video/SDL_blit_A.c b/src/video/SDL_blit_A.c index 2c52209..565879d 100644 --- a/src/video/SDL_blit_A.c +++ b/src/video/SDL_blit_A.c @@ -61,6 +61,53 @@ /* Functions to perform alpha blended blitting */ +#ifdef __ARM_NEON__ + +/* NEON optimized blitter callers */ +#define make_neon_caller(name, neon_name) \ +extern void neon_name(void *dst, const void *src, int count); \ +static void name(SDL_BlitInfo *info) \ +{ \ + int width = info->d_width; \ + int height = info->d_height; \ + Uint8 *src = info->s_pixels; \ + Uint8 *dst = info->d_pixels; \ + int srcskip = info->s_skip; \ + int dstskip = info->d_skip; \ +\ + while ( height-- ) { \ + neon_name(dst, src, width); \ + src += width * 4 + srcskip; \ + dst += width * 4 + dstskip; \ + } \ +} + +#define make_neon_callerS(name, neon_name) \ +extern void neon_name(void *dst, const void *src, int count, unsigned int alpha); \ +static void name(SDL_BlitInfo *info) \ +{ \ + int width = info->d_width; \ + int height = info->d_height; \ + Uint8 *src = info->s_pixels; \ + Uint8 *dst = info->d_pixels; \ + int srcskip = info->s_skip; \ + int dstskip = info->d_skip; \ + unsigned alpha = info->src->alpha;\ +\ + while ( height-- ) { \ + neon_name(dst, src, width, alpha); \ + src += width * 4 + srcskip; \ + dst += width * 4 + dstskip; \ + } \ +} + +make_neon_caller(BlitABGRtoXRGBalpha_neon, neon_ABGRtoXRGBalpha) +make_neon_caller(BlitARGBtoXRGBalpha_neon, neon_ARGBtoXRGBalpha) +make_neon_callerS(BlitABGRtoXRGBalphaS_neon, neon_ABGRtoXRGBalphaS) +make_neon_callerS(BlitARGBtoXRGBalphaS_neon, neon_ARGBtoXRGBalphaS) + +#endif /* __ARM_NEON__ */ + /* N->1 blending with per-surface alpha */ static void BlitNto1SurfaceAlpha(SDL_BlitInfo *info) { @@ -2805,6 +2852,12 @@ SDL_loblit SDL_CalculateAlphaBlit(SDL_Surface *surface, int blit_index) && sf->Bshift % 8 == 0 && SDL_HasMMX()) return BlitRGBtoRGBSurfaceAlphaMMX; +#endif +#ifdef __ARM_NEON__ + if(sf->Rshift % 8 == 0 + && sf->Gshift % 8 == 0 + && sf->Bshift % 8 == 0) + return BlitARGBtoXRGBalphaS_neon; #endif if((sf->Rmask | sf->Gmask | sf->Bmask) == 0xffffff) { @@ -2879,10 +2932,21 @@ SDL_loblit SDL_CalculateAlphaBlit(SDL_Surface *surface, int blit_index) if(!(surface->map->dst->flags & SDL_HWSURFACE) && SDL_HasAltiVec()) return BlitRGBtoRGBPixelAlphaAltivec; +#endif +#ifdef __ARM_NEON__ + return BlitARGBtoXRGBalpha_neon; #endif return BlitRGBtoRGBPixelAlpha; } } +#ifdef __ARM_NEON__ + if (sf->Gmask == df->Gmask && sf->Amask == 0xff000000 && + ((sf->Rmask == 0xff && df->Rmask == 0xff0000 && sf->Bmask == 0xff0000 && df->Bmask == 0xff) || + (sf->Rmask == 0xff0000 && df->Rmask == 0xff && sf->Bmask == 0xff && df->Bmask == 0xff0000))) + { + return BlitABGRtoXRGBalpha_neon; + } +#endif #if SDL_ALTIVEC_BLITTERS if (sf->Amask && sf->BytesPerPixel == 4 && !(surface->map->dst->flags & SDL_HWSURFACE) && SDL_HasAltiVec())