gpu_neon: new intrinsics-only implementation
[pcsx_rearmed.git] / frontend / cspace.c
CommitLineData
c9099d02 1/*
2 * (C) Gražvydas "notaz" Ignotas, 2011,2012
3 *
4 * This work is licensed under the terms of any of these licenses
5 * (at your option):
6 * - GNU GPL, version 2 or later.
7 * - GNU LGPL, version 2.1 or later.
8 * See the COPYING file in the top-level directory.
9 */
10
a80ae4a0 11#include "cspace.h"
12
4ea7de6a 13/*
14 * note: these are intended for testing and should be avoided
15 * in favor of NEON version or platform-specific conversion
16 */
17
ae8f89db
PC
/*
 * LE16TOHx2(x): x is a 32-bit word holding two little-endian 16-bit
 * values; the result holds the same two values in host byte order.
 * On little-endian hosts this is the identity.
 * Note: on big-endian hosts the argument is evaluated twice.
 */
#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
#define SWAP16(x) __builtin_bswap16(x)
/*
 * The cast keeps the shift unsigned: the swapped halfword would otherwise
 * be promoted to int, and shifting a value with bit 15 set left by 16
 * overflows a signed int.
 */
#define LE16TOHx2(x) (((unsigned int)SWAP16((x) >> 16) << 16) | SWAP16(x))
#else
#define LE16TOHx2(x) (x)
#endif
24
d57557c0 25#ifndef __arm__
c9099d02 26
/*
 * Convert 16-bit pixels, two at a time, by rearranging the 5-bit fields
 * of each halfword:
 *   source bits  0..4  -> destination bits 11..15
 *   source bits  5..9  -> destination bits  6..10
 *   source bits 10..14 -> destination bits  0..4
 * Source bit 15 is dropped and destination bit 5 is always zero.
 *
 * dst_, src_: buffers accessed as 32-bit words.
 * bytes:      size of the source data; bytes / 4 words are converted,
 *             any remainder (bytes % 4) is left untouched.
 *
 * The source is read through LE16TOHx2(), i.e. as little-endian 16-bit
 * values; the result is stored in host byte order.
 */
void bgr555_to_rgb565(void *dst_, const void *src_, int bytes)
{
	const unsigned int *src = src_;
	unsigned int *dst = dst_;
	unsigned int words, x, p, r, g, b;

	/*
	 * Comparing an unsigned index against "bytes / 4" would convert a
	 * negative size into a huge unsigned bound, so reject it up front.
	 */
	if (bytes <= 0)
		return;
	words = (unsigned int)bytes / 4;

	for (x = 0; x < words; x++) {
		p = LE16TOHx2(src[x]);

		/* the masks cover the same field in both 16-bit halves */
		r = (p & 0x001f001f) << 11;
		g = (p & 0x03e003e0) << 1;
		b = (p & 0x7c007c00) >> 10;

		dst[x] = r | g | b;
	}
}
43
d57557c0 44#endif
45
46#ifndef __ARM_NEON__
47
/*
 * Pack one 3-byte pixel into a 16-bit 5:6:5 value:
 * top 5 bits of byte 0 -> bits 11..15, top 6 bits of byte 1 -> bits 5..10,
 * top 5 bits of byte 2 -> bits 0..4.
 */
static unsigned int cspace_pack888_565(const unsigned char *px)
{
	unsigned int hi = px[0] & 0xf8;
	unsigned int mid = px[1] & 0xfc;
	unsigned int lo = px[2] & 0xf8;

	return (hi << 8) | (mid << 3) | (lo >> 3);
}

/*
 * Convert 24-bit pixels to 16-bit 5:6:5 pixels, two pixels per step.
 *
 * dst_:  output, written as 32-bit words (one word per pixel pair).
 * src_:  input, 3 bytes per pixel.
 * bytes: size of the input; only whole 6-byte pairs are converted,
 *        a trailing partial pair is ignored.
 *
 * The first pixel of each pair ends up in the lower-addressed halfword
 * of the output word on both little- and big-endian hosts.
 */
void bgr888_to_rgb565(void *dst_, const void *src_, int bytes)
{
	const unsigned char *in = src_;
	unsigned int *out = dst_;
	unsigned int first, second;

	while (bytes >= 6) {
		first = cspace_pack888_565(in);
		second = cspace_pack888_565(in + 3);
#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
		*out = (first << 16) | second;
#else
		*out = (second << 16) | first;
#endif
		out++;
		in += 6;
		bytes -= 6;
	}
}
70
a80ae4a0 71// TODO?
/*
 * Placeholder used when __ARM_NEON__ is not defined: there is no C
 * implementation here, so the call leaves both buffers untouched.
 */
void rgb888_to_rgb565(void *dst, const void *src, int bytes)
{
	/* intentionally empty */
	(void)dst;
	(void)src;
	(void)bytes;
}
/*
 * Placeholder used when __ARM_NEON__ is not defined: there is no C
 * implementation here, so the call leaves both buffers untouched.
 */
void bgr888_to_rgb888(void *dst, const void *src, int bytes)
{
	/* intentionally empty */
	(void)dst;
	(void)src;
	(void)bytes;
}
a80ae4a0 74
c9099d02 75#endif // __ARM_NEON__
76
77/* YUV stuff */
/*
 * Lookup tables for the *_to_uyvy converters, filled by bgr_to_uyvy_init():
 *  yuv_ry/gy/by - luma contribution of a 5-bit component, 16.16 fixed point
 *  yuv_u/yuv_v  - chroma for a (component - luma) difference of -32..31,
 *                 stored at index difference + 32
 */
static int yuv_ry[32], yuv_gy[32], yuv_by[32];
static unsigned char yuv_u[32 * 2], yuv_v[32 * 2];

/* Limit a chroma value to the 0..255 range of a table entry. */
static int yuv_clamp_u8(int c)
{
	if (c < 0)
		return 0;
	return c > 255 ? 255 : c;
}

/*
 * Fill the YUV lookup tables.
 *
 * The tables tabulate this conversion for 5-bit components:
 *   y = (int)((0.299f * r) + (0.587f * g) + (0.114f * b));
 *   u = (int)(8 * 0.565f * (b - y)) + 128;
 *   v = (int)(8 * 0.713f * (r - y)) + 128;
 * with u and v clamped to 0..255.
 */
void bgr_to_uyvy_init(void)
{
	int level, slot, diff;

	/* luma weights scaled by 65536, rounded to nearest */
	for (level = 0; level < 32; level++) {
		yuv_ry[level] = (int)(0.299f * level * 65536.0f + 0.5f);
		yuv_gy[level] = (int)(0.587f * level * 65536.0f + 0.5f);
		yuv_by[level] = (int)(0.114f * level * 65536.0f + 0.5f);
	}

	/* slot 0 corresponds to a difference of -32, slot 63 to +31 */
	for (slot = 0; slot < 32 * 2; slot++) {
		diff = slot - 32;
		yuv_u[slot] = yuv_clamp_u8((int)(8 * 0.565f * diff) + 128);
		yuv_v[slot] = yuv_clamp_u8((int)(8 * 0.713f * diff) + 128);
	}
}
111
5b9aa749 112void rgb565_to_uyvy(void *d, const void *s, int pixels)
113{
114 unsigned int *dst = d;
115 const unsigned short *src = s;
116 const unsigned char *yu = yuv_u + 32;
117 const unsigned char *yv = yuv_v + 32;
118 int r0, g0, b0, r1, g1, b1;
119 int y0, y1, u, v;
120
121 for (; pixels > 0; src += 2, dst++, pixels -= 2)
122 {
123 r0 = (src[0] >> 11) & 0x1f;
124 g0 = (src[0] >> 6) & 0x1f;
125 b0 = src[0] & 0x1f;
126 r1 = (src[1] >> 11) & 0x1f;
127 g1 = (src[1] >> 6) & 0x1f;
128 b1 = src[1] & 0x1f;
129 y0 = (yuv_ry[r0] + yuv_gy[g0] + yuv_by[b0]) >> 16;
130 y1 = (yuv_ry[r1] + yuv_gy[g1] + yuv_by[b1]) >> 16;
131 u = yu[b0 - y0];
132 v = yv[r0 - y0];
133 // valid Y range seems to be 16..235
134 y0 = 16 + 219 * y0 / 31;
135 y1 = 16 + 219 * y1 / 31;
136
137 *dst = (y1 << 24) | (v << 16) | (y0 << 8) | u;
138 }
139}
140
c9099d02 141void bgr555_to_uyvy(void *d, const void *s, int pixels)
142{
143 unsigned int *dst = d;
144 const unsigned short *src = s;
145 const unsigned char *yu = yuv_u + 32;
146 const unsigned char *yv = yuv_v + 32;
147 int r0, g0, b0, r1, g1, b1;
148 int y0, y1, u, v;
149
150 for (; pixels > 0; src += 2, dst++, pixels -= 2)
151 {
152 b0 = (src[0] >> 10) & 0x1f;
153 g0 = (src[0] >> 5) & 0x1f;
154 r0 = src[0] & 0x1f;
155 b1 = (src[1] >> 10) & 0x1f;
156 g1 = (src[1] >> 5) & 0x1f;
157 r1 = src[1] & 0x1f;
158 y0 = (yuv_ry[r0] + yuv_gy[g0] + yuv_by[b0]) >> 16;
159 y1 = (yuv_ry[r1] + yuv_gy[g1] + yuv_by[b1]) >> 16;
160 u = yu[b0 - y0];
161 v = yv[r0 - y0];
c9099d02 162 y0 = 16 + 219 * y0 / 31;
163 y1 = 16 + 219 * y1 / 31;
164
165 *dst = (y1 << 24) | (v << 16) | (y0 << 8) | u;
166 }
167}
168
169void bgr888_to_uyvy(void *d, const void *s, int pixels)
170{
171 unsigned int *dst = d;
172 const unsigned char *src8 = s;
173 const unsigned char *yu = yuv_u + 32;
174 const unsigned char *yv = yuv_v + 32;
175 int r0, g0, b0, r1, g1, b1;
176 int y0, y1, u, v;
177
178 for (; pixels > 0; src8 += 3*2, dst++, pixels -= 2)
179 {
180 r0 = src8[0], g0 = src8[1], b0 = src8[2];
181 r1 = src8[3], g1 = src8[4], b1 = src8[5];
182 y0 = (r0 * 19595 + g0 * 38470 + b0 * 7471) >> 16;
183 y1 = (r1 * 19595 + g1 * 38470 + b1 * 7471) >> 16;
184 u = yu[(b0 - y0) / 8];
185 v = yv[(r0 - y0) / 8];
186 y0 = 16 + 219 * y0 / 255;
187 y1 = 16 + 219 * y1 / 255;
188
189 *dst = (y1 << 24) | (v << 16) | (y0 << 8) | u;
190 }
191}