gpu_neon: integration for arm64
[pcsx_rearmed.git] / frontend / cspace.c
CommitLineData
c9099d02 1/*
2 * (C) Gražvydas "notaz" Ignotas, 2011,2012
3 *
4 * This work is licensed under the terms of any of these licenses
5 * (at your option):
6 * - GNU GPL, version 2 or later.
7 * - GNU LGPL, version 2.1 or later.
8 * See the COPYING file in the top-level directory.
9 */
10
a80ae4a0 11#include "cspace.h"
12
4ea7de6a 13/*
14 * note: these are intended for testing and should be avoided
15 * in favor of NEON version or platform-specific conversion
16 */
17
1318072a
PC
/*
 * LE16TOHx2(x): treat the 32-bit value x as two packed little-endian
 * 16-bit halfwords and convert each halfword to host byte order.
 * On little-endian hosts this is the identity.
 */
#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
#define SWAP16(x) __builtin_bswap16(x)
/*
 * The swapped upper halfword is promoted to (signed) int; convert it to
 * unsigned before shifting so that values >= 0x8000 are not shifted
 * into the sign bit.
 */
#define LE16TOHx2(x) (((unsigned int)SWAP16((x) >> 16) << 16) | SWAP16(x))
#else
#define LE16TOHx2(x) (x)
#endif

#ifndef HAVE_bgr555_to_rgb565

/*
 * Convert 16-bit pixels with the layout
 *   bits 0-4 -> moved to bits 11-15, bits 5-9 -> bits 6-10,
 *   bits 10-14 -> bits 0-4
 * (i.e. swap the outer 5-bit fields and widen the gap for a 6-bit
 * middle field), two pixels per 32-bit word.
 *
 * dst_  - output buffer, written as 32-bit words
 * src_  - input buffer, read as 32-bit words of little-endian halfwords
 * bytes - size of the input in bytes; only whole 32-bit words are
 *         converted, a zero or negative size converts nothing
 */
void bgr555_to_rgb565(void *dst_, const void *src_, int bytes)
{
	const unsigned int *src = src_;
	unsigned int *dst = dst_;
	unsigned int x, words, p, r, g, b;

	/*
	 * A negative size would otherwise be converted to a huge unsigned
	 * loop bound by the comparison below.
	 */
	if (bytes <= 0)
		return;
	words = (unsigned int)bytes / 4;

	for (x = 0; x < words; x++) {
		p = LE16TOHx2(src[x]);

		/* both halfwords are handled at once through doubled masks */
		r = (p & 0x001f001f) << 11;
		g = (p & 0x03e003e0) << 1;
		b = (p & 0x7c007c00) >> 10;

		dst[x] = r | g | b;
	}
}

#endif
45
047899a4 46#ifndef HAVE_bgr888_to_x
d57557c0 47
/*
 * Pack 3-byte pixels into 16-bit pixels, two input pixels per output
 * 32-bit word. For each pixel, byte 0 supplies bits 11-15, byte 1
 * supplies bits 5-10 and byte 2 supplies bits 0-4 (the low bits of
 * every byte are dropped).
 *
 * dst_  - output buffer, written as 32-bit words
 * src_  - input buffer, read byte by byte
 * bytes - size of the input in bytes; input is consumed 6 bytes
 *         (one pixel pair) at a time and any remainder is ignored
 */
void bgr888_to_rgb565(void *dst_, const void *src_, int bytes)
{
	const unsigned char *in = src_;
	unsigned int *out = dst_;
	unsigned int first, second;

	while (bytes >= 6) {
		first  = ((in[0] & 0xf8u) << 8) | ((in[1] & 0xfcu) << 3) |
			 ((in[2] & 0xf8u) >> 3);
		second = ((in[3] & 0xf8u) << 8) | ((in[4] & 0xfcu) << 3) |
			 ((in[5] & 0xf8u) >> 3);

		/* the first pixel must land at the lower memory address */
#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
		*out = (first << 16) | second;
#else
		*out = (second << 16) | first;
#endif
		out++;
		in += 6;
		bytes -= 6;
	}
}
70
8fd0f4a8
PC
71#endif
72
#ifndef __ARM_NEON__
/*
 * TODO? - no C implementation of these two conversions exists here.
 * When __ARM_NEON__ is not defined they are empty placeholders:
 * neither buffer is read or written.
 * (Presumably NEON builds get real implementations from elsewhere -
 * verify against the build setup.)
 */
void rgb888_to_rgb565(void *dst, const void *src, int bytes)
{
	(void)dst;
	(void)src;
	(void)bytes;
}

void bgr888_to_rgb888(void *dst, const void *src, int bytes)
{
	(void)dst;
	(void)src;
	(void)bytes;
}

#endif // __ARM_NEON__
79
/* YUV stuff */

/* luma contribution of each 5-bit component value, scaled by 65536 */
static int yuv_ry[32], yuv_gy[32], yuv_by[32];
/* chroma for a (component - luma) difference of -32..31, stored at
 * index difference + 32 */
static unsigned char yuv_u[32 * 2], yuv_v[32 * 2];

/* limit a chroma value to the 0..255 range of a byte */
static unsigned char yuv_clamp_byte(int value)
{
	if (value < 0)
		return 0;
	if (value > 255)
		return 255;
	return value;
}

/*
 * Fill the lookup tables used by the *_to_uyvy converters.
 *
 * The tables implement:
 *   y0 = (int)((0.299f * r0) + (0.587f * g0) + (0.114f * b0));
 *   y1 = (int)((0.299f * r1) + (0.587f * g1) + (0.114f * b1));
 *   u = (int)(8 * 0.565f * (b0 - y0)) + 128;
 *   v = (int)(8 * 0.713f * (r0 - y0)) + 128;
 */
void bgr_to_uyvy_init(void)
{
	int level, diff;

	/* per-component luma weights, rounded to nearest */
	for (level = 0; level < 32; level++) {
		yuv_ry[level] = (int)(0.299f * level * 65536.0f + 0.5f);
		yuv_gy[level] = (int)(0.587f * level * 65536.0f + 0.5f);
		yuv_by[level] = (int)(0.114f * level * 65536.0f + 0.5f);
	}

	/* chroma, centered on 128 and saturated to a byte */
	for (diff = -32; diff < 32; diff++) {
		yuv_u[diff + 32] = yuv_clamp_byte((int)(8 * 0.565f * diff) + 128);
		yuv_v[diff + 32] = yuv_clamp_byte((int)(8 * 0.713f * diff) + 128);
	}
}
114
5b9aa749 115void rgb565_to_uyvy(void *d, const void *s, int pixels)
116{
117 unsigned int *dst = d;
118 const unsigned short *src = s;
119 const unsigned char *yu = yuv_u + 32;
120 const unsigned char *yv = yuv_v + 32;
121 int r0, g0, b0, r1, g1, b1;
122 int y0, y1, u, v;
123
124 for (; pixels > 0; src += 2, dst++, pixels -= 2)
125 {
126 r0 = (src[0] >> 11) & 0x1f;
127 g0 = (src[0] >> 6) & 0x1f;
128 b0 = src[0] & 0x1f;
129 r1 = (src[1] >> 11) & 0x1f;
130 g1 = (src[1] >> 6) & 0x1f;
131 b1 = src[1] & 0x1f;
132 y0 = (yuv_ry[r0] + yuv_gy[g0] + yuv_by[b0]) >> 16;
133 y1 = (yuv_ry[r1] + yuv_gy[g1] + yuv_by[b1]) >> 16;
134 u = yu[b0 - y0];
135 v = yv[r0 - y0];
136 // valid Y range seems to be 16..235
137 y0 = 16 + 219 * y0 / 31;
138 y1 = 16 + 219 * y1 / 31;
139
140 *dst = (y1 << 24) | (v << 16) | (y0 << 8) | u;
141 }
142}
143
c9099d02 144void bgr555_to_uyvy(void *d, const void *s, int pixels)
145{
146 unsigned int *dst = d;
147 const unsigned short *src = s;
148 const unsigned char *yu = yuv_u + 32;
149 const unsigned char *yv = yuv_v + 32;
150 int r0, g0, b0, r1, g1, b1;
151 int y0, y1, u, v;
152
153 for (; pixels > 0; src += 2, dst++, pixels -= 2)
154 {
155 b0 = (src[0] >> 10) & 0x1f;
156 g0 = (src[0] >> 5) & 0x1f;
157 r0 = src[0] & 0x1f;
158 b1 = (src[1] >> 10) & 0x1f;
159 g1 = (src[1] >> 5) & 0x1f;
160 r1 = src[1] & 0x1f;
161 y0 = (yuv_ry[r0] + yuv_gy[g0] + yuv_by[b0]) >> 16;
162 y1 = (yuv_ry[r1] + yuv_gy[g1] + yuv_by[b1]) >> 16;
163 u = yu[b0 - y0];
164 v = yv[r0 - y0];
c9099d02 165 y0 = 16 + 219 * y0 / 31;
166 y1 = 16 + 219 * y1 / 31;
167
168 *dst = (y1 << 24) | (v << 16) | (y0 << 8) | u;
169 }
170}
171
172void bgr888_to_uyvy(void *d, const void *s, int pixels)
173{
174 unsigned int *dst = d;
175 const unsigned char *src8 = s;
176 const unsigned char *yu = yuv_u + 32;
177 const unsigned char *yv = yuv_v + 32;
178 int r0, g0, b0, r1, g1, b1;
179 int y0, y1, u, v;
180
181 for (; pixels > 0; src8 += 3*2, dst++, pixels -= 2)
182 {
183 r0 = src8[0], g0 = src8[1], b0 = src8[2];
184 r1 = src8[3], g1 = src8[4], b1 = src8[5];
185 y0 = (r0 * 19595 + g0 * 38470 + b0 * 7471) >> 16;
186 y1 = (r1 * 19595 + g1 * 38470 + b1 * 7471) >> 16;
187 u = yu[(b0 - y0) / 8];
188 v = yv[(r0 - y0) / 8];
189 y0 = 16 + 219 * y0 / 255;
190 y1 = 16 + 219 * y1 / 255;
191
192 *dst = (y1 << 24) | (v << 16) | (y0 << 8) | u;
193 }
194}