Glide Plugin GLES2 port from mupen64plus-ae, but with special FrameSkip code
[mupen64plus-pandora.git] / source / gles2glide64 / src / Glide64 / TexLoad8b.h
CommitLineData
/*
* Glide64 - Glide video plugin for Nintendo 64 emulators.
* Copyright (c) 2002 Dave2001
* Copyright (c) 2003-2009 Sergey 'Gonetz' Lipski
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*/
20
//****************************************************************
//
// Glide64 - Glide Plugin for Nintendo 64 emulators
// Project started on December 29th, 2001
//
// Authors:
// Dave2001, original author, founded the project in 2001, left it in 2002
// Gugaman, joined the project in 2002, left it in 2002
// Sergey 'Gonetz' Lipski, joined the project in 2002, main author since fall of 2002
// Hiroshi 'KoolSmoky' Morii, joined the project in 2007
//
//****************************************************************
//
// To modify Glide64:
// * Write your name and (optional) email, commented by your work, so I know who did it, and so that you can find which parts you modified when it comes time to send it to me.
// * Do NOT send me the whole project or file that you modified. Take out your modified code sections, and tell me where to put them. If people sent the whole thing, I would have many different versions, but no idea how to combine them all.
//
//****************************************************************
#include <stdint.h>
#include <string.h>
40
/*
 * load8bCI - expand 8-bit palette indices into 16-bit texels.
 *
 * Each source byte selects one of the 256 entries of `pal`; the entry is
 * rotated right by one bit within 16 bits and stored as a native-endian
 * 16-bit texel (the caller, Load8bCI, reports the result as
 * GR_TEXFMT_ARGB_1555).
 *
 * src     start of the source texture data
 * dst     output buffer; every source byte produces two output bytes
 * wid_64  number of 8-byte chunks per row
 * height  number of rows
 * line    bytes to skip in the source after each row
 * ext     bytes to skip in the output after each row
 * pal     palette with at least 256 entries
 *
 * Odd rows (counting from 0) are stored with the two 4-byte halves of every
 * 8-byte chunk exchanged, so output texel i comes from source byte i ^ 4.
 *
 * Source offsets are reduced modulo 0x800 at the start of every row after
 * the first and after every chunk of an odd row; even rows are read linearly
 * from their (already reduced) start offset.
 * NOTE(review): 0x7FF presumably mirrors the size of the texture memory
 * window the source lives in - confirm against the caller.
 *
 * All accesses are byte-wise or go through memcpy, so neither buffer needs
 * any particular alignment.  Non-positive wid_64 or height load nothing.
 */
static inline void load8bCI(uint8_t *src, uint8_t *dst, int wid_64, int height, int line, int ext, uint16_t *pal)
{
  const uintptr_t wrap_mask = 0x7FF;
  uintptr_t offset = 0; /* current read position, relative to src */

  for (int row = 0; row < height; ++row)
  {
    const int odd = row & 1;
    const int half_swap = odd ? 4 : 0;

    if (row > 0)
    {
      /* Skip the inter-row padding on both sides. A negative `line` is
         handled by the modular arithmetic of the unsigned conversion. */
      offset = (offset + (uintptr_t)line) & wrap_mask;
      dst += ext;
    }

    for (int chunk = 0; chunk < wid_64; ++chunk)
    {
      const uint8_t *in = src + offset;

      for (int i = 0; i < 8; ++i)
      {
        const uint16_t entry = pal[in[i ^ half_swap]];
        /* 16-bit rotate right by 1: bit 0 moves to bit 15. */
        const uint16_t texel = (uint16_t)((entry >> 1) | (entry << 15));

        memcpy(dst, &texel, sizeof texel);
        dst += sizeof texel;
      }

      offset += 8;
      if (odd)
        offset &= wrap_mask;
    }
  }
}
142
/*
 * load8bIA8 - expand 8-bit palette indices into byte-swapped 16-bit texels.
 *
 * Each source byte selects one of the 256 entries of `pal`; the two bytes of
 * the entry are exchanged (16-bit rotate by 8) and the result is stored as a
 * native-endian 16-bit texel (the caller, Load8bCI, reports the result as
 * GR_TEXFMT_ALPHA_INTENSITY_88).
 *
 * src     start of the source texture data
 * dst     output buffer; every source byte produces two output bytes
 * wid_64  number of 8-byte chunks per row
 * height  number of rows
 * line    bytes to skip in the source after each row
 * ext     bytes to skip in the output after each row
 * pal     palette with at least 256 entries
 *
 * Odd rows (counting from 0) are stored with the two 4-byte halves of every
 * 8-byte chunk exchanged, so output texel i comes from source byte i ^ 4.
 * Unlike load8bCI, source addresses are never wrapped.
 *
 * All accesses are byte-wise or go through memcpy, so neither buffer needs
 * any particular alignment.  Non-positive wid_64 or height load nothing.
 */
static inline void load8bIA8(uint8_t *src, uint8_t *dst, int wid_64, int height, int line, int ext, uint16_t *pal)
{
  for (int row = 0; row < height; ++row)
  {
    const int half_swap = (row & 1) ? 4 : 0;

    if (row > 0)
    {
      /* Skip the inter-row padding on both sides. */
      src += line;
      dst += ext;
    }

    for (int chunk = 0; chunk < wid_64; ++chunk)
    {
      for (int i = 0; i < 8; ++i)
      {
        const uint16_t entry = pal[src[i ^ half_swap]];
        /* 16-bit rotate by 8: exchange the high and low bytes. */
        const uint16_t texel = (uint16_t)((entry >> 8) | (entry << 8));

        memcpy(dst, &texel, sizeof texel);
        dst += sizeof texel;
      }
      src += 8;
    }
  }
}
244
/*
 * load8bIA4 - copy an 8-bit texture while exchanging the two nibbles of
 * every byte (the caller, Load8bIA, reports the result as
 * GR_TEXFMT_ALPHA_INTENSITY_44).
 *
 * src     start of the source texture data
 * dst     output buffer; one output byte per source byte
 * wid_64  number of 8-byte chunks per row
 * height  number of rows
 * line    bytes to skip in the source after each row
 * ext     bytes to skip in the output after each row
 *
 * Odd rows (counting from 0) are stored with the two 4-byte halves of every
 * 8-byte chunk exchanged.
 *
 * Data is moved with memcpy, so neither buffer needs any particular
 * alignment.  Non-positive wid_64 or height load nothing.
 */
static inline void load8bIA4(uint8_t *src, uint8_t *dst, int wid_64, int height, int line, int ext)
{
  for (int row = 0; row < height; ++row)
  {
    const int odd = row & 1;

    if (row > 0)
    {
      /* Skip the inter-row padding on both sides. */
      src += line;
      dst += ext;
    }

    for (int chunk = 0; chunk < wid_64; ++chunk)
    {
      uint32_t word[2];

      memcpy(word, src, sizeof word);
      for (int i = 0; i < 2; ++i)
      {
        /* Swap the nibbles of all four bytes at once; the masks keep the
           shifted bits from leaking into the neighbouring byte. */
        word[i] = ((word[i] << 4) & 0xF0F0F0F0u) | ((word[i] >> 4) & 0x0F0F0F0Fu);
      }

      /* On odd rows the second word is written first. */
      memcpy(dst, &word[odd], sizeof word[0]);
      memcpy(dst + 4, &word[odd ^ 1], sizeof word[0]);

      src += 8;
      dst += 8;
    }
  }
}
310
/*
 * load8bI - copy an 8-bit texture unchanged, one byte per texel (the
 * callers report the result as GR_TEXFMT_ALPHA_8).
 *
 * src     start of the source texture data
 * dst     output buffer; one output byte per source byte
 * wid_64  number of 8-byte chunks per row
 * height  number of rows
 * line    bytes to skip in the source after each row
 * ext     bytes to skip in the output after each row
 *
 * Odd rows (counting from 0) are stored with the two 4-byte halves of every
 * 8-byte chunk exchanged; even rows are copied straight through.
 *
 * Data is moved with memcpy, so neither buffer needs any particular
 * alignment.  Non-positive wid_64 or height load nothing.
 */
static inline void load8bI(uint8_t *src, uint8_t *dst, int wid_64, int height, int line, int ext)
{
  for (int row = 0; row < height; ++row)
  {
    const int odd = row & 1;

    if (row > 0)
    {
      /* Skip the inter-row padding on both sides. */
      src += line;
      dst += ext;
    }

    for (int chunk = 0; chunk < wid_64; ++chunk)
    {
      uint32_t word[2];

      memcpy(word, src, sizeof word);

      /* On odd rows the second word is written first. */
      memcpy(dst, &word[odd], sizeof word[0]);
      memcpy(dst + 4, &word[odd ^ 1], sizeof word[0]);

      src += 8;
      dst += 8;
    }
  }
}
372
//****************************************************************
// Size: 1, Format: 2
//
376
377wxUint32 Load8bCI (wxUIntPtr dst, wxUIntPtr src, int wid_64, int height, int line, int real_width, int tile)
378{
379 if (wid_64 < 1) wid_64 = 1;
380 if (height < 1) height = 1;
381 int ext = (real_width - (wid_64 << 3));
382 unsigned short * pal = rdp.pal_8;
383
384 switch (rdp.tlut_mode) {
385 case 0: //palette is not used
386 //in tlut DISABLE mode load CI texture as plain intensity texture instead of palette dereference.
387 //Thanks to angrylion for the advice
388 load8bI ((uint8_t *)src, (uint8_t *)dst, wid_64, height, line, ext);
389 return /*(0 << 16) | */GR_TEXFMT_ALPHA_8;
390 case 2: //color palette
391 ext <<= 1;
392 load8bCI ((uint8_t *)src, (uint8_t *)dst, wid_64, height, line, ext, pal);
393 return (1 << 16) | GR_TEXFMT_ARGB_1555;
394 default: //IA palette
395 ext <<= 1;
396 load8bIA8 ((uint8_t *)src, (uint8_t *)dst, wid_64, height, line, ext, pal);
397 return (1 << 16) | GR_TEXFMT_ALPHA_INTENSITY_88;
398 }
399}
400
//****************************************************************
// Size: 1, Format: 3
//
// ** by Gugaman **
405
406wxUint32 Load8bIA (wxUIntPtr dst, wxUIntPtr src, int wid_64, int height, int line, int real_width, int tile)
407{
408 if (rdp.tlut_mode != 0)
409 return Load8bCI (dst, src, wid_64, height, line, real_width, tile);
410
411 if (wid_64 < 1) wid_64 = 1;
412 if (height < 1) height = 1;
413 int ext = (real_width - (wid_64 << 3));
414 load8bIA4 ((uint8_t *)src, (uint8_t *)dst, wid_64, height, line, ext);
415 return /*(0 << 16) | */GR_TEXFMT_ALPHA_INTENSITY_44;
416}
417
//****************************************************************
// Size: 1, Format: 4
//
// ** by Gugaman **
422
423wxUint32 Load8bI (wxUIntPtr dst, wxUIntPtr src, int wid_64, int height, int line, int real_width, int tile)
424{
425 if (rdp.tlut_mode != 0)
426 return Load8bCI (dst, src, wid_64, height, line, real_width, tile);
427
428 if (wid_64 < 1) wid_64 = 1;
429 if (height < 1) height = 1;
430 int ext = (real_width - (wid_64 << 3));
431 load8bI ((uint8_t *)src, (uint8_t *)dst, wid_64, height, line, ext);
432 return /*(0 << 16) | */GR_TEXFMT_ALPHA_8;
433}
434