src/ds/gx/software.c (view raw)
/* Copyright (c) 2013-2017 Jeffrey Pfau
 *
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
6#include <mgba/internal/ds/gx/software.h>
7
8#include <mgba-util/memory.h>
9#include "gba/renderers/software-private.h"
10
// Screen height expressed in the same units as vertex/edge y coordinates:
// scanline numbers are shifted left by 12 bits before being compared against
// edge y values, and vertex y values are subtracted from this constant when
// edges are built.
#define SCREEN_SIZE (DS_VIDEO_VERTICAL_PIXELS << 12)

// Vector instantiations for the polygon, edge and span lists used below
// (presumably these provide the *ListInit/Deinit/Append/Clear/Shift/
// GetPointer/Size helpers called in this file -- confirm against DEFINE_VECTOR).
DEFINE_VECTOR(DSGXSoftwarePolygonList, struct DSGXSoftwarePolygon);
DEFINE_VECTOR(DSGXSoftwareEdgeList, struct DSGXSoftwareEdge);
DEFINE_VECTOR(DSGXSoftwareSpanList, struct DSGXSoftwareSpan);
16
// Forward declarations of the callbacks that DSGXSoftwareRendererCreate
// installs on the renderer; their definitions follow later in this file.
static void DSGXSoftwareRendererInit(struct DSGXRenderer* renderer);
static void DSGXSoftwareRendererReset(struct DSGXRenderer* renderer);
static void DSGXSoftwareRendererDeinit(struct DSGXRenderer* renderer);
static void DSGXSoftwareRendererInvalidateTex(struct DSGXRenderer* renderer, int slot);
static void DSGXSoftwareRendererSetRAM(struct DSGXRenderer* renderer, struct DSGXVertex* verts, struct DSGXPolygon* polys, unsigned polyCount);
static void DSGXSoftwareRendererDrawScanline(struct DSGXRenderer* renderer, int y);
static void DSGXSoftwareRendererGetScanline(struct DSGXRenderer* renderer, int y, color_t** output);
24
// Unpack a 15-bit color (5 bits per channel, red in the lowest bits, then
// green, then blue) into three 6-bit channel values. Each 5-bit channel is
// doubled and its low bit is always set, so every output is an odd value in
// the range 1..63. Bit 15 of the input is ignored.
static void _expandColor(uint16_t c15, uint8_t* r, uint8_t* g, uint8_t* b) {
	const unsigned red = c15 & 0x1F;
	const unsigned green = (c15 >> 5) & 0x1F;
	const unsigned blue = (c15 >> 10) & 0x1F;

	*r = (red << 1) | 1;
	*g = (green << 1) | 1;
	*b = (blue << 1) | 1;
}
30
31static color_t _finishColor(uint8_t r, uint8_t g, uint8_t b) {
32#ifndef COLOR_16_BIT
33 color_t rgb = (r << 2) & 0xF8;
34 rgb |= (g << 10) & 0xF800;
35 rgb |= (b << 18) & 0xF80000;
36 return rgb;
37#else
38#error Unsupported color depth
39#endif
40}
41
42static color_t _lookupColor(struct DSGXSoftwareEndpoint* ep, struct DSGXSoftwarePolygon* poly) {
43 // TODO: Optimize
44 uint16_t texel;
45
46 int16_t s = ep->s >> 4;
47 int16_t t = ep->t >> 4;
48 if (!DSGXTexParamsIsSRepeat(poly->poly->texParams)) {
49 if (s < 0) {
50 s = 0;
51 } else if (s >= poly->texW) {
52 s = poly->texW - 1;
53 }
54 } else if (DSGXTexParamsIsSMirror(poly->poly->texParams)) {
55 if (s & poly->texW) {
56 s = poly->texW - s;
57 }
58 s &= poly->texW - 1;
59 } else {
60 s &= poly->texW - 1;
61 }
62 if (!DSGXTexParamsIsTRepeat(poly->poly->texParams)) {
63 if (t < 0) {
64 t = 0;
65 } else if (t >= poly->texH) {
66 t = poly->texW - 1;
67 }
68 } else if (DSGXTexParamsIsTMirror(poly->poly->texParams)) {
69 if (t & poly->texH) {
70 t = poly->texH - t;
71 }
72 t &= poly->texH - 1;
73 } else {
74 t &= poly->texH - 1;
75 }
76
77 uint16_t texelCoord = s + t * poly->texW;
78 switch (poly->texFormat) {
79 case 0:
80 default:
81 return _finishColor(ep->cr, ep->cg, ep->cb);
82 case 1:
83 return _finishColor(0, 0, 0x3F);
84 case 2:
85 texel = ((uint8_t*) poly->texBase)[texelCoord >> 2];
86 if (texelCoord & 0x3) {
87 texel >>= 2 * texel & 3;
88 }
89 texel &= 0x3;
90 break;
91 case 3:
92 texel = ((uint8_t*) poly->texBase)[texelCoord >> 1];
93 if (texelCoord & 0x1) {
94 texel >>= 4;
95 }
96 texel &= 0xF;
97 break;
98 case 4:
99 texel = ((uint8_t*) poly->texBase)[texelCoord];
100 break;
101 case 5:
102 return _finishColor(0x3F, 0, 0x3F);
103 case 6:
104 return _finishColor(0x3F, 0x3F, 0);
105 case 7:
106 return _finishColor(0x3F, 0x3F, 0x3F);
107 }
108 if (DSGXTexParamsIs0Transparent(poly->poly->texParams) && !texel) {
109 return FLAG_UNWRITTEN;
110 }
111 uint8_t r, g, b;
112 texel = poly->palBase[texel];
113 _expandColor(texel, &r, &g, &b);
114 return _finishColor(r, g, b);
115}
116
117static int _edgeSort(const void* a, const void* b) {
118 const struct DSGXSoftwareEdge* ea = a;
119 const struct DSGXSoftwareEdge* eb = b;
120
121 // Sort upside down
122 if (ea->y0 < eb->y0) {
123 return 1;
124 }
125 if (ea->y0 > eb->y0) {
126 return -1;
127 }
128 if (ea->y1 < eb->y1) {
129 return 1;
130 }
131 if (ea->y1 > eb->y1) {
132 return -1;
133 }
134 return 0;
135}
136
137static bool _edgeToSpan(struct DSGXSoftwareSpan* span, const struct DSGXSoftwareEdge* edge, int index, int32_t y) {
138 int32_t height = edge->y1 - edge->y0;
139 int64_t yw = (y << 12) - edge->y0;
140 if (!height) {
141 return false;
142 }
143 // Clamp to bounds
144 if (yw < 0) {
145 yw = 0;
146 } else if (yw > height) {
147 yw = height;
148 }
149 yw *= 0x100000000LL / height;
150
151 span->ep[index].x = (((int64_t) (edge->x1 - edge->x0) * yw) >> 32) + edge->x0;
152
153 if (index && span->ep[0].x > span->ep[index].x) {
154 int32_t temp = span->ep[index].x;
155 span->ep[index] = span->ep[0];
156 span->ep[0].x = temp;
157 index = 0;
158 }
159 int32_t w0 = edge->w0;
160 int32_t w1 = edge->w1;
161 int32_t w = (((int64_t) (edge->w1 - edge->w0) * yw) >> 32) + edge->w0;
162 int64_t wRecip;// = 0x1000000000000LL / w;
163 // XXX: Disable perspective correction until I figure out how to fix it
164 wRecip = 0x100000000;
165 w0 = 0x10000;
166 w1 = 0x10000;
167 span->ep[index].w = w;
168 span->ep[index].cr = (((((edge->cr1 * (int64_t) w1 - edge->cr0 * (int64_t) w0) * yw) >> 32) + edge->cr0 * (int64_t) w0) * wRecip) >> 48;
169 span->ep[index].cg = (((((edge->cg1 * (int64_t) w1 - edge->cg0 * (int64_t) w0) * yw) >> 32) + edge->cg0 * (int64_t) w0) * wRecip) >> 48;
170 span->ep[index].cb = (((((edge->cb1 * (int64_t) w1 - edge->cb0 * (int64_t) w0) * yw) >> 32) + edge->cb0 * (int64_t) w0) * wRecip) >> 48;
171 span->ep[index].s = (((((edge->s1 * (int64_t) w1 - edge->s0 * (int64_t) w0) * yw) >> 32) + edge->s0 * (int64_t) w0) * wRecip) >> 48;
172 span->ep[index].t = (((((edge->t1 * (int64_t) w1 - edge->t0 * (int64_t) w0) * yw) >> 32) + edge->t0 * (int64_t) w0) * wRecip) >> 48;
173
174 return true;
175}
176
177static int _spanSort(const void* a, const void* b) {
178 const struct DSGXSoftwareSpan* sa = a;
179 const struct DSGXSoftwareSpan* sb = b;
180
181 // Sort backwards
182 if (sa->ep[0].x < sb->ep[0].x) {
183 return 1;
184 }
185 if (sa->ep[0].x > sb->ep[0].x) {
186 return -1;
187 }
188 if (sa->ep[0].w < sb->ep[0].w) {
189 return 1;
190 }
191 if (sa->ep[0].w > sb->ep[0].w) {
192 return -1;
193 }
194 return 0;
195}
196
197static void _lerpEndpoint(const struct DSGXSoftwareSpan* span, struct DSGXSoftwareEndpoint* ep, unsigned x) {
198 int64_t width = span->ep[1].x - span->ep[0].x;
199 int64_t xw = ((uint64_t) x << 12) - span->ep[0].x;
200 if (!width) {
201 return; // TODO?
202 }
203 // Clamp to bounds
204 if (xw < 0) {
205 xw = 0;
206 } else if (xw > width) {
207 xw = width;
208 }
209 xw *= 0x100000000LL / width;
210 int32_t w0 = span->ep[0].w;
211 int32_t w1 = span->ep[1].w;
212 int64_t w = (((int64_t) (w1 - w0) * xw) >> 32) + w0;
213 int64_t wRecip;// = 0x1000000000000LL / w;
214 ep->w = w;
215 // XXX: Disable perspective correction until I figure out how to fix it
216 wRecip = 0x100000000;
217 w0 = 0x10000;
218 w1 = 0x10000;
219
220 uint64_t r = (((span->ep[1].cr * (int64_t) w1 - span->ep[0].cr * (int64_t) w0) * xw) >> 32) + span->ep[0].cr * (int64_t) w0;
221 uint64_t g = (((span->ep[1].cg * (int64_t) w1 - span->ep[0].cg * (int64_t) w0) * xw) >> 32) + span->ep[0].cg * (int64_t) w0;
222 uint64_t b = (((span->ep[1].cb * (int64_t) w1 - span->ep[0].cb * (int64_t) w0) * xw) >> 32) + span->ep[0].cb * (int64_t) w0;
223 ep->cr = (r * wRecip) >> 48;
224 ep->cg = (g * wRecip) >> 48;
225 ep->cb = (b * wRecip) >> 48;
226
227 int32_t s = (((span->ep[1].s * (int64_t) w1 - span->ep[0].s * (int64_t) w0) * xw) >> 32) + span->ep[0].s * (int64_t) w0;
228 int32_t t = (((span->ep[1].t * (int64_t) w1 - span->ep[0].t * (int64_t) w0) * xw) >> 32) + span->ep[0].t * (int64_t) w0;
229 ep->s = (s * wRecip) >> 48;
230 ep->t = (t * wRecip) >> 48;
231}
232
233void DSGXSoftwareRendererCreate(struct DSGXSoftwareRenderer* renderer) {
234 renderer->d.init = DSGXSoftwareRendererInit;
235 renderer->d.reset = DSGXSoftwareRendererReset;
236 renderer->d.deinit = DSGXSoftwareRendererDeinit;
237 renderer->d.invalidateTex = DSGXSoftwareRendererInvalidateTex;
238 renderer->d.setRAM = DSGXSoftwareRendererSetRAM;
239 renderer->d.drawScanline = DSGXSoftwareRendererDrawScanline;
240 renderer->d.getScanline = DSGXSoftwareRendererGetScanline;
241}
242
243static void DSGXSoftwareRendererInit(struct DSGXRenderer* renderer) {
244 struct DSGXSoftwareRenderer* softwareRenderer = (struct DSGXSoftwareRenderer*) renderer;
245 DSGXSoftwarePolygonListInit(&softwareRenderer->activePolys, DS_GX_POLYGON_BUFFER_SIZE / 4);
246 DSGXSoftwareEdgeListInit(&softwareRenderer->activeEdges, DS_GX_POLYGON_BUFFER_SIZE);
247 DSGXSoftwareSpanListInit(&softwareRenderer->activeSpans, DS_GX_POLYGON_BUFFER_SIZE / 2);
248 softwareRenderer->bucket = anonymousMemoryMap(sizeof(*softwareRenderer->bucket) * DS_GX_POLYGON_BUFFER_SIZE);
249 softwareRenderer->scanlineCache = anonymousMemoryMap(sizeof(color_t) * DS_VIDEO_VERTICAL_PIXELS * DS_VIDEO_HORIZONTAL_PIXELS);
250}
251
252static void DSGXSoftwareRendererReset(struct DSGXRenderer* renderer) {
253 struct DSGXSoftwareRenderer* softwareRenderer = (struct DSGXSoftwareRenderer*) renderer;
254 softwareRenderer->flushPending = false;
255}
256
257static void DSGXSoftwareRendererDeinit(struct DSGXRenderer* renderer) {
258 struct DSGXSoftwareRenderer* softwareRenderer = (struct DSGXSoftwareRenderer*) renderer;
259 DSGXSoftwarePolygonListDeinit(&softwareRenderer->activePolys);
260 DSGXSoftwareEdgeListDeinit(&softwareRenderer->activeEdges);
261 DSGXSoftwareSpanListDeinit(&softwareRenderer->activeSpans);
262 mappedMemoryFree(softwareRenderer->bucket, sizeof(*softwareRenderer->bucket) * DS_GX_POLYGON_BUFFER_SIZE);
263 mappedMemoryFree(softwareRenderer->scanlineCache, sizeof(color_t) * DS_VIDEO_VERTICAL_PIXELS * DS_VIDEO_HORIZONTAL_PIXELS);
264}
265
// Texture invalidation callback. Currently a stub: nothing is cached per
// texture slot yet, so both arguments are ignored.
static void DSGXSoftwareRendererInvalidateTex(struct DSGXRenderer* renderer, int slot) {
	(void) renderer;
	(void) slot;
	// TODO
}
270
271static void DSGXSoftwareRendererSetRAM(struct DSGXRenderer* renderer, struct DSGXVertex* verts, struct DSGXPolygon* polys, unsigned polyCount) {
272 struct DSGXSoftwareRenderer* softwareRenderer = (struct DSGXSoftwareRenderer*) renderer;
273
274 softwareRenderer->flushPending = true;
275 softwareRenderer->verts = verts;
276 DSGXSoftwarePolygonListClear(&softwareRenderer->activePolys);
277 DSGXSoftwareEdgeListClear(&softwareRenderer->activeEdges);
278 unsigned i;
279 for (i = 0; i < polyCount; ++i) {
280 struct DSGXSoftwarePolygon* poly = DSGXSoftwarePolygonListAppend(&softwareRenderer->activePolys);
281 struct DSGXSoftwareEdge* edge = DSGXSoftwareEdgeListAppend(&softwareRenderer->activeEdges);
282 poly->poly = &polys[i];
283 poly->texFormat = DSGXTexParamsGetFormat(poly->poly->texParams);
284 poly->texW = 8 << DSGXTexParamsGetSSize(poly->poly->texParams);
285 poly->texH = 8 << DSGXTexParamsGetTSize(poly->poly->texParams);
286 switch (poly->texFormat) {
287 case 0:
288 case 7:
289 poly->texBase = NULL;
290 poly->palBase = NULL;
291 break;
292 case 2:
293 poly->texBase = &renderer->tex[DSGXTexParamsGetVRAMBase(poly->poly->texParams) >> VRAM_BLOCK_OFFSET][(DSGXTexParamsGetVRAMBase(poly->poly->texParams) << 2) & 0xFFFF];
294 poly->palBase = &renderer->texPal[poly->poly->palBase >> 12][(poly->poly->palBase << 2) & 0x1FFF];
295 break;
296 default:
297 poly->texBase = &renderer->tex[DSGXTexParamsGetVRAMBase(poly->poly->texParams) >> VRAM_BLOCK_OFFSET][(DSGXTexParamsGetVRAMBase(poly->poly->texParams) << 2) & 0xFFFF];
298 poly->palBase = &renderer->texPal[poly->poly->palBase >> 11][(poly->poly->palBase << 3) & 0x1FFF];
299 break;
300 }
301 edge->polyId = i;
302
303 struct DSGXVertex* v0 = &verts[poly->poly->vertIds[0]];
304 struct DSGXVertex* v1;
305
306 int v;
307 for (v = 1; v < poly->poly->verts; ++v) {
308 v1 = &verts[poly->poly->vertIds[v]];
309 if (v0->vy >= v1->vy) {
310 edge->y0 = SCREEN_SIZE - v0->vy;
311 edge->x0 = v0->vx;
312 edge->w0 = v0->vw;
313 _expandColor(v0->color, &edge->cr0, &edge->cg0, &edge->cb0);
314 edge->s0 = v0->vs;
315 edge->t0 = v0->vt;
316
317 edge->y1 = SCREEN_SIZE - v1->vy;
318 edge->x1 = v1->vx;
319 edge->w1 = v1->vw;
320 _expandColor(v1->color, &edge->cr1, &edge->cg1, &edge->cb1);
321 edge->s1 = v1->vs;
322 edge->t1 = v1->vt;
323 } else {
324 edge->y0 = SCREEN_SIZE - v1->vy;
325 edge->x0 = v1->vx;
326 edge->w0 = v1->vw;
327 _expandColor(v1->color, &edge->cr0, &edge->cg0, &edge->cb0);
328 edge->s0 = v1->vs;
329 edge->t0 = v1->vt;
330
331 edge->y1 = SCREEN_SIZE - v0->vy;
332 edge->x1 = v0->vx;
333 edge->w1 = v0->vw;
334 _expandColor(v0->color, &edge->cr1, &edge->cg1, &edge->cb1);
335 edge->s1 = v0->vs;
336 edge->t1 = v0->vt;
337 }
338
339 edge = DSGXSoftwareEdgeListAppend(&softwareRenderer->activeEdges);
340 edge->polyId = i;
341 v0 = v1;
342 }
343
344 v1 = &verts[poly->poly->vertIds[0]];
345 if (v0->vy >= v1->vy) {
346 edge->y0 = SCREEN_SIZE - v0->vy;
347 edge->x0 = v0->vx;
348 edge->w0 = v0->vw;
349 _expandColor(v0->color, &edge->cr0, &edge->cg0, &edge->cb0);
350 edge->s0 = v0->vs;
351 edge->t0 = v0->vt;
352
353 edge->y1 = SCREEN_SIZE - v1->vy;
354 edge->x1 = v1->vx;
355 edge->w1 = v1->vw;
356 _expandColor(v1->color, &edge->cr1, &edge->cg1, &edge->cb1);
357 edge->s1 = v1->vs;
358 edge->t1 = v1->vt;
359 } else {
360 edge->y0 = SCREEN_SIZE - v1->vy;
361 edge->x0 = v1->vx;
362 edge->w0 = v1->vw;
363 _expandColor(v1->color, &edge->cr0, &edge->cg0, &edge->cb0);
364 edge->s0 = v1->vs;
365 edge->t0 = v1->vt;
366
367 edge->y1 = SCREEN_SIZE - v0->vy;
368 edge->x1 = v0->vx;
369 edge->w1 = v0->vw;
370 _expandColor(v0->color, &edge->cr1, &edge->cg1, &edge->cb1);
371 edge->s1 = v0->vs;
372 edge->t1 = v0->vt;
373 }
374 }
375 qsort(DSGXSoftwareEdgeListGetPointer(&softwareRenderer->activeEdges, 0), DSGXSoftwareEdgeListSize(&softwareRenderer->activeEdges), sizeof(struct DSGXSoftwareEdge), _edgeSort);
376}
377
378static void DSGXSoftwareRendererDrawScanline(struct DSGXRenderer* renderer, int y) {
379 struct DSGXSoftwareRenderer* softwareRenderer = (struct DSGXSoftwareRenderer*) renderer;
380 if (!softwareRenderer->flushPending) {
381 return;
382 }
383 DSGXSoftwareSpanListClear(&softwareRenderer->activeSpans);
384 memset(softwareRenderer->bucket, 0, sizeof(*softwareRenderer->bucket) * DS_GX_POLYGON_BUFFER_SIZE);
385 int i;
386 for (i = DSGXSoftwareEdgeListSize(&softwareRenderer->activeEdges); i; --i) {
387 size_t idx = i - 1;
388 struct DSGXSoftwareEdge* edge = DSGXSoftwareEdgeListGetPointer(&softwareRenderer->activeEdges, idx);
389 if (edge->y1 >> 12 < y) {
390 DSGXSoftwareEdgeListShift(&softwareRenderer->activeEdges, idx, 1);
391 continue;
392 } else if (edge->y0 >> 12 > y) {
393 continue;
394 }
395
396 unsigned poly = edge->polyId;
397 struct DSGXSoftwareSpan* span = softwareRenderer->bucket[poly];
398 if (span && !span->ep[1].w) {
399 _edgeToSpan(span, edge, 1, y);
400 softwareRenderer->bucket[poly] = NULL;
401 } else if (!span) {
402 span = DSGXSoftwareSpanListAppend(&softwareRenderer->activeSpans);
403 memset(&span->ep[1], 0, sizeof(span->ep[1]));
404 span->poly = DSGXSoftwarePolygonListGetPointer(&softwareRenderer->activePolys, poly);
405 if (!_edgeToSpan(span, edge, 0, y)) {
406 // Horizontal line
407 DSGXSoftwareSpanListShift(&softwareRenderer->activeSpans, DSGXSoftwareSpanListSize(&softwareRenderer->activeSpans) - 1, 1);
408 } else {
409 softwareRenderer->bucket[poly] = span;
410 }
411 }
412 }
413 qsort(DSGXSoftwareSpanListGetPointer(&softwareRenderer->activeSpans, 0), DSGXSoftwareSpanListSize(&softwareRenderer->activeSpans), sizeof(struct DSGXSoftwareSpan), _spanSort);
414
415 color_t* scanline = &softwareRenderer->scanlineCache[DS_VIDEO_HORIZONTAL_PIXELS * y];
416
417 int nextSpanX = DS_VIDEO_HORIZONTAL_PIXELS;
418 if (DSGXSoftwareSpanListSize(&softwareRenderer->activeSpans)) {
419 nextSpanX = DSGXSoftwareSpanListGetPointer(&softwareRenderer->activeSpans, DSGXSoftwareSpanListSize(&softwareRenderer->activeSpans) - 1)->ep[0].x;
420 nextSpanX >>= 12;
421 }
422 for (i = 0; i < DS_VIDEO_HORIZONTAL_PIXELS; ++i) {
423 struct DSGXSoftwareSpan* span = NULL;
424 struct DSGXSoftwareEndpoint ep;
425 int32_t depth = INT32_MAX;
426 scanline[i] = FLAG_UNWRITTEN;
427 if (i >= nextSpanX) {
428 size_t nextSpanId = DSGXSoftwareSpanListSize(&softwareRenderer->activeSpans);
429 span = DSGXSoftwareSpanListGetPointer(&softwareRenderer->activeSpans, nextSpanId - 1);
430 while (i > (span->ep[1].x >> 12) || !span->ep[1].x) {
431 DSGXSoftwareSpanListShift(&softwareRenderer->activeSpans, nextSpanId - 1, 1);
432 --nextSpanId;
433 if (!nextSpanId) {
434 nextSpanX = DS_VIDEO_HORIZONTAL_PIXELS;
435 span = NULL;
436 break;
437 }
438 span = DSGXSoftwareSpanListGetPointer(&softwareRenderer->activeSpans, nextSpanId - 1);
439 nextSpanX = span->ep[0].x >> 12;
440 }
441 while (i > (span->ep[0].x >> 12)) {
442 if (i <= (span->ep[1].x >> 12)) {
443 _lerpEndpoint(span, &ep, i);
444 color_t color = _lookupColor(&ep, span->poly);
445 if (scanline[i] == FLAG_UNWRITTEN) {
446 scanline[i] = color;
447 }
448 if (ep.w < depth && color != FLAG_UNWRITTEN) {
449 depth = ep.w;
450 scanline[i] = color;
451 }
452 }
453 --nextSpanId;
454 if (!nextSpanId) {
455 break;
456 }
457 span = DSGXSoftwareSpanListGetPointer(&softwareRenderer->activeSpans, nextSpanId - 1);
458 }
459 }
460 }
461 if (y == DS_VIDEO_VERTICAL_PIXELS - 1) {
462 softwareRenderer->flushPending = false;
463 }
464}
465
466static void DSGXSoftwareRendererGetScanline(struct DSGXRenderer* renderer, int y, color_t** output) {
467 struct DSGXSoftwareRenderer* softwareRenderer = (struct DSGXSoftwareRenderer*) renderer;
468 *output = &softwareRenderer->scanlineCache[DS_VIDEO_HORIZONTAL_PIXELS * y];
469}