all repos — mgba @ 1a0e44c014ad34bea30d237d27015d82d02cda4b

mGBA Game Boy Advance Emulator

src/ds/renderers/software.c (view raw)

  1/* Copyright (c) 2013-2017 Jeffrey Pfau
  2 *
  3 * This Source Code Form is subject to the terms of the Mozilla Public
  4 * License, v. 2.0. If a copy of the MPL was not distributed with this
  5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
  6#include <mgba/internal/ds/renderers/software.h>
  7#include "gba/renderers/software-private.h"
  8
  9#include <mgba/internal/arm/macros.h>
 10#include <mgba/internal/ds/gx.h>
 11#include <mgba/internal/ds/io.h>
 12
 13static void DSVideoSoftwareRendererInit(struct DSVideoRenderer* renderer);
 14static void DSVideoSoftwareRendererDeinit(struct DSVideoRenderer* renderer);
 15static void DSVideoSoftwareRendererReset(struct DSVideoRenderer* renderer);
 16static uint16_t DSVideoSoftwareRendererWriteVideoRegister(struct DSVideoRenderer* renderer, uint32_t address, uint16_t value);
 17static void DSVideoSoftwareRendererWritePalette(struct DSVideoRenderer* renderer, uint32_t address, uint16_t value);
 18static void DSVideoSoftwareRendererWriteOAM(struct DSVideoRenderer* renderer, uint32_t oam);
 19static void DSVideoSoftwareRendererInvalidateExtPal(struct DSVideoRenderer* renderer, bool obj, bool engB, int slot);
 20static void DSVideoSoftwareRendererDrawScanline(struct DSVideoRenderer* renderer, int y);
 21static void DSVideoSoftwareRendererDrawScanlineDirectly(struct DSVideoRenderer* renderer, int y, color_t* scanline);
 22static void DSVideoSoftwareRendererFinishFrame(struct DSVideoRenderer* renderer);
 23static void DSVideoSoftwareRendererGetPixels(struct DSVideoRenderer* renderer, size_t* stride, const void** pixels);
 24static void DSVideoSoftwareRendererPutPixels(struct DSVideoRenderer* renderer, size_t stride, const void* pixels);
 25
 26static void DSVideoSoftwareRendererDrawBackgroundExt0(struct GBAVideoSoftwareRenderer* renderer, struct GBAVideoSoftwareBackground* background, int inY);
 27static void DSVideoSoftwareRendererDrawBackgroundExt1(struct GBAVideoSoftwareRenderer* renderer, struct GBAVideoSoftwareBackground* background, int inY);
 28static void DSVideoSoftwareRendererDrawBackgroundExt2(struct GBAVideoSoftwareRenderer* renderer, struct GBAVideoSoftwareBackground* background, int inY);
 29
 30static bool _regenerateExtPalette(struct DSVideoSoftwareRenderer* renderer, bool obj, bool engB, int slot) {
 31	color_t* palette;
 32	color_t* variantPalette;
 33	struct GBAVideoSoftwareRenderer* softwareRenderer;
 34	uint16_t* vram;
 35	if (!obj) {
 36		if (!engB) {
 37			palette = &renderer->extPaletteA[slot * 4096];
 38			variantPalette = &renderer->variantPaletteA[slot * 4096];
 39			softwareRenderer = &renderer->engA;
 40			vram = renderer->d.vramABGExtPal[slot];
 41		} else {
 42			palette = &renderer->extPaletteB[slot * 4096];
 43			variantPalette = &renderer->variantPaletteB[slot * 4096];
 44			softwareRenderer = &renderer->engB;
 45			vram = renderer->d.vramBBGExtPal[slot];
 46		}
 47	} else {
 48		if (!engB) {
 49			palette = renderer->objExtPaletteA;
 50			variantPalette = renderer->variantPaletteA;
 51			softwareRenderer = &renderer->engA;
 52			vram = renderer->d.vramAOBJExtPal;
 53		} else {
 54			palette = renderer->objExtPaletteB;
 55			variantPalette = renderer->variantPaletteB;
 56			softwareRenderer = &renderer->engB;
 57			vram = renderer->d.vramBOBJExtPal;
 58		}
 59	}
 60	if (!vram) {
 61		return false;
 62	}
 63	int i;
 64	for (i = 0; i < 4096; ++i) {
 65		uint16_t value = vram[i];
 66#ifdef COLOR_16_BIT
 67#ifdef COLOR_5_6_5
 68		unsigned color = 0;
 69		color |= (value & 0x001F) << 11;
 70		color |= (value & 0x03E0) << 1;
 71		color |= (value & 0x7C00) >> 10;
 72#else
 73		unsigned color = value;
 74#endif
 75#else
 76		unsigned color = 0;
 77		color |= (value << 3) & 0xF8;
 78		color |= (value << 6) & 0xF800;
 79		color |= (value << 9) & 0xF80000;
 80		color |= (color >> 5) & 0x070707;
 81#endif
 82		palette[i] = color;
 83		if (softwareRenderer->blendEffect == BLEND_BRIGHTEN) {
 84			variantPalette[i] = _brighten(color, softwareRenderer->bldy);
 85		} else if (softwareRenderer->blendEffect == BLEND_DARKEN) {
 86			variantPalette[i] = _darken(color, softwareRenderer->bldy);
 87		}
 88	}
 89	if (obj) {
 90		softwareRenderer->objExtPalette = palette;
 91		softwareRenderer->objExtVariantPalette = variantPalette;
 92	} else {
 93		if (slot >= 2) {
 94			if (GBARegisterBGCNTIsExtPaletteSlot(softwareRenderer->bg[slot - 2].control)) {
 95				softwareRenderer->bg[slot - 2].extPalette = palette;
 96				softwareRenderer->bg[slot - 2].variantPalette = variantPalette;
 97			}
 98		} else if (slot < 2 && !GBARegisterBGCNTIsExtPaletteSlot(softwareRenderer->bg[slot].control) ) {
 99			softwareRenderer->bg[slot].extPalette = palette;
100			softwareRenderer->bg[slot].variantPalette = variantPalette;
101		}
102		softwareRenderer->bg[slot].extPalette = palette;
103		softwareRenderer->bg[slot].variantPalette = variantPalette;
104	}
105	return true;
106}
107
108static void _updateCharBase(struct DSVideoSoftwareRenderer* softwareRenderer, bool engB) {
109	struct GBAVideoSoftwareRenderer* eng;
110	if (!engB) {
111		eng = &softwareRenderer->engA;
112	} else {
113		eng = &softwareRenderer->engB;
114	}
115	int i;
116	uint32_t charBase = DSRegisterDISPCNTGetCharBase(softwareRenderer->dispcntA) << 16;
117	uint32_t screenBase = DSRegisterDISPCNTGetScreenBase(softwareRenderer->dispcntA) << 16;
118	for (i = 0; i < 4; ++i) {
119		if (!engB) {
120			uint32_t control = eng->bg[i].control;
121			eng->d.writeVideoRegister(&eng->d, DS9_REG_A_BG0CNT + i * 2, control);
122			eng->bg[i].control = control;
123		}
124
125		eng->bg[i].charBase = GBARegisterBGCNTGetCharBase(eng->bg[i].control) << 14;
126
127		if (!engB) {
128			softwareRenderer->engA.bg[i].charBase += charBase;
129			softwareRenderer->engA.bg[i].screenBase &= ~0x70000;
130			softwareRenderer->engA.bg[i].screenBase |= screenBase;
131		}
132	}
133}
134
135void DSVideoSoftwareRendererCreate(struct DSVideoSoftwareRenderer* renderer) {
136	renderer->d.init = DSVideoSoftwareRendererInit;
137	renderer->d.reset = DSVideoSoftwareRendererReset;
138	renderer->d.deinit = DSVideoSoftwareRendererDeinit;
139	renderer->d.writeVideoRegister = DSVideoSoftwareRendererWriteVideoRegister;
140	renderer->d.writePalette = DSVideoSoftwareRendererWritePalette;
141	renderer->d.writeOAM = DSVideoSoftwareRendererWriteOAM;
142	renderer->d.invalidateExtPal = DSVideoSoftwareRendererInvalidateExtPal;
143	renderer->d.drawScanline = DSVideoSoftwareRendererDrawScanline;
144	renderer->d.drawScanlineDirectly = DSVideoSoftwareRendererDrawScanlineDirectly;
145	renderer->d.finishFrame = DSVideoSoftwareRendererFinishFrame;
146	renderer->d.getPixels = DSVideoSoftwareRendererGetPixels;
147	renderer->d.putPixels = DSVideoSoftwareRendererPutPixels;
148
149	renderer->d.disableABG[0] = false;
150	renderer->d.disableABG[1] = false;
151	renderer->d.disableABG[2] = false;
152	renderer->d.disableABG[3] = false;
153	renderer->d.disableAOBJ = false;
154
155	renderer->d.disableBBG[0] = false;
156	renderer->d.disableBBG[1] = false;
157	renderer->d.disableBBG[2] = false;
158	renderer->d.disableBBG[3] = false;
159	renderer->d.disableBOBJ = false;
160
161	renderer->engA.d.cache = NULL;
162	GBAVideoSoftwareRendererCreate(&renderer->engA);
163	renderer->engA.combinedObjSort = true;
164
165	renderer->engB.d.cache = NULL;
166	GBAVideoSoftwareRendererCreate(&renderer->engB);
167	renderer->engB.combinedObjSort = true;
168}
169
170static void DSVideoSoftwareRendererInit(struct DSVideoRenderer* renderer) {
171	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
172	softwareRenderer->engA.d.palette = &renderer->palette[0];
173	softwareRenderer->engA.d.oam = &renderer->oam->oam[0];
174	softwareRenderer->engA.masterEnd = DS_VIDEO_HORIZONTAL_PIXELS;
175	softwareRenderer->engA.masterHeight = DS_VIDEO_VERTICAL_PIXELS;
176	softwareRenderer->engA.masterScanlines = DS_VIDEO_VERTICAL_TOTAL_PIXELS;
177	softwareRenderer->engA.outputBufferStride = softwareRenderer->outputBufferStride;
178	softwareRenderer->engB.d.palette = &renderer->palette[512];
179	softwareRenderer->engB.d.oam = &renderer->oam->oam[1];
180	softwareRenderer->engB.masterEnd = DS_VIDEO_HORIZONTAL_PIXELS;
181	softwareRenderer->engB.masterHeight = DS_VIDEO_VERTICAL_PIXELS;
182	softwareRenderer->engB.masterScanlines = DS_VIDEO_VERTICAL_TOTAL_PIXELS;
183	softwareRenderer->engB.outputBufferStride = softwareRenderer->outputBufferStride;
184
185	DSVideoSoftwareRendererReset(renderer);
186}
187
188static void DSVideoSoftwareRendererReset(struct DSVideoRenderer* renderer) {
189	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
190	softwareRenderer->engA.d.reset(&softwareRenderer->engA.d);
191	softwareRenderer->engB.d.reset(&softwareRenderer->engB.d);
192	softwareRenderer->powcnt = 0;
193	softwareRenderer->dispcntA = 0;
194	softwareRenderer->dispcntB = 0;
195}
196
197static void DSVideoSoftwareRendererDeinit(struct DSVideoRenderer* renderer) {
198	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
199	softwareRenderer->engA.d.deinit(&softwareRenderer->engA.d);
200	softwareRenderer->engB.d.deinit(&softwareRenderer->engB.d);
201}
202
203static void DSVideoSoftwareRendererUpdateDISPCNT(struct DSVideoSoftwareRenderer* softwareRenderer, bool engB) {
204	uint32_t dispcnt;
205	struct GBAVideoSoftwareRenderer* eng;
206	if (!engB) {
207		dispcnt = softwareRenderer->dispcntA;
208		eng = &softwareRenderer->engA;
209	} else {
210		dispcnt = softwareRenderer->dispcntB;
211		eng = &softwareRenderer->engB;
212	}
213	uint16_t fakeDispcnt = dispcnt & 0xFF87;
214	if (!DSRegisterDISPCNTIsTileObjMapping(dispcnt)) {
215		eng->tileStride = 0x20;
216	} else {
217		eng->tileStride = 0x20 << DSRegisterDISPCNTGetTileBoundary(dispcnt);
218		fakeDispcnt = GBARegisterDISPCNTFillObjCharacterMapping(fakeDispcnt);
219	}
220	eng->bitmapStride = 0x10 << DSRegisterDISPCNTGetBitmapObj2D(dispcnt);
221	eng->d.writeVideoRegister(&eng->d, DS9_REG_A_DISPCNT_LO, fakeDispcnt);
222	eng->dispcnt |= dispcnt & 0xFFFF0000;
223	if (DSRegisterDISPCNTIsBgExtPalette(dispcnt)) {
224		color_t* extPalette;
225		if (!engB) {
226			extPalette = softwareRenderer->extPaletteA;
227		} else {
228			extPalette = softwareRenderer->extPaletteB;
229		}
230		int i;
231		for (i = 0; i < 4; ++i) {
232			int slot = i;
233			if (i < 2 && GBARegisterBGCNTIsExtPaletteSlot(eng->bg[i].control)) {
234				slot += 2;
235			}
236			if (eng->bg[i].extPalette != &extPalette[slot * 4096]) {
237				_regenerateExtPalette(softwareRenderer, false, engB, slot);
238			}
239		}
240	} else {
241		eng->bg[0].extPalette = NULL;
242		eng->bg[1].extPalette = NULL;
243		eng->bg[2].extPalette = NULL;
244		eng->bg[3].extPalette = NULL;
245	}
246	if (DSRegisterDISPCNTIsObjExtPalette(dispcnt)) {
247		if (!engB) {
248			if (softwareRenderer->engA.objExtPalette != softwareRenderer->objExtPaletteA) {
249				_regenerateExtPalette(softwareRenderer, true, engB, 0);
250			}
251		} else {
252			if (softwareRenderer->engB.objExtPalette != softwareRenderer->objExtPaletteB) {
253				_regenerateExtPalette(softwareRenderer, true, engB, 0);
254			}
255		}
256	} else {
257		if (!engB) {
258			softwareRenderer->engA.objExtPalette = NULL;
259		} else {
260			softwareRenderer->engB.objExtPalette = NULL;
261		}
262	}
263	if (!engB) {
264		eng->dispcnt = DSRegisterDISPCNTClear3D(eng->dispcnt);
265		eng->dispcnt |= DSRegisterDISPCNTIs3D(dispcnt);
266		_updateCharBase(softwareRenderer, engB);
267	}
268}
269
270static uint16_t DSVideoSoftwareRendererWriteVideoRegister(struct DSVideoRenderer* renderer, uint32_t address, uint16_t value) {
271	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
272	if (address >= DS9_REG_A_BG0CNT && address <= DS9_REG_A_BLDY) {
273		softwareRenderer->engA.d.writeVideoRegister(&softwareRenderer->engA.d, address, value);
274	} else if (address >= DS9_REG_B_BG0CNT && address <= DS9_REG_B_BLDY) {
275		softwareRenderer->engB.d.writeVideoRegister(&softwareRenderer->engB.d, address & 0xFF, value);
276	} else {
277		mLOG(DS_VIDEO, STUB, "Stub video register write: %04X:%04X", address, value);
278	}
279	switch (address) {
280	case DS9_REG_A_BG0CNT:
281	case DS9_REG_A_BG1CNT:
282		softwareRenderer->engA.bg[(address - DS9_REG_A_BG0CNT) >> 1].control = value;
283		// Fall through
284	case DS9_REG_A_BG2CNT:
285	case DS9_REG_A_BG3CNT:
286		_updateCharBase(softwareRenderer, false);
287		break;
288	case DS9_REG_B_BG0CNT:
289	case DS9_REG_B_BG1CNT:
290		softwareRenderer->engB.bg[(address - DS9_REG_B_BG0CNT) >> 1].control = value;
291		// Fall through
292	case DS9_REG_B_BG2CNT:
293	case DS9_REG_B_BG3CNT:
294		_updateCharBase(softwareRenderer, true);
295		break;
296	case DS9_REG_A_MASTER_BRIGHT:
297		softwareRenderer->engA.masterBright = DSRegisterMASTER_BRIGHTGetMode(value);
298		softwareRenderer->engA.masterBrightY = DSRegisterMASTER_BRIGHTGetY(value);
299		if (softwareRenderer->engA.masterBrightY > 0x10) {
300			softwareRenderer->engA.masterBrightY = 0x10;
301		}
302		break;
303	case DS9_REG_B_MASTER_BRIGHT:
304		softwareRenderer->engB.masterBright = DSRegisterMASTER_BRIGHTGetMode(value);
305		softwareRenderer->engB.masterBrightY = DSRegisterMASTER_BRIGHTGetY(value);
306		if (softwareRenderer->engB.masterBrightY > 0x10) {
307			softwareRenderer->engB.masterBrightY = 0x10;
308		}
309		break;
310	case DS9_REG_A_BLDCNT:
311	case DS9_REG_A_BLDY:
312		// TODO: Optimize
313		_regenerateExtPalette(softwareRenderer, false, false, 0);
314		_regenerateExtPalette(softwareRenderer, false, false, 1);
315		_regenerateExtPalette(softwareRenderer, false, false, 2);
316		_regenerateExtPalette(softwareRenderer, false, false, 3);
317		_regenerateExtPalette(softwareRenderer, true, false, 0);
318		break;
319	case DS9_REG_B_BLDCNT:
320	case DS9_REG_B_BLDY:
321		// TODO: Optimize
322		_regenerateExtPalette(softwareRenderer, false, true, 0);
323		_regenerateExtPalette(softwareRenderer, false, true, 1);
324		_regenerateExtPalette(softwareRenderer, false, true, 2);
325		_regenerateExtPalette(softwareRenderer, false, true, 3);
326		_regenerateExtPalette(softwareRenderer, true, true, 0);
327		break;
328	case DS9_REG_A_DISPCNT_LO:
329		softwareRenderer->dispcntA &= 0xFFFF0000;
330		softwareRenderer->dispcntA |= value;
331		DSVideoSoftwareRendererUpdateDISPCNT(softwareRenderer, false);
332		break;
333	case DS9_REG_A_DISPCNT_HI:
334		softwareRenderer->dispcntA &= 0x0000FFFF;
335		softwareRenderer->dispcntA |= value << 16;
336		DSVideoSoftwareRendererUpdateDISPCNT(softwareRenderer, false);
337		break;
338	case DS9_REG_B_DISPCNT_LO:
339		softwareRenderer->dispcntB &= 0xFFFF0000;
340		softwareRenderer->dispcntB |= value;
341		DSVideoSoftwareRendererUpdateDISPCNT(softwareRenderer, true);
342		break;
343	case DS9_REG_B_DISPCNT_HI:
344		softwareRenderer->dispcntB &= 0x0000FFFF;
345		softwareRenderer->dispcntB |= value << 16;
346		DSVideoSoftwareRendererUpdateDISPCNT(softwareRenderer, true);
347		break;
348	case DS9_REG_POWCNT1:
349		value &= 0x810F;
350		softwareRenderer->powcnt = value;
351	}
352	return value;
353}
354
355static void DSVideoSoftwareRendererWritePalette(struct DSVideoRenderer* renderer, uint32_t address, uint16_t value) {
356	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
357	if (address < 0x400) {
358		softwareRenderer->engA.d.writePalette(&softwareRenderer->engA.d, address & 0x3FF, value);
359	} else {
360		softwareRenderer->engB.d.writePalette(&softwareRenderer->engB.d, address & 0x3FF, value);
361	}
362}
363
364static void DSVideoSoftwareRendererWriteOAM(struct DSVideoRenderer* renderer, uint32_t oam) {
365	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
366	if (oam < 0x200) {
367		softwareRenderer->engA.d.writeOAM(&softwareRenderer->engA.d, oam & 0x1FF);
368	} else {
369		softwareRenderer->engB.d.writeOAM(&softwareRenderer->engB.d, oam & 0x1FF);
370	}
371}
372
/* Callback invoked when an extended palette is invalidated: rebuilds the
 * matching cached palette. The result of the rebuild is ignored. */
static void DSVideoSoftwareRendererInvalidateExtPal(struct DSVideoRenderer* renderer, bool obj, bool engB, int slot) {
	_regenerateExtPalette((struct DSVideoSoftwareRenderer*) renderer, obj, engB, slot);
}
377
378static void DSVideoSoftwareRendererDrawGBAScanline(struct GBAVideoRenderer* renderer, struct DSGX* gx, int y) {
379	struct GBAVideoSoftwareRenderer* softwareRenderer = (struct GBAVideoSoftwareRenderer*) renderer;
380
381	int x;
382	color_t* row = &softwareRenderer->outputBuffer[softwareRenderer->outputBufferStride * y];
383	if (GBARegisterDISPCNTIsForcedBlank(softwareRenderer->dispcnt)) {
384		for (x = 0; x < softwareRenderer->masterEnd; ++x) {
385			row[x] = GBA_COLOR_WHITE;
386		}
387		return;
388	}
389
390	GBAVideoSoftwareRendererPreprocessBuffer(softwareRenderer, y);
391	int spriteLayers = GBAVideoSoftwareRendererPreprocessSpriteLayer(softwareRenderer, y);
392	memset(softwareRenderer->alphaA, softwareRenderer->blda, sizeof(softwareRenderer->alphaA));
393	memset(softwareRenderer->alphaB, softwareRenderer->bldb, sizeof(softwareRenderer->alphaB));
394
395	int w;
396	unsigned priority;
397	for (priority = 0; priority < 4; ++priority) {
398		softwareRenderer->end = 0;
399		for (w = 0; w < softwareRenderer->nWindows; ++w) {
400			softwareRenderer->start = softwareRenderer->end;
401			softwareRenderer->end = softwareRenderer->windows[w].endX;
402			softwareRenderer->currentWindow = softwareRenderer->windows[w].control;
403			if (spriteLayers & (1 << priority)) {
404				GBAVideoSoftwareRendererPostprocessSprite(softwareRenderer, priority);
405			}
406			if (TEST_LAYER_ENABLED(0)) {
407				if (DSRegisterDISPCNTIs3D(softwareRenderer->dispcnt) && gx) {
408					const color_t* scanline;
409					gx->renderer->getScanline(gx->renderer, y, &scanline);
410					uint32_t flags = (softwareRenderer->bg[0].priority << OFFSET_PRIORITY) | FLAG_IS_BACKGROUND | FLAG_TARGET_1 | FLAG_TARGET_2;
411					int x;
412					for (x = softwareRenderer->start; x < softwareRenderer->end; ++x) {
413						color_t color = scanline[x];
414						if (color & 0xFC000000) {
415							if (softwareRenderer->bg[0].target1 && GBAWindowControlIsBlendEnable(softwareRenderer->currentWindow.packed)) {
416								if (softwareRenderer->blendEffect == BLEND_DARKEN) {
417									color = _darken(color, softwareRenderer->bldy) | (color & 0xFF000000);
418								} else if (softwareRenderer->blendEffect == BLEND_BRIGHTEN) {
419									color = _brighten(color, softwareRenderer->bldy) | (color & 0xFF000000);
420								}
421							}
422							if ((scanline[x] >> 28) != 0xF) {
423								// TODO: More precise values
424								softwareRenderer->alphaA[x] = (color >> 28) + 1;
425								softwareRenderer->alphaB[x] = 0xF - (color >> 28);
426								_compositeBlendNoObjwin(softwareRenderer, x, (color & 0x00FFFFFF) | flags, softwareRenderer->row[x]);
427							} else {
428								if (!(softwareRenderer->row[x] & FLAG_TARGET_1)) {
429									_compositeNoBlendNoObjwin(softwareRenderer, x, (color & 0x00FFFFFF) | flags, softwareRenderer->row[x]);
430								} else {
431									_compositeBlendNoObjwin(softwareRenderer, x, (color & 0x00FFFFFF) | flags, softwareRenderer->row[x]);
432								}
433								softwareRenderer->alphaA[x] = 0x10;
434								softwareRenderer->alphaB[x] = 0;
435							}
436						}
437					}
438				} else {
439					GBAVideoSoftwareRendererDrawBackgroundMode0(softwareRenderer, &softwareRenderer->bg[0], y);
440				}
441			}
442			if (TEST_LAYER_ENABLED(1)) {
443				GBAVideoSoftwareRendererDrawBackgroundMode0(softwareRenderer, &softwareRenderer->bg[1], y);
444			}
445			if (TEST_LAYER_ENABLED(2)) {
446				switch (GBARegisterDISPCNTGetMode(softwareRenderer->dispcnt)) {
447				case 0:
448				case 1:
449				case 3:
450					GBAVideoSoftwareRendererDrawBackgroundMode0(softwareRenderer, &softwareRenderer->bg[2], y);
451					break;
452				case 2:
453				case 4:
454					GBAVideoSoftwareRendererDrawBackgroundMode2(softwareRenderer, &softwareRenderer->bg[2], y);
455					break;
456				case 5:
457					if (!GBARegisterBGCNTIsExtendedMode1(softwareRenderer->bg[2].control)) {
458						DSVideoSoftwareRendererDrawBackgroundExt0(softwareRenderer, &softwareRenderer->bg[2], y);
459					} else if (!GBARegisterBGCNTIsExtendedMode0(softwareRenderer->bg[2].control)) {
460						DSVideoSoftwareRendererDrawBackgroundExt1(softwareRenderer, &softwareRenderer->bg[2], y);
461					} else {
462						DSVideoSoftwareRendererDrawBackgroundExt2(softwareRenderer, &softwareRenderer->bg[2], y);
463					}
464					break;
465				}
466			}
467			if (TEST_LAYER_ENABLED(3)) {
468				switch (GBARegisterDISPCNTGetMode(softwareRenderer->dispcnt)) {
469				case 0:
470					GBAVideoSoftwareRendererDrawBackgroundMode0(softwareRenderer, &softwareRenderer->bg[3], y);
471					break;
472				case 1:
473				case 2:
474					GBAVideoSoftwareRendererDrawBackgroundMode2(softwareRenderer, &softwareRenderer->bg[3], y);
475					break;
476				case 3:
477				case 4:
478				case 5:
479					if (!GBARegisterBGCNTIsExtendedMode1(softwareRenderer->bg[3].control)) {
480						DSVideoSoftwareRendererDrawBackgroundExt0(softwareRenderer, &softwareRenderer->bg[3], y);
481					} else if (!GBARegisterBGCNTIsExtendedMode0(softwareRenderer->bg[3].control)) {
482						DSVideoSoftwareRendererDrawBackgroundExt1(softwareRenderer, &softwareRenderer->bg[3], y);
483					} else {
484						DSVideoSoftwareRendererDrawBackgroundExt2(softwareRenderer, &softwareRenderer->bg[3], y);
485					}
486					break;
487				}
488			}
489		}
490	}
491
492	GBAVideoSoftwareRendererPostprocessBuffer(softwareRenderer);
493}
494
495static void _advanceAffine(struct GBAVideoSoftwareRenderer* softwareRenderer) {
496	switch (GBARegisterDISPCNTGetMode(softwareRenderer->dispcnt)) {
497	case 2:
498	case 4:
499	case 5:
500		softwareRenderer->bg[2].sx += softwareRenderer->bg[2].dmx;
501		softwareRenderer->bg[2].sy += softwareRenderer->bg[2].dmy;
502		// Fall through
503	case 1:
504	case 3:
505		softwareRenderer->bg[3].sx += softwareRenderer->bg[3].dmx;
506		softwareRenderer->bg[3].sy += softwareRenderer->bg[3].dmy;
507		break;
508	}
509}
510
511static void _deadvanceAffine(struct GBAVideoSoftwareRenderer* softwareRenderer) {
512	switch (GBARegisterDISPCNTGetMode(softwareRenderer->dispcnt)) {
513	case 2:
514	case 4:
515	case 5:
516		softwareRenderer->bg[2].sx -= softwareRenderer->bg[2].dmx;
517		softwareRenderer->bg[2].sy -= softwareRenderer->bg[2].dmy;
518		// Fall through
519	case 1:
520	case 3:
521		softwareRenderer->bg[3].sx -= softwareRenderer->bg[3].dmx;
522		softwareRenderer->bg[3].sy -= softwareRenderer->bg[3].dmy;
523		break;
524	}
525}
526
527static void _drawScanlineA(struct DSVideoSoftwareRenderer* softwareRenderer, int y) {
528	memcpy(softwareRenderer->engA.d.vramBG, softwareRenderer->d.vramABG, sizeof(softwareRenderer->engA.d.vramBG));
529	memcpy(softwareRenderer->engA.d.vramOBJ, softwareRenderer->d.vramAOBJ, sizeof(softwareRenderer->engA.d.vramOBJ));
530	color_t* row = &softwareRenderer->engA.outputBuffer[softwareRenderer->outputBufferStride * y];
531
532	int x;
533	switch (DSRegisterDISPCNTGetDispMode(softwareRenderer->dispcntA)) {
534	case 0:
535		for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
536			row[x] = GBA_COLOR_WHITE;
537		}
538		return;
539	case 1:
540		DSVideoSoftwareRendererDrawGBAScanline(&softwareRenderer->engA.d, softwareRenderer->d.gx, y);
541		break;
542	case 2: {
543		uint16_t* vram = &softwareRenderer->d.vram[0x10000 * DSRegisterDISPCNTGetVRAMBlock(softwareRenderer->dispcntA)];
544		for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
545			color_t color;
546			LOAD_16(color, (x + y * DS_VIDEO_HORIZONTAL_PIXELS) * 2, vram);
547#ifndef COLOR_16_BIT
548			unsigned color32 = 0;
549			color32 |= (color << 9) & 0xF80000;
550			color32 |= (color << 3) & 0xF8;
551			color32 |= (color << 6) & 0xF800;
552			color32 |= (color32 >> 5) & 0x070707;
553			color = color32;
554#elif COLOR_5_6_5
555			uint16_t color16 = 0;
556			color16 |= (color & 0x001F) << 11;
557			color16 |= (color & 0x03E0) << 1;
558			color16 |= (color & 0x7C00) >> 10;
559			color = color16;
560#endif
561			softwareRenderer->engA.row[x] = color;
562		}
563		break;
564	}
565	case 3:
566		break;
567	}
568
569	_advanceAffine(&softwareRenderer->engA);
570
571#ifdef COLOR_16_BIT
572#if defined(__ARM_NEON) && !defined(__APPLE__)
573	_to16Bit(row, softwareRenderer->engA.row, DS_VIDEO_HORIZONTAL_PIXELS);
574#else
575	for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
576		row[x] = softwareRenderer->engA.row[x];
577	}
578#endif
579#else
580	switch (softwareRenderer->engA.masterBright) {
581	case 0:
582	default:
583		memcpy(row, softwareRenderer->engA.row, softwareRenderer->engA.masterEnd * sizeof(*row));
584		break;
585	case 1:
586		for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
587			row[x] = _brighten(softwareRenderer->engA.row[x], softwareRenderer->engA.masterBrightY);
588		}
589		break;
590	case 2:
591		for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
592			row[x] = _darken(softwareRenderer->engA.row[x], softwareRenderer->engA.masterBrightY);
593		}
594		break;
595	}
596#endif
597}
598
599static void _drawScanlineB(struct DSVideoSoftwareRenderer* softwareRenderer, int y) {
600	memcpy(softwareRenderer->engB.d.vramBG, softwareRenderer->d.vramBBG, sizeof(softwareRenderer->engB.d.vramBG));
601	memcpy(softwareRenderer->engB.d.vramOBJ, softwareRenderer->d.vramBOBJ, sizeof(softwareRenderer->engB.d.vramOBJ));
602	color_t* row = &softwareRenderer->engB.outputBuffer[softwareRenderer->outputBufferStride * y];
603
604	int x;
605	switch (DSRegisterDISPCNTGetDispMode(softwareRenderer->dispcntB)) {
606	case 0:
607		for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
608			row[x] = GBA_COLOR_WHITE;
609		}
610		return;
611	case 1:
612		DSVideoSoftwareRendererDrawGBAScanline(&softwareRenderer->engB.d, NULL, y);
613		break;
614	}
615
616	_advanceAffine(&softwareRenderer->engB);
617
618#ifdef COLOR_16_BIT
619#if defined(__ARM_NEON) && !defined(__APPLE__)
620	_to16Bit(row, softwareRenderer->engB.row, DS_VIDEO_HORIZONTAL_PIXELS);
621#else
622	for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
623		row[x] = softwareRenderer->engB.row[x];
624	}
625#endif
626#else
627	switch (softwareRenderer->engB.masterBright) {
628	case 0:
629	default:
630		memcpy(row, softwareRenderer->engB.row, softwareRenderer->engB.masterEnd * sizeof(*row));
631		break;
632	case 1:
633		for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
634			row[x] = _brighten(softwareRenderer->engB.row[x], softwareRenderer->engB.masterBrightY);
635		}
636		break;
637	case 2:
638		for (x = 0; x < DS_VIDEO_HORIZONTAL_PIXELS; ++x) {
639			row[x] = _darken(softwareRenderer->engB.row[x], softwareRenderer->engB.masterBrightY);
640		}
641		break;
642	}
643#endif
644}
645
646static void DSVideoSoftwareRendererDrawScanline(struct DSVideoRenderer* renderer, int y) {
647	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
648	if (!DSRegisterPOWCNT1IsSwap(softwareRenderer->powcnt)) {
649		softwareRenderer->engA.outputBuffer = &softwareRenderer->outputBuffer[softwareRenderer->outputBufferStride * DS_VIDEO_VERTICAL_PIXELS];
650		softwareRenderer->engB.outputBuffer = softwareRenderer->outputBuffer;
651	} else {
652		softwareRenderer->engA.outputBuffer = softwareRenderer->outputBuffer;
653		softwareRenderer->engB.outputBuffer = &softwareRenderer->outputBuffer[softwareRenderer->outputBufferStride * DS_VIDEO_VERTICAL_PIXELS];
654	}
655
656	softwareRenderer->engA.d.disableBG[0] = softwareRenderer->d.disableABG[0];
657	softwareRenderer->engA.d.disableBG[1] = softwareRenderer->d.disableABG[1];
658	softwareRenderer->engA.d.disableBG[2] = softwareRenderer->d.disableABG[2];
659	softwareRenderer->engA.d.disableBG[3] = softwareRenderer->d.disableABG[3];
660	softwareRenderer->engA.d.disableOBJ = softwareRenderer->d.disableAOBJ;
661
662	softwareRenderer->engB.d.disableBG[0] = softwareRenderer->d.disableBBG[0];
663	softwareRenderer->engB.d.disableBG[1] = softwareRenderer->d.disableBBG[1];
664	softwareRenderer->engB.d.disableBG[2] = softwareRenderer->d.disableBBG[2];
665	softwareRenderer->engB.d.disableBG[3] = softwareRenderer->d.disableBBG[3];
666	softwareRenderer->engB.d.disableOBJ = softwareRenderer->d.disableBOBJ;
667
668	_drawScanlineA(softwareRenderer, y);
669	_drawScanlineB(softwareRenderer, y);
670}
671
672static void DSVideoSoftwareRendererDrawScanlineDirectly(struct DSVideoRenderer* renderer, int y, color_t* scanline) {
673	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
674	_deadvanceAffine(&softwareRenderer->engA);
675	DSVideoSoftwareRendererDrawGBAScanline(&softwareRenderer->engA.d, softwareRenderer->d.gx, y);
676	_advanceAffine(&softwareRenderer->engA);
677	memcpy(scanline, softwareRenderer->engA.row, softwareRenderer->engA.masterEnd * sizeof(*scanline));
678}
679
680static void DSVideoSoftwareRendererFinishFrame(struct DSVideoRenderer* renderer) {
681	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
682	softwareRenderer->engA.d.finishFrame(&softwareRenderer->engA.d);
683	softwareRenderer->engB.d.finishFrame(&softwareRenderer->engB.d);
684}
685
686static void DSVideoSoftwareRendererGetPixels(struct DSVideoRenderer* renderer, size_t* stride, const void** pixels) {
687	struct DSVideoSoftwareRenderer* softwareRenderer = (struct DSVideoSoftwareRenderer*) renderer;
688#ifdef COLOR_16_BIT
689#error Not yet supported
690#else
691	*stride = softwareRenderer->outputBufferStride;
692	*pixels = softwareRenderer->outputBuffer;
693#endif
694}
695
/* No-op: this renderer does not take pixel data back in, so every argument is
 * ignored. */
static void DSVideoSoftwareRendererPutPixels(struct DSVideoRenderer* renderer, size_t stride, const void* pixels) {
	(void) renderer;
	(void) stride;
	(void) pixels;
}
698
/* Building blocks for DSVideoSoftwareRendererDrawBackgroundExt0.
 *
 * These macros expand inside that function's per-pixel loop and rely on its
 * locals by name: x, y, localX, localY, sizeAdjusted, mapData, pixelData,
 * paletteData, palette, mainPalette, mosaicH, mosaicWait, outX and pixel.
 * Several of them use `continue` to skip the current pixel, so they are only
 * valid inside a loop body. */

/* Coordinate handling when the background wraps: fold x/y into the map. */
#define EXT_0_COORD_OVERFLOW \
	localX = x & (sizeAdjusted - 1); \
	localY = y & (sizeAdjusted - 1);

/* Coordinate handling when the background does not wrap: skip the pixel if
 * either coordinate lies outside the map. */
#define EXT_0_COORD_NO_OVERFLOW \
	if ((x | y) & ~(sizeAdjusted - 1)) { \
		continue; \
	} \
	localX = x; \
	localY = y;

/* Extended palettes: the map entry's palette field selects a 256-entry bank. */
#define EXT_0_EXT_PAL \
	paletteData = GBA_TEXT_MAP_PALETTE(mapData) << 8; \
	palette = &mainPalette[paletteData];

/* No extended palette: every tile uses mainPalette directly. */
#define EXT_0_PAL palette = mainPalette;

/* Fetches the pixel at the current coordinates: reads the 16-bit map entry,
 * selects the palette, applies the entry's flips and reads one byte of tile
 * data into pixelData. The pixel is skipped when either the screen block or
 * the character block is not mapped. */
#define EXT_0_NO_MOSAIC(COORD, PAL) \
	COORD \
	uint32_t screenBase = background->screenBase + (localX >> 10) + (((localY >> 6) & 0xFE0) << background->size); \
	uint16_t* screenBlock = renderer->d.vramBG[screenBase >> VRAM_BLOCK_OFFSET]; \
	if (UNLIKELY(!screenBlock)) { \
		continue; \
	} \
	LOAD_16(mapData, screenBase & (VRAM_BLOCK_MASK - 1), screenBlock); \
	PAL; \
	if (GBA_TEXT_MAP_VFLIP(mapData)) { \
		localY = 0x7FF - localY; \
	} \
	if (GBA_TEXT_MAP_HFLIP(mapData)) { \
		localX = 0x7FF - localX; \
	} \
	uint32_t charBase = (background->charBase + (GBA_TEXT_MAP_TILE(mapData) << 6)) + ((localY & 0x700) >> 5) + ((localX & 0x700) >> 8); \
	uint16_t* vram = renderer->d.vramBG[charBase >> VRAM_BLOCK_OFFSET]; \
	if (UNLIKELY(!vram)) { \
		continue; \
	} \
	pixelData = ((uint8_t*) vram)[charBase & VRAM_BLOCK_MASK];

/* Mosaic variant: fetch a fresh pixel only when the mosaic counter runs out,
 * otherwise keep the previously fetched pixelData. */
#define EXT_0_MOSAIC(COORD, PAL) \
		if (!mosaicWait) { \
			EXT_0_NO_MOSAIC(COORD, PAL) \
			mosaicWait = mosaicH; \
		} else { \
			--mosaicWait; \
		}

/* Walks the current window span, stepping the affine coordinates by dx/dy per
 * pixel, and composites every non-zero pixelData value. */
#define EXT_0_LOOP(MOSAIC, COORD, PAL, BLEND, OBJWIN) \
	for (outX = renderer->start, pixel = &renderer->row[outX]; outX < renderer->end; ++outX, ++pixel) { \
		x += background->dx; \
		y += background->dy; \
		\
		uint32_t current = *pixel; \
		MOSAIC(COORD, PAL) \
		if (pixelData) { \
			COMPOSITE_256_ ## OBJWIN (BLEND, 0); \
		} \
	}

/* Picks the loop specialization from three run-time conditions: whether an
 * extended palette is attached, whether the background wraps, and whether
 * horizontal mosaic is active (mosaicH > 1). */
#define DRAW_BACKGROUND_EXT_0(BLEND, OBJWIN) \
	if (background->extPalette) { \
		if (background->overflow) { \
			if (mosaicH > 1) { \
				EXT_0_LOOP(EXT_0_MOSAIC, EXT_0_COORD_OVERFLOW, EXT_0_EXT_PAL, BLEND, OBJWIN); \
			} else { \
				EXT_0_LOOP(EXT_0_NO_MOSAIC, EXT_0_COORD_OVERFLOW, EXT_0_EXT_PAL, BLEND, OBJWIN); \
			} \
		} else { \
			if (mosaicH > 1) { \
				EXT_0_LOOP(EXT_0_MOSAIC, EXT_0_COORD_NO_OVERFLOW, EXT_0_EXT_PAL, BLEND, OBJWIN); \
			} else { \
				EXT_0_LOOP(EXT_0_NO_MOSAIC, EXT_0_COORD_NO_OVERFLOW, EXT_0_EXT_PAL, BLEND, OBJWIN); \
			} \
		} \
	} else { \
		if (background->overflow) { \
			if (mosaicH > 1) { \
				EXT_0_LOOP(EXT_0_MOSAIC, EXT_0_COORD_OVERFLOW, EXT_0_PAL, BLEND, OBJWIN); \
			} else { \
				EXT_0_LOOP(EXT_0_NO_MOSAIC, EXT_0_COORD_OVERFLOW, EXT_0_PAL, BLEND, OBJWIN); \
			} \
		} else { \
			if (mosaicH > 1) { \
				EXT_0_LOOP(EXT_0_MOSAIC, EXT_0_COORD_NO_OVERFLOW, EXT_0_PAL, BLEND, OBJWIN); \
			} else { \
				EXT_0_LOOP(EXT_0_NO_MOSAIC, EXT_0_COORD_NO_OVERFLOW, EXT_0_PAL, BLEND, OBJWIN); \
			} \
		} \
	}
785
786void DSVideoSoftwareRendererDrawBackgroundExt0(struct GBAVideoSoftwareRenderer* renderer, struct GBAVideoSoftwareBackground* background, int inY) {
787	int sizeAdjusted = 0x8000 << background->size;
788
789	BACKGROUND_BITMAP_INIT;
790
791	color_t* mainPalette = background->extPalette;
792	if (variant) {
793		mainPalette = background->variantPalette;
794	}
795	if (!mainPalette) {
796		mainPalette = renderer->normalPalette;
797		if (variant) {
798			mainPalette = renderer->variantPalette;
799		}
800	}
801	int paletteData;
802
803	uint16_t mapData;
804	uint8_t pixelData = 0;
805
806	int outX;
807	uint32_t* pixel;
808
809	if (!objwinSlowPath) {
810		if (!(flags & FLAG_TARGET_2)) {
811			DRAW_BACKGROUND_EXT_0(NoBlend, NO_OBJWIN);
812		} else {
813			DRAW_BACKGROUND_EXT_0(Blend, NO_OBJWIN);
814		}
815	} else {
816		if (!(flags & FLAG_TARGET_2)) {
817			DRAW_BACKGROUND_EXT_0(NoBlend, OBJWIN);
818		} else {
819			DRAW_BACKGROUND_EXT_0(Blend, OBJWIN);
820		}
821	}
822}
823
/*
 * Per-pixel coordinate step shared by the bitmap background renderers.
 *
 * W, H - bitmap width and height in pixels. Both may be arbitrary
 *        expressions; they are parenthesised at every use so that
 *        low-precedence arguments (a ternary, a bitwise OR) are not
 *        re-associated with the surrounding operators.
 *
 * Advances x/y by the background's dx/dy, then either:
 *   - wraps them into the bitmap when background->overflow is set. The wrap
 *     is a bit mask, so it is only exact when W and H are powers of two; or
 *   - skips the pixel with `continue` when the position is negative or lies
 *     past the bitmap edge; or
 *   - passes x/y through to localX/localY unchanged.
 *
 * x and y are shifted right by 8 before being compared with W/H, i.e. they
 * are treated as having 8 fractional bits.
 *
 * Expands to bare statements because `continue` must act on the enclosing
 * per-pixel loop.
 */
#define DS_BACKGROUND_BITMAP_ITERATE(W, H) \
	x += background->dx; \
	y += background->dy; \
	\
	if (background->overflow) { \
		localX = x & (((W) << 8) - 1); \
		localY = y & (((H) << 8) - 1); \
	} else if (x < 0 || y < 0 || (x >> 8) >= (W) || (y >> 8) >= (H)) { \
		continue; \
	} else { \
		localX = x; \
		localY = y; \
	}
837
838void DSVideoSoftwareRendererDrawBackgroundExt1(struct GBAVideoSoftwareRenderer* renderer, struct GBAVideoSoftwareBackground* background, int inY) {
839	BACKGROUND_BITMAP_INIT;
840
841	uint32_t screenBase = (background->screenBase & 0xFF00) * 8;
842	uint8_t color;
843	int width, height;
844	switch (background->size) {
845	case 0:
846		width = 128;
847		height = 128;
848		break;
849	case 1:
850		width = 256;
851		height = 256;
852		break;
853	case 2:
854		width = 512;
855		height = 256;
856		break;
857	case 3:
858		width = 512;
859		height = 512;
860		break;
861	}
862
863	int outX;
864	for (outX = renderer->start; outX < renderer->end; ++outX) {
865		DS_BACKGROUND_BITMAP_ITERATE(width, height);
866
867		if (!mosaicWait) {
868			uint32_t address = (localX >> 8) + (localY >> 8) * width + screenBase;
869			uint8_t* vram = (uint8_t*) renderer->d.vramBG[address >> VRAM_BLOCK_OFFSET];
870			color = vram[address & VRAM_BLOCK_MASK];
871			mosaicWait = mosaicH;
872		} else {
873			--mosaicWait;
874		}
875
876		uint32_t current = renderer->row[outX];
877		if (color && IS_WRITABLE(current)) {
878			if (!objwinSlowPath) {
879				_compositeBlendNoObjwin(renderer, outX, palette[color] | flags, current);
880			} else if (objwinForceEnable || (!(current & FLAG_OBJWIN)) == objwinOnly) {
881				color_t* currentPalette = (current & FLAG_OBJWIN) ? objwinPalette : palette;
882				unsigned mergedFlags = flags;
883				if (current & FLAG_OBJWIN) {
884					mergedFlags = objwinFlags;
885				}
886				_compositeBlendObjwin(renderer, outX, currentPalette[color] | mergedFlags, current);
887			}
888		}
889	}
890}
891
892void DSVideoSoftwareRendererDrawBackgroundExt2(struct GBAVideoSoftwareRenderer* renderer, struct GBAVideoSoftwareBackground* background, int inY) {
893	BACKGROUND_BITMAP_INIT;
894
895	uint32_t screenBase = (background->screenBase & 0xFF00) * 4;
896	uint32_t color;
897	int width, height;
898	switch (background->size) {
899	case 0:
900		width = 128;
901		height = 128;
902		break;
903	case 1:
904		width = 256;
905		height = 256;
906		break;
907	case 2:
908		width = 512;
909		height = 256;
910		break;
911	case 3:
912		width = 512;
913		height = 512;
914		break;
915	}
916
917	int outX;
918	for (outX = renderer->start; outX < renderer->end; ++outX) {
919		DS_BACKGROUND_BITMAP_ITERATE(width, height);
920
921		if (!mosaicWait) {
922			uint32_t address = ((localX >> 8) + (localY >> 8) * width + screenBase) << 1;
923			uint16_t* vram = renderer->d.vramBG[address >> VRAM_BLOCK_OFFSET];
924			LOAD_16(color, address & VRAM_BLOCK_MASK, vram);
925#ifndef COLOR_16_BIT
926			unsigned color32;
927			color32 = 0;
928			color32 |= (color << 3) & 0xF8;
929			color32 |= (color << 6) & 0xF800;
930			color32 |= (color << 9) & 0xF80000;
931			color32 |= (color32 >> 5) & 0x070707;
932			color = color32;
933#elif COLOR_5_6_5
934			uint16_t color16 = 0;
935			color16 |= (color & 0x001F) << 11;
936			color16 |= (color & 0x03E0) << 1;
937			color16 |= (color & 0x7C00) >> 10;
938			color = color16;
939#endif
940			mosaicWait = mosaicH;
941		} else {
942			--mosaicWait;
943		}
944
945		uint32_t current = renderer->row[outX];
946		if (!objwinSlowPath || (!(current & FLAG_OBJWIN)) != objwinOnly) {
947			unsigned mergedFlags = flags;
948			if (current & FLAG_OBJWIN) {
949				mergedFlags = objwinFlags;
950			}
951			if (!variant) {
952				_compositeBlendObjwin(renderer, outX, color | mergedFlags, current);
953			} else if (renderer->blendEffect == BLEND_BRIGHTEN) {
954				_compositeBlendObjwin(renderer, outX, _brighten(color, renderer->bldy) | mergedFlags, current);
955			} else if (renderer->blendEffect == BLEND_DARKEN) {
956				_compositeBlendObjwin(renderer, outX, _darken(color, renderer->bldy) | mergedFlags, current);
957			}
958		}
959	}
960}