VRAM DMA during mode 3

This commit is contained in:
Lior Halphon 2022-01-16 13:50:59 +02:00
parent 3133687e68
commit b45761146f
3 changed files with 89 additions and 68 deletions

View File

@ -643,6 +643,23 @@ static void render_pixel_if_possible(GB_gameboy_t *gb)
gb->window_is_being_fetched = false; gb->window_is_being_fetched = false;
} }
/* Runs the DMA for the time that separates `*cycles` from `gb->display_cycles`.

   Does nothing unless GB_is_dma_active(gb) reports an active DMA and the two
   counters differ. Otherwise:
     - `*cycles` is overwritten with `gb->display_cycles`, so the same span is
       not handed to the DMA twice by a later call;
     - the span (8MHz ticks) is halved outside of CGB double speed mode to get
       T-cycles;
     - `gb->dma_cycles` temporarily holds only that span while GB_dma_run()
       executes, and afterwards is set to its previous value minus the span.

   NOTE(review): presumably called right before the PPU touches VRAM/OAM so the
   DMA state matches the PPU's position at that moment; confirm against callers. */
static inline void dma_sync(GB_gameboy_t *gb, unsigned *cycles)
{
    if (!unlikely(GB_is_dma_active(gb))) {
        return;
    }

    unsigned elapsed = *cycles - gb->display_cycles; // Time passed in 8MHz ticks
    if (elapsed == 0) {
        return;
    }
    *cycles = gb->display_cycles;

    // Convert to T-cycles (ticks are already T-cycles in double speed mode)
    unsigned t_cycles = gb->cgb_double_speed? elapsed : elapsed >> 1;

    unsigned pending = gb->dma_cycles;
    gb->dma_cycles = t_cycles;
    GB_dma_run(gb);
    gb->dma_cycles = pending - t_cycles;
}
/* All verified CGB timings are based on CGB CPU E. CGB CPUs >= D are known to have /* All verified CGB timings are based on CGB CPU E. CGB CPUs >= D are known to have
slightly different timings than CPUs <= C. slightly different timings than CPUs <= C.
@ -653,7 +670,21 @@ static inline uint8_t fetcher_y(GB_gameboy_t *gb)
return gb->wx_triggered? gb->window_y : gb->current_line + gb->io_registers[GB_IO_SCY]; return gb->wx_triggered? gb->window_y : gb->current_line + gb->io_registers[GB_IO_SCY];
} }
static void advance_fetcher_state_machine(GB_gameboy_t *gb) static inline uint8_t vram_read(GB_gameboy_t *gb, uint16_t addr)
{
if (unlikely(gb->vram_ppu_blocked)) {
return 0xFF;
}
if (unlikely(gb->dma_current_dest <= 0xa0 && gb->dma_current_dest > 0 && (gb->dma_current_src & 0xE000) == 0x8000)) { // TODO: what happens in the last and first M cycles?
// DMAing from VRAM!
/* TODO: This is only correct on a DMG/MGB, CGBs and AGBs use some other pattern; AGS has a completely different one */
addr |= ((gb->dma_current_src - 1) & 0x1FFF);
gb->oam[gb->dma_current_dest - 1] = gb->vram[addr];
}
return gb->vram[addr];
}
static void advance_fetcher_state_machine(GB_gameboy_t *gb, unsigned *cycles)
{ {
typedef enum { typedef enum {
GB_FETCHER_GET_TILE, GB_FETCHER_GET_TILE,
@ -675,6 +706,7 @@ static void advance_fetcher_state_machine(GB_gameboy_t *gb)
}; };
switch (fetcher_state_machine[gb->fetcher_state & 7]) { switch (fetcher_state_machine[gb->fetcher_state & 7]) {
case GB_FETCHER_GET_TILE: { case GB_FETCHER_GET_TILE: {
dma_sync(gb, cycles);
uint16_t map = 0x1800; uint16_t map = 0x1800;
if (!(gb->io_registers[GB_IO_LCDC] & 0x20)) { if (!(gb->io_registers[GB_IO_LCDC] & 0x20)) {
@ -707,23 +739,18 @@ static void advance_fetcher_state_machine(GB_gameboy_t *gb)
gb->fetcher_y = y; gb->fetcher_y = y;
} }
gb->last_tile_index_address = map + x + y / 8 * 32; gb->last_tile_index_address = map + x + y / 8 * 32;
gb->current_tile = gb->vram[gb->last_tile_index_address]; gb->current_tile = vram_read(gb, gb->last_tile_index_address);
if (gb->vram_ppu_blocked) {
gb->current_tile = 0xFF;
}
if (GB_is_cgb(gb)) { if (GB_is_cgb(gb)) {
/* The CGB actually accesses both the tile index AND the attributes in the same T-cycle. /* The CGB actually accesses both the tile index AND the attributes in the same T-cycle.
This probably means the CGB has a 16-bit data bus for the VRAM. */ This probably means the CGB has a 16-bit data bus for the VRAM. */
gb->current_tile_attributes = gb->vram[gb->last_tile_index_address + 0x2000]; gb->current_tile_attributes = vram_read(gb, gb->last_tile_index_address + 0x2000);
if (gb->vram_ppu_blocked) {
gb->current_tile_attributes = 0xFF;
}
} }
} }
gb->fetcher_state++; gb->fetcher_state++;
break; break;
case GB_FETCHER_GET_TILE_DATA_LOWER: { case GB_FETCHER_GET_TILE_DATA_LOWER: {
dma_sync(gb, cycles);
bool use_glitched = false; bool use_glitched = false;
bool cgb_d_glitch = false; bool cgb_d_glitch = false;
if (gb->tile_sel_glitch) { if (gb->tile_sel_glitch) {
@ -748,29 +775,22 @@ static void advance_fetcher_state_machine(GB_gameboy_t *gb)
} }
if (!use_glitched) { if (!use_glitched) {
gb->current_tile_data[0] = gb->current_tile_data[0] =
gb->vram[tile_address + ((y & 7) ^ y_flip) * 2]; vram_read(gb, tile_address + ((y & 7) ^ y_flip) * 2);
if (gb->vram_ppu_blocked) {
gb->current_tile_data[0] = 0xFF;
}
} }
if ((gb->io_registers[GB_IO_LCDC] & 0x10) && gb->tile_sel_glitch) { if ((gb->io_registers[GB_IO_LCDC] & 0x10) && gb->tile_sel_glitch) {
gb->data_for_sel_glitch = gb->data_for_sel_glitch =
gb->vram[tile_address + ((y & 7) ^ y_flip) * 2]; vram_read(gb, tile_address + ((y & 7) ^ y_flip) * 2);
if (gb->vram_ppu_blocked) {
gb->data_for_sel_glitch = 0xFF;
}
} }
else if (cgb_d_glitch) { else if (cgb_d_glitch) {
gb->data_for_sel_glitch = gb->vram[gb->current_tile * 0x10 + ((y & 7) ^ y_flip) * 2]; gb->data_for_sel_glitch = vram_read(gb, gb->current_tile * 0x10 + ((y & 7) ^ y_flip) * 2);
if (gb->vram_ppu_blocked) {
gb->data_for_sel_glitch = 0xFF;
}
} }
} }
gb->fetcher_state++; gb->fetcher_state++;
break; break;
case GB_FETCHER_GET_TILE_DATA_HIGH: { case GB_FETCHER_GET_TILE_DATA_HIGH: {
dma_sync(gb, cycles);
/* Todo: Verified for DMG (Tested: SGB2), CGB timing is wrong. */ /* Todo: Verified for DMG (Tested: SGB2), CGB timing is wrong. */
bool use_glitched = false; bool use_glitched = false;
@ -798,22 +818,15 @@ static void advance_fetcher_state_machine(GB_gameboy_t *gb)
gb->last_tile_data_address = tile_address + ((y & 7) ^ y_flip) * 2 + 1 - cgb_d_glitch; gb->last_tile_data_address = tile_address + ((y & 7) ^ y_flip) * 2 + 1 - cgb_d_glitch;
if (!use_glitched) { if (!use_glitched) {
gb->current_tile_data[1] = gb->current_tile_data[1] =
gb->vram[gb->last_tile_data_address]; vram_read(gb, gb->last_tile_data_address);
if (gb->vram_ppu_blocked) {
gb->current_tile_data[1] = 0xFF;
}
} }
if ((gb->io_registers[GB_IO_LCDC] & 0x10) && gb->tile_sel_glitch) { if ((gb->io_registers[GB_IO_LCDC] & 0x10) && gb->tile_sel_glitch) {
gb->data_for_sel_glitch = gb->vram[gb->last_tile_data_address]; gb->data_for_sel_glitch = vram_read(gb, gb->last_tile_data_address);
if (gb->vram_ppu_blocked) {
gb->data_for_sel_glitch = 0xFF;
}
} }
else if (cgb_d_glitch) { else if (cgb_d_glitch) {
gb->data_for_sel_glitch = gb->vram[gb->current_tile * 0x10 + ((y & 7) ^ y_flip) * 2 + 1]; gb->data_for_sel_glitch = vram_read(gb, gb->current_tile * 0x10 + ((y & 7) ^ y_flip) * 2 + 1);
if (gb->vram_ppu_blocked) {
gb->data_for_sel_glitch = 0xFF;
}
} }
} }
if (gb->wx_triggered) { if (gb->wx_triggered) {
@ -849,8 +862,8 @@ static inline uint8_t oam_read(GB_gameboy_t *gb, uint8_t addr)
if (unlikely(gb->oam_ppu_blocked)) { if (unlikely(gb->oam_ppu_blocked)) {
return 0xFF; return 0xFF;
} }
if (unlikely(gb->dma_current_dest > 0 && gb->dma_current_dest <= 0xa0)) { // TODO: what happens in the last and first M cycles? if (unlikely(gb->dma_current_dest <= 0xa0 && gb->dma_current_dest > 0)) { // TODO: what happens in the last and first M cycles?
return gb->oam[((gb->dma_current_dest - 1) & ~1) | (addr & 1)]; return gb->oam[((gb->dma_current_dest - 1) & ~1) | (addr & 1)];
} }
return gb->oam[addr]; return gb->oam[addr];
} }
@ -1574,7 +1587,7 @@ void GB_display_run(GB_gameboy_t *gb, unsigned cycles, bool force)
gb->objects_x[gb->n_visible_objs - 1] == (uint8_t)(gb->position_in_line + 8)) { gb->objects_x[gb->n_visible_objs - 1] == (uint8_t)(gb->position_in_line + 8)) {
while (gb->fetcher_state < 5 || fifo_size(&gb->bg_fifo) == 0) { while (gb->fetcher_state < 5 || fifo_size(&gb->bg_fifo) == 0) {
advance_fetcher_state_machine(gb); advance_fetcher_state_machine(gb, &cycles);
gb->cycles_for_line++; gb->cycles_for_line++;
GB_SLEEP(gb, display, 27, 1); GB_SLEEP(gb, display, 27, 1);
if (gb->object_fetch_aborted) { if (gb->object_fetch_aborted) {
@ -1595,7 +1608,7 @@ void GB_display_run(GB_gameboy_t *gb, unsigned cycles, bool force)
} }
/* TODO: Can this be deleted? { */ /* TODO: Can this be deleted? { */
advance_fetcher_state_machine(gb); advance_fetcher_state_machine(gb, &cycles);
gb->cycles_for_line++; gb->cycles_for_line++;
GB_SLEEP(gb, display, 41, 1); GB_SLEEP(gb, display, 41, 1);
if (gb->object_fetch_aborted) { if (gb->object_fetch_aborted) {
@ -1603,40 +1616,36 @@ void GB_display_run(GB_gameboy_t *gb, unsigned cycles, bool force)
} }
/* } */ /* } */
advance_fetcher_state_machine(gb); advance_fetcher_state_machine(gb, &cycles);
dma_sync(gb, &cycles);
gb->cycles_for_line += 3;
GB_SLEEP(gb, display, 20, 3);
if (gb->object_fetch_aborted) {
goto abort_fetching_object;
}
if (unlikely(GB_is_dma_active(gb))) {
unsigned offset = cycles - gb->display_cycles; // Time passed in 8MHz ticks
cycles = gb->display_cycles;
if (offset) {
if (!gb->cgb_double_speed) {
offset >>= 1; // Convert to T-cycles
}
unsigned old = gb->dma_cycles;
gb->dma_cycles = offset;
GB_dma_run(gb);
gb->dma_cycles += old - offset;
}
}
gb->object_low_line_address = get_object_line_address(gb, gb->object_low_line_address = get_object_line_address(gb,
gb->objects_y[gb->n_visible_objs - 1], gb->objects_y[gb->n_visible_objs - 1],
oam_read(gb, gb->visible_objs[gb->n_visible_objs - 1] * 4 + 2), oam_read(gb, gb->visible_objs[gb->n_visible_objs - 1] * 4 + 2),
gb->object_flags = oam_read(gb, gb->visible_objs[gb->n_visible_objs - 1] * 4 + 3) gb->object_flags = oam_read(gb, gb->visible_objs[gb->n_visible_objs - 1] * 4 + 3)
); );
gb->cycles_for_line += 1; gb->cycles_for_line += 2;
GB_SLEEP(gb, display, 39, 1); GB_SLEEP(gb, display, 20, 2);
if (gb->object_fetch_aborted) { if (gb->object_fetch_aborted) {
goto abort_fetching_object; goto abort_fetching_object;
} }
/* TODO: timing not verified */
dma_sync(gb, &cycles);
gb->object_tile_data[0] = vram_read(gb, gb->object_low_line_address);
gb->cycles_for_line += 2;
GB_SLEEP(gb, display, 39, 2);
if (gb->object_fetch_aborted) {
goto abort_fetching_object;
}
/* TODO: timing not verified */
dma_sync(gb, &cycles);
gb->object_tile_data[1] = vram_read(gb, gb->object_low_line_address + 1);
gb->during_object_fetch = false; gb->during_object_fetch = false;
gb->cycles_for_line++; gb->cycles_for_line++;
GB_SLEEP(gb, display, 40, 1); GB_SLEEP(gb, display, 40, 1);
@ -1647,8 +1656,8 @@ void GB_display_run(GB_gameboy_t *gb, unsigned cycles, bool force)
palette = gb->object_flags & 0x7; palette = gb->object_flags & 0x7;
} }
fifo_overlay_object_row(&gb->oam_fifo, fifo_overlay_object_row(&gb->oam_fifo,
gb->vram_ppu_blocked? 0xFF : gb->vram[gb->object_low_line_address], gb->object_tile_data[0],
gb->vram_ppu_blocked? 0xFF : gb->vram[gb->object_low_line_address + 1], gb->object_tile_data[1],
palette, palette,
gb->object_flags & 0x80, gb->object_flags & 0x80,
gb->object_priority == GB_OBJECT_PRIORITY_INDEX? gb->visible_objs[gb->n_visible_objs - 1] : 0, gb->object_priority == GB_OBJECT_PRIORITY_INDEX? gb->visible_objs[gb->n_visible_objs - 1] : 0,
@ -1663,7 +1672,7 @@ abort_fetching_object:
gb->during_object_fetch = false; gb->during_object_fetch = false;
render_pixel_if_possible(gb); render_pixel_if_possible(gb);
advance_fetcher_state_machine(gb); advance_fetcher_state_machine(gb, &cycles);
if (gb->position_in_line == 160) break; if (gb->position_in_line == 160) break;
gb->cycles_for_line++; gb->cycles_for_line++;

View File

@ -427,7 +427,8 @@ struct GB_gameboy_internal_s {
uint8_t dma_current_dest; uint8_t dma_current_dest;
uint8_t last_dma_read; uint8_t last_dma_read;
uint16_t dma_current_src; uint16_t dma_current_src;
int16_t dma_cycles; uint16_t dma_cycles;
int8_t dma_cycles_modulo;
uint8_t last_opcode_read; /* Required to emulate HDMA reads from Exxx */ uint8_t last_opcode_read; /* Required to emulate HDMA reads from Exxx */
bool hdma_starting; bool hdma_starting;
) )
@ -592,6 +593,7 @@ struct GB_gameboy_internal_s {
uint8_t visible_objs[10]; uint8_t visible_objs[10];
uint8_t objects_x[10]; uint8_t objects_x[10];
uint8_t objects_y[10]; uint8_t objects_y[10];
uint8_t object_tile_data[2];
uint8_t object_flags; uint8_t object_flags;
uint8_t n_visible_objs; uint8_t n_visible_objs;
uint8_t oam_search_index; uint8_t oam_search_index;

View File

@ -292,10 +292,16 @@ static uint8_t read_mbc_rom(GB_gameboy_t *gb, uint16_t addr)
static uint8_t read_vram(GB_gameboy_t *gb, uint16_t addr) static uint8_t read_vram(GB_gameboy_t *gb, uint16_t addr)
{ {
if (!GB_is_dma_active(gb)) { if (likely(!GB_is_dma_active(gb))) {
/* Prevent syncing from a DMA read. Batching doesn't happen during DMA anyway. */ /* Prevent syncing from a DMA read. Batching doesn't happen during DMA anyway. */
GB_display_sync(gb); GB_display_sync(gb);
} }
else {
if ((gb->dma_current_dest & 0xE000) == 0x8000) {
// TODO: verify conflict behavior
return gb->vram[(addr & 0x1FFF) + (gb->cgb_vram_bank? 0x2000 : 0)];
}
}
if (unlikely(gb->vram_read_blocked)) { if (unlikely(gb->vram_read_blocked)) {
return 0xFF; return 0xFF;
@ -1465,6 +1471,7 @@ static void write_high_memory(GB_gameboy_t *gb, uint16_t addr, uint8_t value)
case GB_IO_DMA: case GB_IO_DMA:
gb->dma_cycles = 0; gb->dma_cycles = 0;
gb->dma_cycles_modulo = 2;
gb->dma_current_dest = 0xFF; gb->dma_current_dest = 0xFF;
gb->dma_current_src = value << 8; gb->dma_current_src = value << 8;
gb->io_registers[GB_IO_DMA] = value; gb->io_registers[GB_IO_DMA] = value;
@ -1692,8 +1699,9 @@ bool GB_is_dma_active(GB_gameboy_t *gb)
void GB_dma_run(GB_gameboy_t *gb) void GB_dma_run(GB_gameboy_t *gb)
{ {
if (gb->dma_current_dest == 0xa1) return; if (gb->dma_current_dest == 0xa1) return;
while (unlikely(gb->dma_cycles >= 4)) { signed cycles = gb->dma_cycles + gb->dma_cycles_modulo;
gb->dma_cycles -= 4; while (unlikely(cycles >= 4)) {
cycles -= 4;
if (gb->dma_current_dest >= 0xa0) { if (gb->dma_current_dest >= 0xa0) {
gb->dma_current_dest++; gb->dma_current_dest++;
break; break;
@ -1713,6 +1721,8 @@ void GB_dma_run(GB_gameboy_t *gb)
/* dma_current_src must be the correct value during GB_read_memory */ /* dma_current_src must be the correct value during GB_read_memory */
gb->dma_current_src++; gb->dma_current_src++;
} }
gb->dma_cycles_modulo = cycles;
gb->dma_cycles = 0;
} }
void GB_hdma_run(GB_gameboy_t *gb) void GB_hdma_run(GB_gameboy_t *gb)