picodrive/pico/videoport.c

1059 lines
31 KiB
C

/*
* PicoDrive
* (c) Copyright Dave, 2004
* (C) notaz, 2006-2009
* (C) kub, 2020
*
* This work is licensed under the terms of MAME license.
* See COPYING file in the top-level directory.
*/
#include "pico_int.h"
#define NEED_DMA_SOURCE
#include "memory.h"
extern const unsigned char hcounts_32[];
extern const unsigned char hcounts_40[];
static int blankline; // display disabled for this line
static unsigned sat; // VRAM addr of sprite attribute table
static int satxbits; // index bits in SAT address
int (*PicoDmaHook)(unsigned int source, int len, unsigned short **base, unsigned int *mask) = NULL;
/* VDP FIFO implementation
*
* fifo_slot: last slot executed in this scanline
* fifo_cnt: #slots remaining for active FIFO write (#writes<<#bytep)
* fifo_total: #total FIFO entries pending
* fifo_data: last values transferred through fifo
* fifo_queue: fifo transfer queue (#writes, flags)
*
* FIFO states: empty total=0
* inuse total>0 && total<4
* full total==4
* wait total>4
* Conditions:
* fifo_slot is always behind slot2cyc[cycles]. Advancing it beyond cycles
* implies blocking the 68k up to that slot.
*
* A FIFO write goes to the end of the FIFO queue, but DMA running in background
* is always the last queue entry (transfers by CPU intervene and come 1st).
* There can be more pending writes than FIFO slots, but the CPU will be blocked
* until FIFO level (without background DMA) <= 4.
* This is only about correct timing, data xfer must be handled by the caller.
* Blocking the CPU means burning cycles via SekCyclesBurn*(), which is to be
* executed by the caller.
*
* FIFOSync "executes" FIFO write slots up to the given cycle in the current
* scanline. A queue entry completely executed is removed from the queue.
* FIFOWrite pushes writes to the transfer queue. If it's a blocking write, 68k
* is blocked if more than 4 FIFO writes are pending.
* FIFORead executes a 68k read. 68k is blocked until the next transfer slot.
*/
// mapping between slot# and 68k cycles in a blanked scanline [H32, H40]
static const int vdpcyc2sl_bl[] = { (166<<16)/488, (204<<16)/488 };
static const int vdpsl2cyc_bl[] = { (488<<16)/166, (488<<16)/204 };
// VDP transfer slots in active display 32col mode. 1 slot is 488/171 = 2.8538
// 68k cycles. Only 16 of the 171 slots in a scanline can be used by CPU/DMA:
// (HINT=slot 0): 11,25,40,48,56,72,80,88,104,112,120,136,144,152,167,168
static const unsigned char vdpcyc2sl_32[] = { // 68k cycles/4 to slot #
// 4 8 12 16 20 24 28 32 36 40 44 48 52 56 60
0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3,
3, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 5, 5, 5,
5, 5, 5, 6, 6, 6, 6, 6, 7, 7, 7, 7, 7, 7, 8, 8,
8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 9, 9, 9, 9, 9,10,
10,10,10,10,10,11,11,11,11,11,11,11,11,11,11,11,
11,12,12,12,12,12,13,13,13,13,13,13,14,14,14,14,
14,14,14,14,14,14,14,15,16,16,16,16,16,16,16,16,
};
static const unsigned char vdpsl2cyc_32[] = { // slot # to 68k cycles/4
0, 8, 18, 28, 33, 39, 51, 56, 62, 74, 79, 85, 97,102,108,119,120,130
};
// VDP transfer slots in active display 40col mode. 1 slot is 488/210 = 2.3238
// 68k cycles. Only 18 of the 210 slots in a scanline can be used by CPU/DMA:
// (HINT=0): 21,47,55,63,79,87,95,111,119,127,143,151,159,175,183,191,206,207,
static const unsigned char vdpcyc2sl_40[] = { // 68k cycles/4 to slot #
// 4 8 12 16 20 24 28 32 36 40 44 48 52 56 60
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2,
3, 3, 3, 3, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 5, 5,
5, 5, 6, 6, 6, 6, 6, 7, 7, 7, 7, 7, 7, 7, 7, 7,
8, 8, 8, 8, 8, 9, 9, 9, 9,10,10,10,10,10,10,10,
10,10,10,11,11,11,11,12,12,12,12,12,13,13,13,13,
13,13,13,13,13,14,14,14,14,14,15,15,15,15,15,16,
16,16,16,16,16,16,16,17,18,18,18,18,18,18,18,18,
};
static const unsigned char vdpsl2cyc_40[] = { // slot # to 68k cycles/4
0, 12, 27, 32, 36, 46, 50, 55, 64, 69, 73, 83, 87, 92,101,106,111,119,120,134
};
// NB code assumes fifo_* arrays have size 2^n
// last transferred FIFO data, ...x = index XXX currently only CPU
static short fifo_data[4], fifo_dx; // XXX must go into save?
// queued FIFO transfers, ...x = index, ...l = queue length
// each entry has 2 values: [n]>>3 = #writes, [n]&7 = flags
static int fifo_queue[8], fifo_qx, fifo_ql; // XXX must go into save?
enum { FQ_BYTE = 1, FQ_BGDMA = 2, FQ_FGDMA = 4 }; // queue flags, NB: BYTE = 1!
static unsigned int fifo_total; // total# of pending FIFO entries (w/o BGDMA)
static unsigned short fifo_slot; // last executed slot in current scanline
// map cycles to FIFO slot
static __inline int GetFIFOSlot(struct PicoVideo *pv, int cycles)
{
int active = !(pv->status & SR_VB) && (pv->reg[1] & 0x40);
int h40 = pv->reg[12] & 1;
if (active) return (h40 ? vdpcyc2sl_40 : vdpcyc2sl_32)[cycles/4];
else return (cycles * vdpcyc2sl_bl[h40] + cycles) >> 16;
}
// map FIFO slot to cycles
static __inline int GetFIFOCycles(struct PicoVideo *pv, int slot)
{
int active = !(pv->status & SR_VB) && (pv->reg[1] & 0x40);
int h40 = pv->reg[12] & 1;
if (active) return (h40 ? vdpsl2cyc_40 : vdpsl2cyc_32)[slot]*4;
else return ((slot * vdpsl2cyc_bl[h40] + slot) >> 16);
}
// do the FIFO math
static __inline int AdvanceFIFOEntry(struct PicoVideo *pv, int slots)
{
int l = slots, b = fifo_queue[fifo_qx] & FQ_BYTE;
// advance currently active FIFO entry
if (l > pv->fifo_cnt)
l = pv->fifo_cnt;
if (!(fifo_queue[fifo_qx] & FQ_BGDMA))
fifo_total -= ((pv->fifo_cnt & b) + l) >> b;
pv->fifo_cnt -= l;
// if entry has been processed...
if (pv->fifo_cnt == 0) {
if (fifo_ql) {
// terminate DMA if applicable
if ((pv->status & SR_DMA) && (fifo_queue[fifo_qx] & FQ_BGDMA)) {
pv->status &= ~SR_DMA;
pv->command &= ~0x80;
}
// remove entry from FIFO
fifo_qx ++, fifo_qx &= 7, fifo_ql --;
}
// start processing for next entry if there is one
if (fifo_ql)
pv->fifo_cnt= (fifo_queue[fifo_qx] >> 3) << (fifo_queue[fifo_qx] & FQ_BYTE);
else
fifo_total = 0;
}
return l;
}
static __inline void SetFIFOState(struct PicoVideo *pv)
{
// release CPU and terminate DMA if FIFO isn't blocking the 68k anymore
if (fifo_total == 0)
pv->status &= ~PVS_CPURD;
if (fifo_total <= 4) {
int x = (fifo_qx + fifo_ql - 1) & 7;
if ((pv->status & SR_DMA) && !(pv->status & PVS_DMAFILL) &&
(!fifo_ql || !(fifo_queue[x] & FQ_BGDMA))) {
pv->status &= ~SR_DMA;
pv->command &= ~0x80;
}
pv->status &= ~PVS_CPUWR;
}
}
// sync FIFO to cycles
void PicoVideoFIFOSync(int cycles)
{
struct PicoVideo *pv = &Pico.video;
int slots, done;
// calculate #slots since last executed slot
slots = GetFIFOSlot(pv, cycles) - fifo_slot;
// advance FIFO queue by #done slots
done = slots;
while (done > 0 && pv->fifo_cnt) {
int l = AdvanceFIFOEntry(pv, done);
fifo_slot += l;
done -= l;
}
SetFIFOState(pv);
}
// drain FIFO, blocking 68k on the way. FIFO must be synced prior to drain.
int PicoVideoFIFODrain(int level, int cycles, int bgdma)
{
struct PicoVideo *pv = &Pico.video;
int maxsl = GetFIFOSlot(pv, 488); // max xfer slots in this scanline
int burn = 0;
// process FIFO entries until low level is reached
while (fifo_total > level && fifo_slot < maxsl &&
(!(fifo_queue[fifo_qx] & FQ_BGDMA) || bgdma)) {
int b = fifo_queue[fifo_qx] & FQ_BYTE;
int cnt = ((fifo_total-level) << b) - (pv->fifo_cnt & b);
int last = fifo_slot;
int slot = (pv->fifo_cnt < cnt ? pv->fifo_cnt : cnt) + last; // target slot
unsigned ocyc = cycles;
if (slot > maxsl) {
// target in later scanline, advance to eol
slot = maxsl;
cycles = 488;
} else {
// advance FIFO to target slot and CPU to cycles at that slot
cycles = GetFIFOCycles(pv, slot);
}
fifo_slot = slot;
burn += cycles - ocyc;
AdvanceFIFOEntry(pv, slot - last);
}
SetFIFOState(pv);
return burn;
}
// read VDP data port
int PicoVideoFIFORead(void)
{
struct PicoVideo *pv = &Pico.video;
int lc = SekCyclesDone()-Pico.t.m68c_line_start;
int burn = 0;
PicoVideoFIFOSync(lc);
// advance FIFO and CPU until FIFO is empty
burn = PicoVideoFIFODrain(0, lc, 1);
lc += burn;
if (fifo_total > 0)
pv->status |= PVS_CPURD; // target slot is in later scanline
else {
// use next VDP access slot for reading, block 68k until then
fifo_slot = GetFIFOSlot(pv, lc) + 1;
burn += GetFIFOCycles(pv, fifo_slot) - lc;
}
return burn;
}
// write VDP data port
int PicoVideoFIFOWrite(int count, int flags, unsigned sr_mask,unsigned sr_flags)
{
struct PicoVideo *pv = &Pico.video;
int lc = SekCyclesDone()-Pico.t.m68c_line_start;
int burn = 0, x;
PicoVideoFIFOSync(lc);
pv->status = (pv->status & ~sr_mask) | sr_flags;
if (count && fifo_ql < 8) {
// update FIFO state if it was empty
if (fifo_ql == 0) {
fifo_slot = GetFIFOSlot(pv, lc+9); // FIFO latency ~3 vdp slots
pv->fifo_cnt = count << (flags & FQ_BYTE);
}
// create xfer queue entry
x = (fifo_qx + fifo_ql - 1) & 7;
if (fifo_ql && (fifo_queue[x] & FQ_BGDMA)) {
// CPU FIFO writes have priority over a background DMA Fill/Copy
fifo_queue[(x+1) & 7] = fifo_queue[x];
if (fifo_ql == 1) {
// XXX if interrupting a DMA fill, fill data changes
int f = fifo_queue[x] & 7;
fifo_queue[(x+1) & 7] = (pv->fifo_cnt >> (f & FQ_BYTE) << 3) | f;
pv->fifo_cnt = count << (flags & FQ_BYTE);
}
} else
x = (x+1) & 7;
fifo_queue[x] = (count << 3) | flags;
fifo_ql ++;
if (!(flags & FQ_BGDMA))
fifo_total += count;
}
// if CPU is waiting for the bus, advance CPU and FIFO until bus is free
if (pv->status & PVS_CPUWR)
burn = PicoVideoFIFODrain(4, lc, 0);
return burn;
}
// at HINT, advance FIFO to new scanline
int PicoVideoFIFOHint(void)
{
struct PicoVideo *pv = &Pico.video;
int burn = 0;
// reset slot to start of scanline
fifo_slot = 0;
// if CPU is waiting for the bus, advance CPU and FIFO until bus is free
if (pv->status & PVS_CPURD)
burn = PicoVideoFIFORead();
else if (pv->status & PVS_CPUWR)
burn = PicoVideoFIFOWrite(0, 0, 0, 0);
return burn;
}
// switch FIFO mode between active/inactive display
static void PicoVideoFIFOMode(int active)
{
struct PicoVideo *pv = &Pico.video;
int h40 = pv->reg[12] & 1;
int lc = SekCyclesDone() - Pico.t.m68c_line_start;
PicoVideoFIFOSync(lc);
if (fifo_ql) {
// recalculate FIFO slot for new mode
if (!(pv->status & SR_VB) && active)
fifo_slot = (pv->reg[12]&1 ? vdpcyc2sl_40 : vdpcyc2sl_32)[lc/4];
else fifo_slot = ((lc * vdpcyc2sl_bl[h40] + lc) >> 16);
}
}
// VDP memory rd/wr
static __inline void AutoIncrement(void)
{
Pico.video.addr=(unsigned short)(Pico.video.addr+Pico.video.reg[0xf]);
if (Pico.video.addr < Pico.video.reg[0xf]) Pico.video.addr_u ^= 1;
}
static __inline void UpdateSAT(u32 a, u32 d)
{
Pico.est.rendstatus |= PDRAW_DIRTY_SPRITES;
if (!(a & 4)) {
int num = (a-sat) >> 3;
((u16 *)&VdpSATCache[num])[(a&3) >> 1] = d;
}
}
static NOINLINE void VideoWriteVRAM128(u32 a, u16 d)
{
// nasty
u32 b = ((a & 2) >> 1) | ((a & 0x400) >> 9) | (a & 0x3FC) | ((a & 0x1F800) >> 1);
((u8 *)PicoMem.vram)[b] = d;
if (!((u16)(b^sat) >> satxbits))
Pico.est.rendstatus |= PDRAW_DIRTY_SPRITES;
if (!((u16)(a^sat) >> satxbits))
UpdateSAT(a, d);
}
static void VideoWriteVRAM(u32 a, u16 d)
{
PicoMem.vram [(u16)a >> 1] = d;
if (!((u16)(a^sat) >> satxbits))
UpdateSAT(a, d);
}
static void VideoWrite(u16 d)
{
unsigned int a = Pico.video.addr;
switch (Pico.video.type)
{
case 1: if (a & 1)
d = (u16)((d << 8) | (d >> 8));
a |= Pico.video.addr_u << 16;
VideoWriteVRAM(a, d);
break;
case 3: if (PicoMem.cram [(a >> 1) & 0x3f] != d) Pico.m.dirtyPal = 1;
PicoMem.cram [(a >> 1) & 0x3f] = d & 0xeee; break;
case 5: PicoMem.vsram[(a >> 1) & 0x3f] = d & 0x7ff; break;
case 0x81:
a |= Pico.video.addr_u << 16;
VideoWriteVRAM128(a, d);
break;
//default:elprintf(EL_ANOMALY, "VDP write %04x with bad type %i", d, Pico.video.type); break;
}
AutoIncrement();
}
static unsigned int VideoRead(void)
{
unsigned int a, d = fifo_data[(fifo_dx+1)&3];
a=Pico.video.addr; a>>=1;
SekCyclesBurnRun(PicoVideoFIFORead());
switch (Pico.video.type)
{
case 0: d=PicoMem.vram [a & 0x7fff]; break;
case 8: d=PicoMem.cram [a & 0x003f] | (d & ~0x0eee); break;
case 4: if ((a & 0x3f) >= 0x28) a = 0;
d=PicoMem.vsram [a & 0x003f] | (d & ~0x07ff); break;
case 12:a=PicoMem.vram [a & 0x7fff]; if (Pico.video.addr&1) a >>= 8;
d=(a & 0x00ff) | (d & ~0x00ff); break;
default:elprintf(EL_ANOMALY, "VDP read with bad type %i", Pico.video.type); break;
}
AutoIncrement();
return d;
}
// VDP DMA
static int GetDmaLength(void)
{
struct PicoVideo *pvid=&Pico.video;
int len=0;
// 16-bit words to transfer:
len =pvid->reg[0x13];
len|=pvid->reg[0x14]<<8;
len = ((len - 1) & 0xffff) + 1;
return len;
}
static void DmaSlow(int len, unsigned int source)
{
u32 inc = Pico.video.reg[0xf];
u32 a = Pico.video.addr | (Pico.video.addr_u << 16);
u16 *r, *base = NULL;
u32 mask = 0x1ffff;
elprintf(EL_VDPDMA, "DmaSlow[%i] %06x->%04x len %i inc=%i blank %i [%u] @ %06x",
Pico.video.type, source, a, len, inc, (Pico.video.status&SR_VB)||!(Pico.video.reg[1]&0x40),
SekCyclesDone(), SekPc);
SekCyclesBurnRun(PicoVideoFIFOWrite(len, FQ_FGDMA | (Pico.video.type == 1),
0, SR_DMA| PVS_CPUWR));
if ((source & 0xe00000) == 0xe00000) { // Ram
base = (u16 *)PicoMem.ram;
mask = 0xffff;
}
else if (PicoIn.AHW & PAHW_MCD)
{
u8 r3 = Pico_mcd->s68k_regs[3];
elprintf(EL_VDPDMA, "DmaSlow CD, r3=%02x", r3);
if (source < 0x20000) { // Bios area
base = (u16 *)Pico_mcd->bios;
} else if ((source & 0xfc0000) == 0x200000) { // Word Ram
if (!(r3 & 4)) { // 2M mode
base = (u16 *)(Pico_mcd->word_ram2M + (source & 0x20000));
} else {
if (source < 0x220000) { // 1M mode
int bank = r3 & 1;
base = (u16 *)(Pico_mcd->word_ram1M[bank]);
} else {
DmaSlowCell(source - 2, a, len, inc);
return;
}
}
source -= 2;
} else if ((source & 0xfe0000) == 0x020000) { // Prg Ram
base = (u16 *)Pico_mcd->prg_ram_b[r3 >> 6];
source -= 2; // XXX: test
}
}
else
{
// if we have DmaHook, let it handle ROM because of possible DMA delay
u32 source2;
if (PicoDmaHook && (source2 = PicoDmaHook(source, len, &base, &mask)))
source = source2;
else // Rom
base = m68k_dma_source(source);
}
if (!base) {
elprintf(EL_VDPDMA|EL_ANOMALY, "DmaSlow[%i] %06x->%04x: invalid src", Pico.video.type, source, a);
return;
}
// operate in words
source >>= 1;
mask >>= 1;
switch (Pico.video.type)
{
case 1: // vram
#if 0
r = PicoMem.vram;
if (inc == 2 && !(a & 1) && (a >> 16) == ((a + len*2) >> 16) &&
(source & ~mask) == ((source + len-1) & ~mask) &&
(a << 16 >= (sat+0x280) << 16 || (a + len*2) << 16 <= sat << 16))
{
// most used DMA mode
memcpy((char *)r + a, base + (source & mask), len * 2);
a += len * 2;
}
else
#endif
{
for(; len; len--)
{
u16 d = base[source++ & mask];
if(a & 1) d=(d<<8)|(d>>8);
VideoWriteVRAM(a, d);
// AutoIncrement
a = (a+inc) & ~0x20000;
}
}
break;
case 3: // cram
Pico.m.dirtyPal = 1;
r = PicoMem.cram;
for (; len; len--)
{
r[(a / 2) & 0x3f] = base[source++ & mask] & 0xeee;
// AutoIncrement
a = (a+inc) & ~0x20000;
}
break;
case 5: // vsram
r = PicoMem.vsram;
for (; len; len--)
{
r[(a / 2) & 0x3f] = base[source++ & mask] & 0x7ff;
// AutoIncrement
a = (a+inc) & ~0x20000;
}
break;
case 0x81: // vram 128k
for(; len; len--)
{
u16 d = base[source++ & mask];
VideoWriteVRAM128(a, d);
// AutoIncrement
a = (a+inc) & ~0x20000;
}
break;
default:
if (Pico.video.type != 0 || (EL_LOGMASK & EL_VDPDMA))
elprintf(EL_VDPDMA|EL_ANOMALY, "DMA with bad type %i", Pico.video.type);
break;
}
// remember addr
Pico.video.addr = a;
Pico.video.addr_u = a >> 16;
}
static void DmaCopy(int len)
{
u32 a = Pico.video.addr | (Pico.video.addr_u << 16);
u8 *vr = (u8 *)PicoMem.vram;
u8 inc = Pico.video.reg[0xf];
int source;
elprintf(EL_VDPDMA, "DmaCopy len %i [%u]", len, SekCyclesDone());
SekCyclesBurnRun(PicoVideoFIFOWrite(len, FQ_BGDMA | FQ_BYTE,
PVS_CPUWR, SR_DMA));
source =Pico.video.reg[0x15];
source|=Pico.video.reg[0x16]<<8;
// XXX implement VRAM 128k? Is this even working? count still in bytes?
for (; len; len--)
{
vr[(u16)a] = vr[(u16)(source++)];
if (!((u16)(a^sat) >> satxbits))
UpdateSAT(a, ((u16 *)vr)[(u16)a >> 1]);
// AutoIncrement
a = (a+inc) & ~0x20000;
}
// remember addr
Pico.video.addr = a;
Pico.video.addr_u = a >> 16;
}
static NOINLINE void DmaFill(int data)
{
u32 a = Pico.video.addr | (Pico.video.addr_u << 16);
u8 *vr = (u8 *)PicoMem.vram;
u8 high = (u8)(data >> 8);
u8 inc = Pico.video.reg[0xf];
int source;
int len, l;
len = GetDmaLength();
elprintf(EL_VDPDMA, "DmaFill len %i inc %i [%u]", len, inc, SekCyclesDone());
SekCyclesBurnRun(PicoVideoFIFOWrite(len, FQ_BGDMA | (Pico.video.type == 1),
PVS_CPUWR | PVS_DMAFILL, SR_DMA));
switch (Pico.video.type)
{
case 1: // vram
for (l = len; l; l--) {
// Write upper byte to adjacent address
// (here we are byteswapped, so address is already 'adjacent')
vr[(u16)a] = high;
if (!((u16)(a^sat) >> satxbits))
UpdateSAT(a, ((u16 *)vr)[(u16)a >> 1]);
// Increment address register
a = (a+inc) & ~0x20000;
}
break;
case 3: // cram
Pico.m.dirtyPal = 1;
data &= 0xeee;
for (l = len; l; l--) {
PicoMem.cram[(a/2) & 0x3f] = data;
// Increment address register
a = (a+inc) & ~0x20000;
}
break;
case 5: { // vsram
data &= 0x7ff;
for (l = len; l; l--) {
PicoMem.vsram[(a/2) & 0x3f] = data;
// Increment address register
a = (a+inc) & ~0x20000;
}
break;
}
case 0x81: // vram 128k
for (l = len; l; l--) {
VideoWriteVRAM128(a, data);
// Increment address register
a = (a+inc) & ~0x20000;
}
break;
default:
a += len * inc;
break;
}
// remember addr
Pico.video.addr = a;
Pico.video.addr_u = a >> 16;
// register update
Pico.video.reg[0x13] = Pico.video.reg[0x14] = 0;
source = Pico.video.reg[0x15];
source |= Pico.video.reg[0x16] << 8;
source += len;
Pico.video.reg[0x15] = source;
Pico.video.reg[0x16] = source >> 8;
}
// VDP command handling
static NOINLINE void CommandDma(void)
{
struct PicoVideo *pvid=&Pico.video;
u32 len, method;
u32 source;
PicoVideoFIFOSync(SekCyclesDone()-Pico.t.m68c_line_start);
if (pvid->status & SR_DMA) {
elprintf(EL_VDPDMA, "Dma overlap, left=%d @ %06x",
fifo_total, SekPc);
pvid->fifo_cnt = fifo_total = fifo_ql = 0;
}
len = GetDmaLength();
source =Pico.video.reg[0x15];
source|=Pico.video.reg[0x16] << 8;
source|=Pico.video.reg[0x17] << 16;
method=pvid->reg[0x17]>>6;
if (method < 2)
DmaSlow(len, source << 1); // 68000 to VDP
else if (method == 3)
DmaCopy(len); // VRAM Copy
else {
pvid->status |= SR_DMA|PVS_DMAFILL;
return;
}
source += len;
Pico.video.reg[0x13] = Pico.video.reg[0x14] = 0;
Pico.video.reg[0x15] = source;
Pico.video.reg[0x16] = source >> 8;
}
static NOINLINE void CommandChange(void)
{
struct PicoVideo *pvid = &Pico.video;
unsigned int cmd, addr;
cmd = pvid->command;
// Get type of transfer 0xc0000030 (v/c/vsram read/write)
pvid->type = (u8)(((cmd >> 2) & 0xc) | (cmd >> 30));
if (pvid->type == 1) // vram
pvid->type |= pvid->reg[1] & 0x80; // 128k
// Get address 0x3fff0003
addr = (cmd >> 16) & 0x3fff;
addr |= (cmd << 14) & 0xc000;
pvid->addr = (u16)addr;
pvid->addr_u = (u8)((cmd >> 2) & 1);
}
// VDP interface
static void DrawSync(int skip)
{
int lines = Pico.video.reg[1]&0x08 ? 240 : 224;
int last = Pico.m.scanline - (skip || blankline == Pico.m.scanline);
if (last < lines && !(PicoIn.opt & POPT_ALT_RENDERER) &&
!PicoIn.skipFrame && Pico.est.DrawScanline <= last) {
//elprintf(EL_ANOMALY, "sync");
if (blankline >= 0 && blankline < last) {
PicoDrawSync(blankline, 1);
blankline = -1;
}
PicoDrawSync(last, 0);
}
}
PICO_INTERNAL_ASM void PicoVideoWrite(unsigned int a,unsigned short d)
{
struct PicoVideo *pvid=&Pico.video;
//elprintf(EL_STATUS, "PicoVideoWrite [%06x] %04x [%u] @ %06x",
// a, d, SekCyclesDone(), SekPc);
a &= 0x1c;
switch (a)
{
case 0x00: // Data port 0 or 2
// try avoiding the sync..
if (Pico.m.scanline < (pvid->reg[1]&0x08 ? 240 : 224) && (pvid->reg[1]&0x40) &&
!(!pvid->pending &&
((pvid->command & 0xc00000f0) == 0x40000010 && PicoMem.vsram[pvid->addr>>1] == (d & 0x7ff)))
)
DrawSync(0); // XXX it's unclear when vscroll data is fetched from vsram?
if (pvid->pending) {
CommandChange();
pvid->pending=0;
}
if (!(PicoIn.opt&POPT_DIS_VDP_FIFO))
{
fifo_data[++fifo_dx&3] = d;
SekCyclesBurnRun(PicoVideoFIFOWrite(1, pvid->type == 1, 0, PVS_CPUWR));
elprintf(EL_ASVDP, "VDP data write: [%04x] %04x [%u] {%i} @ %06x",
Pico.video.addr, d, SekCyclesDone(), Pico.video.type, SekPc);
}
VideoWrite(d);
// start DMA fill on write. NB VSRAM and CRAM fills use wrong FIFO data.
if (pvid->status & PVS_DMAFILL)
DmaFill(fifo_data[(fifo_dx + !!(pvid->type&~0x81))&3]);
break;
case 0x04: // Control (command) port 4 or 6
if (pvid->status & SR_DMA)
SekCyclesBurnRun(PicoVideoFIFORead()); // kludge, flush out running DMA
if (pvid->pending)
{
// Low word of command:
if (!(pvid->reg[1]&0x10))
d = (d&~0x80)|(pvid->command&0x80);
pvid->command &= 0xffff0000;
pvid->command |= d;
pvid->pending = 0;
CommandChange();
// Check for dma:
if (d & 0x80) {
DrawSync(SekCyclesDone() - Pico.t.m68c_line_start <= 488-390);
CommandDma();
}
}
else
{
if ((d&0xc000)==0x8000)
{
// Register write:
int num=(d>>8)&0x1f;
int dold=pvid->reg[num];
pvid->type=0; // register writes clear command (else no Sega logo in Golden Axe II)
if (num > 0x0a && !(pvid->reg[1]&4)) {
elprintf(EL_ANOMALY, "%02x written to reg %02x in SMS mode @ %06x", d, num, SekPc);
return;
}
if (num == 0 && !(pvid->reg[0]&2) && (d&2))
pvid->hv_latch = PicoVideoRead(0x08);
if (num == 1 && ((pvid->reg[1]^d)&0x40)) {
PicoVideoFIFOMode(d & 0x40);
// handle line blanking before line rendering
if (SekCyclesDone() - Pico.t.m68c_line_start <= 488-390)
blankline = d&0x40 ? -1 : Pico.m.scanline;
}
DrawSync(SekCyclesDone() - Pico.t.m68c_line_start <= 488-390);
pvid->reg[num]=(unsigned char)d;
switch (num)
{
case 0x00:
elprintf(EL_INTSW, "hint_onoff: %i->%i [%u] pend=%i @ %06x", (dold&0x10)>>4,
(d&0x10)>>4, SekCyclesDone(), (pvid->pending_ints&0x10)>>4, SekPc);
goto update_irq;
case 0x01:
elprintf(EL_INTSW, "vint_onoff: %i->%i [%u] pend=%i @ %06x", (dold&0x20)>>5,
(d&0x20)>>5, SekCyclesDone(), (pvid->pending_ints&0x20)>>5, SekPc);
if (!(pvid->status & PVS_VB2))
pvid->status &= ~SR_VB;
pvid->status |= ((d >> 3) ^ SR_VB) & SR_VB; // forced blanking
goto update_irq;
case 0x05:
case 0x06:
if (d^dold) Pico.est.rendstatus |= PDRAW_SPRITES_MOVED;
break;
case 0x0c:
// renderers should update their palettes if sh/hi mode is changed
if ((d^dold)&8) Pico.m.dirtyPal = 1;
break;
default:
return;
}
sat = ((pvid->reg[5]&0x7f) << 9) | ((pvid->reg[6]&0x20) << 11);
satxbits = 9;
if (Pico.video.reg[12]&1)
sat &= ~0x200, satxbits = 10; // H40, zero lowest SAT bit
//elprintf(EL_STATUS, "spritep moved to %04x", sat);
return;
update_irq:
#ifndef EMU_CORE_DEBUG
// update IRQ level
if (!SekShouldInterrupt()) // hack
{
int lines, pints, irq = 0;
lines = (pvid->reg[1] & 0x20) | (pvid->reg[0] & 0x10);
pints = pvid->pending_ints & lines;
if (pints & 0x20) irq = 6;
else if (pints & 0x10) irq = 4;
SekInterrupt(irq); // update line
// this is broken because cost of current insn isn't known here
if (irq) SekEndRun(21); // make it delayed
}
#endif
}
else
{
// High word of command:
pvid->command&=0x0000ffff;
pvid->command|=d<<16;
pvid->pending=1;
}
}
break;
// case 0x08: // 08 0a - HV counter - lock up
// case 0x0c: // 0c 0e - HV counter - lock up
// case 0x10: // 10 12 - PSG - handled by caller
// case 0x14: // 14 16 - PSG - handled by caller
// case 0x18: // 18 1a - no effect?
case 0x1c: // 1c 1e - debug
pvid->debug = d;
pvid->debug_p = 0;
if (d & (1 << 6)) {
pvid->debug_p |= PVD_KILL_A | PVD_KILL_B;
pvid->debug_p |= PVD_KILL_S_LO | PVD_KILL_S_HI;
}
switch ((d >> 7) & 3) {
case 1:
pvid->debug_p &= ~(PVD_KILL_S_LO | PVD_KILL_S_HI);
pvid->debug_p |= PVD_FORCE_S;
break;
case 2:
pvid->debug_p &= ~PVD_KILL_A;
pvid->debug_p |= PVD_FORCE_A;
break;
case 3:
pvid->debug_p &= ~PVD_KILL_B;
pvid->debug_p |= PVD_FORCE_B;
break;
}
break;
}
}
static u32 VideoSr(const struct PicoVideo *pv)
{
unsigned int c, d = pv->status;
unsigned int hp = pv->reg[12]&1 ? 15*488/210+1 : 15*488/171+1; // HBLANK start
unsigned int hl = pv->reg[12]&1 ? 37*488/210+1 : 28*488/171+1; // HBLANK len
c = SekCyclesDone() - Pico.t.m68c_line_start;
if (c - hp < hl)
d |= SR_HB;
PicoVideoFIFOSync(c);
if (fifo_total >= 4)
d |= SR_FULL;
else if (!fifo_total)
d |= SR_EMPT;
return d;
}
PICO_INTERNAL_ASM unsigned int PicoVideoRead(unsigned int a)
{
a &= 0x1c;
if (a == 0x04) // control port
{
struct PicoVideo *pv = &Pico.video;
unsigned int d = VideoSr(pv);
if (pv->pending) {
CommandChange();
pv->pending = 0;
}
elprintf(EL_SR, "SR read: %04x [%u] @ %06x", d, SekCyclesDone(), SekPc);
return d;
}
// H-counter info (based on Generator):
// frame:
// | <- hblank? -> |
// start <416> hint <36> hdisplay <38> end // CPU cycles
// |---------...---------|------------|-------------|
// 0 B6 E4 FF // 40 cells
// 0 93 E8 FF // 32 cells
// Gens (?) v-render
// start <hblank=84> hint hdisplay <404> |
// |---------------------|--------------------------|
// E4 (hc[0x43]==0) 07 B1 // 40
// E8 (hc[0x45]==0) 05 91 // 32
// check: Sonic 3D Blast bonus, Cannon Fodder, Chase HQ II, 3 Ninjas kick back, Road Rash 3, Skitchin', Wheel of Fortune
if ((a&0x1c)==0x08)
{
unsigned int d;
d = (SekCyclesDone() - Pico.t.m68c_line_start) & 0x1ff; // FIXME
if (Pico.video.reg[0]&2)
d = Pico.video.hv_latch;
else if (Pico.video.reg[12]&1)
d = hcounts_40[d] | (Pico.video.v_counter << 8);
else d = hcounts_32[d] | (Pico.video.v_counter << 8);
elprintf(EL_HVCNT, "hv: %02x %02x [%u] @ %06x", d, Pico.video.v_counter, SekCyclesDone(), SekPc);
return d;
}
if (a==0x00) // data port
{
return VideoRead();
}
return 0;
}
unsigned char PicoVideoRead8DataH(void)
{
return VideoRead() >> 8;
}
unsigned char PicoVideoRead8DataL(void)
{
return VideoRead();
}
unsigned char PicoVideoRead8CtlH(void)
{
u8 d = VideoSr(&Pico.video) >> 8;
if (Pico.video.pending) {
CommandChange();
Pico.video.pending = 0;
}
elprintf(EL_SR, "SR read (h): %02x @ %06x", d, SekPc);
return d;
}
unsigned char PicoVideoRead8CtlL(void)
{
u8 d = VideoSr(&Pico.video);
if (Pico.video.pending) {
CommandChange();
Pico.video.pending = 0;
}
elprintf(EL_SR, "SR read (l): %02x @ %06x", d, SekPc);
return d;
}
unsigned char PicoVideoRead8HV_H(void)
{
elprintf(EL_HVCNT, "vcounter: %02x [%u] @ %06x", Pico.video.v_counter, SekCyclesDone(), SekPc);
return Pico.video.v_counter;
}
// FIXME: broken
unsigned char PicoVideoRead8HV_L(void)
{
u32 d = (SekCyclesDone() - Pico.t.m68c_line_start) & 0x1ff; // FIXME
if (Pico.video.reg[0]&2)
d = Pico.video.hv_latch;
else if (Pico.video.reg[12]&1)
d = hcounts_40[d];
else d = hcounts_32[d];
elprintf(EL_HVCNT, "hcounter: %02x [%u] @ %06x", d, SekCyclesDone(), SekPc);
return d;
}
void PicoVideoSave(void)
{
struct PicoVideo *pv = &Pico.video;
int l, x;
// account for all outstanding xfers XXX kludge, entry attr's not saved
for (l = fifo_ql, x = fifo_qx + l-1; l > 1; l--, x--)
pv->fifo_cnt += (fifo_queue[x&7] >> 3) << (fifo_queue[x&7] & FQ_BYTE);
}
void PicoVideoLoad(void)
{
struct PicoVideo *pv = &Pico.video;
int l;
// convert former dma_xfers (why was this in PicoMisc anyway?)
if (Pico.m.dma_xfers) {
pv->fifo_cnt = Pico.m.dma_xfers * (pv->type == 1 ? 2 : 1);
fifo_total = Pico.m.dma_xfers;
Pico.m.dma_xfers = 0;
}
sat = ((pv->reg[5]&0x7f) << 9) | ((pv->reg[6]&0x20) << 11);
satxbits = 9;
if (pv->reg[12]&1)
sat &= ~0x200, satxbits = 10; // H40, zero lowest SAT bit
// rebuild SAT cache XXX wrong since cache and memory can differ
for (l = 0; l < 80; l++) {
*((u16 *)VdpSATCache + 2*l ) = PicoMem.vram[(sat>>1) + l*4 ];
*((u16 *)VdpSATCache + 2*l+1) = PicoMem.vram[(sat>>1) + l*4 + 1];
}
}
// vim:shiftwidth=2:ts=2:expandtab