picodrive/pico/draw.c
kub 16b11d9171 rendering, fix bgr555 output mode
NB not done for ARM asm since no target uses bgr555
2020-12-05 15:20:15 +01:00

2067 lines
62 KiB
C

/*
* line renderer
* (c) Copyright Dave, 2004
* (C) notaz, 2006-2010
* (C) kub, 2019-2020
*
* This work is licensed under the terms of MAME license.
* See COPYING file in the top-level directory.
*/
/*
* The renderer has 4 modes now:
* - normal
* - shadow/hilight (s/h)
* - "sonic mode" for midline palette changes (8bit mode only)
* - accurate sprites (AS) [+ s/h]
*
* s/h uses upper bits for both priority and shadow/hilight flags.
* "sonic mode" is autodetected, shadow/hilight is enabled by emulated game.
* AS is enabled by user and takes priority over "sonic mode".
*
* since renderer always draws line in 8bit mode, there are 2 spare bits:
* b \ mode: s/h sonic
* 00 normal pal index
* 01 hilight pal index
* 10 shadow pal index
* 11 hilight|shadow=normal pal index
*
* sprite s/h can only be correctly done after the plane rendering s/h state is
* known since the s/h result changes if there's at least one high prio plane.
* sprite op rendering is deferred until this is known, and hilight is used as
* mark since it can't occur before sprite ops:
* x1 op marker pal index
*
* low prio s/h rendering:
* - plane and non-op sprite pixels have shadow
* - s/h sprite op pixel rendering is marked with hilight (deferred)
* high prio s/h rendering:
* - plane and non-op sprite pixels are normal
* - all s/h sprite op pixels (either marked or high prio) are rendered
*
* not handled properly:
* - high prio s/h sprite op overlapping low prio sprite shows sprite, not A,B,G
* - in debug sprite-masked, transparent high-prio sprite px don't remove shadow
*/
#include "pico_int.h"
#define FORCE // layer forcing via debug register?
int (*PicoScanBegin)(unsigned int num) = NULL;
int (*PicoScanEnd) (unsigned int num) = NULL;
static unsigned char DefHighCol[8+320+8];
unsigned char *HighColBase = DefHighCol;
int HighColIncrement;
static unsigned int DefOutBuff[320*2/2];
void *DrawLineDestBase = DefOutBuff;
int DrawLineDestIncrement;
static int HighCacheA[41*2+1]; // caches for high layers
static int HighCacheB[41*2+1];
static int HighPreSpr[80*2+1]; // slightly preprocessed sprites
unsigned int VdpSATCache[128]; // VDP sprite cache (1st 32 sprite attr bits)
// NB don't change any defines without checking their usage in ASM
#if defined(USE_BGR555)
#define PXCONV(t) ((t & 0x000e000e)<< 1) | ((t & 0x00e000e0)<<2) | ((t & 0x0e000e00)<<3)
#define PXMASKL 0x04210421 // 0x0c630c63, LSB for all colours
#define PXMASKH 0x39ce39ce // 0x3def3def, all but MSB for all colours
#else // RGB565
#define PXCONV(t) ((t & 0x000e000e)<<12) | ((t & 0x00e000e0)<<3) | ((t & 0x0e000e00)>>7)
#define PXMASKL 0x08610861 // 0x18e318e3
#define PXMASKH 0x738e738e // 0x7bef7bef
#endif
#define LF_PLANE (1 << 0) // must be = 1
#define LF_SH (1 << 1) // must be = 2
//#define LF_FORCE (1 << 2)
#define LF_PLANE_A 0
#define LF_PLANE_B 1
#define SPRL_HAVE_HI 0x80 // have hi priority sprites
#define SPRL_HAVE_LO 0x40 // *lo*
#define SPRL_MAY_HAVE_OP 0x20 // may have operator sprites on the line
#define SPRL_LO_ABOVE_HI 0x10 // low priority sprites may be on top of hi
#define SPRL_HAVE_X 0x08 // have sprites with x != 0
#define SPRL_TILE_OVFL 0x04 // tile limit exceeded on previous line
#define SPRL_HAVE_MASK0 0x02 // have sprite with x == 0 in 1st slot
#define SPRL_MASKED 0x01 // lo prio masking by sprite with x == 0 active
unsigned char HighLnSpr[240][4+MAX_LINE_SPRITES+1]; // sprite_count, ^flags, tile_count, sprites_total, [spritep]..., last_width
int rendstatus_old;
int rendlines;
static int skip_next_line=0;
struct TileStrip
{
int nametab; // Position in VRAM of name table (for this tile line)
int line; // Line number in pixels 0x000-0x3ff within the virtual tilemap
int hscroll; // Horizontal scroll value in pixels for the line
int xmask; // X-Mask (0x1f - 0x7f) for horizontal wraparound in the tilemap
int *hc; // cache for high tile codes and their positions
int cells; // cells (tiles) to draw (32 col mode doesn't need to update whole 320)
};
// stuff available in asm:
#ifdef _ASM_DRAW_C
void DrawWindow(int tstart, int tend, int prio, int sh,
struct PicoEState *est);
void DrawAllSprites(unsigned char *sprited, int prio, int sh,
struct PicoEState *est);
void DrawTilesFromCache(int *hc, int sh, int rlim,
struct PicoEState *est);
void DrawSpritesSHi(unsigned char *sprited, struct PicoEState *est);
void DrawLayer(int plane_sh, int *hcache, int cellskip, int maxcells,
struct PicoEState *est);
void *blockcpy(void *dst, const void *src, size_t n);
void blockcpy_or(void *dst, void *src, size_t n, int pat);
#else
// utility
void blockcpy_or(void *dst, void *src, size_t n, int pat)
{
unsigned char *pd = dst, *ps = src;
for (; n; n--)
*pd++ = (unsigned char) (*ps++ | pat);
}
#define blockcpy memcpy
#endif
#define TileNormMaker_(pix_func,ret) \
{ \
unsigned int t; \
\
t = (pack&0x0000f000)>>12; pix_func(0); \
t = (pack&0x00000f00)>> 8; pix_func(1); \
t = (pack&0x000000f0)>> 4; pix_func(2); \
t = (pack&0x0000000f) ; pix_func(3); \
t = (pack&0xf0000000)>>28; pix_func(4); \
t = (pack&0x0f000000)>>24; pix_func(5); \
t = (pack&0x00f00000)>>20; pix_func(6); \
t = (pack&0x000f0000)>>16; pix_func(7); \
return ret; \
}
#define TileFlipMaker_(pix_func,ret) \
{ \
unsigned int t; \
\
t = (pack&0x000f0000)>>16; pix_func(0); \
t = (pack&0x00f00000)>>20; pix_func(1); \
t = (pack&0x0f000000)>>24; pix_func(2); \
t = (pack&0xf0000000)>>28; pix_func(3); \
t = (pack&0x0000000f) ; pix_func(4); \
t = (pack&0x000000f0)>> 4; pix_func(5); \
t = (pack&0x00000f00)>> 8; pix_func(6); \
t = (pack&0x0000f000)>>12; pix_func(7); \
return ret; \
}
#define TileNormMaker(funcname, pix_func) \
static void funcname(unsigned char *pd, unsigned int pack, int pal) \
TileNormMaker_(pix_func,)
#define TileFlipMaker(funcname, pix_func) \
static void funcname(unsigned char *pd, unsigned int pack, int pal) \
TileFlipMaker_(pix_func,)
#define TileNormMakerAS(funcname, pix_func) \
static unsigned funcname(unsigned m, unsigned char *pd, unsigned int pack, int pal) \
TileNormMaker_(pix_func,m)
#define TileFlipMakerAS(funcname, pix_func) \
static unsigned funcname(unsigned m, unsigned char *pd, unsigned int pack, int pal) \
TileFlipMaker_(pix_func,m)
// draw layer or non-s/h sprite pixels (no operator colors)
#define pix_just_write(x) \
if (t) pd[x]=pal|t
TileNormMaker(TileNorm, pix_just_write)
TileFlipMaker(TileFlip, pix_just_write)
#ifndef _ASM_DRAW_C
// draw sprite pixels, process operator colors
#define pix_sh(x) \
if (t) { \
if (t>=0xe) pd[x]|=(t-1)<<6; /* 80 shadow, 40 hilight */ \
else pd[x]=pal|t; \
}
TileNormMaker(TileNormSH, pix_sh)
TileFlipMaker(TileFlipSH, pix_sh)
// draw sprite pixels, mark but don't process operator colors
#define pix_sh_markop(x) \
if (t) { \
if (t>=0xe) pd[x]|=0x40; \
else pd[x]=pal|t; \
}
TileNormMaker(TileNormSH_markop, pix_sh_markop)
TileFlipMaker(TileFlipSH_markop, pix_sh_markop)
#endif
// draw low prio sprite operator pixels if visible (i.e. marked)
#define pix_sh_onlyop(x) \
if (t>=0xe && (pd[x]&0x40)) \
pd[x]=(pd[x]&~0x40)|((t-1)<<6)
#ifndef _ASM_DRAW_C
TileNormMaker(TileNormSH_onlyop_lp, pix_sh_onlyop)
TileFlipMaker(TileFlipSH_onlyop_lp, pix_sh_onlyop)
#endif
// AS: sprite mask bits in m shifted to bits 8-15, see DrawSpritesHiAS
// draw high prio sprite pixels (AS)
#define pix_as(x) \
if (t && (m & (1<<(x+8)))) m &= ~(1<<(x+8)), pd[x] = pal | t
TileNormMakerAS(TileNormAS, pix_as)
TileFlipMakerAS(TileFlipAS, pix_as)
// draw high prio sprite pixels, process operator colors (AS)
// NB sprite+planes: h+s->n, h+[nh]->h, s+[nhs]->s, hence mask h before op
#define pix_sh_as(x) \
if (t && (m & (1<<(x+8)))) { \
m &= ~(1<<(x+8)); \
if (t>=0xe) pd[x]=(pd[x]&~0x40)|((t-1)<<6); \
else pd[x] = pal | t; \
}
TileNormMakerAS(TileNormSH_AS, pix_sh_as)
TileFlipMakerAS(TileFlipSH_AS, pix_sh_as)
// draw only sprite operator pixels (AS)
#define pix_sh_as_onlyop(x) \
if (t && (m & (1<<(x+8)))) { \
m &= ~(1<<(x+8)); \
pix_sh_onlyop(x); \
}
TileNormMakerAS(TileNormSH_AS_onlyop_lp, pix_sh_as_onlyop)
TileFlipMakerAS(TileFlipSH_AS_onlyop_lp, pix_sh_as_onlyop)
// mark low prio sprite pixels (AS)
#define pix_sh_as_onlymark(x) \
if (t) m &= ~(1<<(x+8))
TileNormMakerAS(TileNormAS_onlymark, pix_sh_as_onlymark)
TileFlipMakerAS(TileFlipAS_onlymark, pix_sh_as_onlymark)
#ifdef FORCE
// NB s/h already resolved by non-forced drawing
// forced both layer draw (through debug reg)
#define pix_and(x) \
pal |= 0xc0; /* leave s/h bits untouched in pixel "and" */ \
pd[x] &= pal | t
TileNormMaker(TileNorm_and, pix_and)
TileFlipMaker(TileFlip_and, pix_and)
// forced sprite draw (through debug reg)
#define pix_sh_as_and(x) \
pal |= 0xc0; /* leave s/h bits untouched in pixel "and" */ \
if (m & (1<<(x+8))) { \
m &= ~(1<<(x+8)); \
if (t<0xe) pd[x] &= pal | t; \
}
TileNormMakerAS(TileNormSH_AS_and, pix_sh_as_and)
TileFlipMakerAS(TileFlipSH_AS_and, pix_sh_as_and)
#endif
// --------------------------------------------
#ifndef _ASM_DRAW_C
static void DrawStrip(struct TileStrip *ts, int lflags, int cellskip)
{
unsigned char *pd = Pico.est.HighCol;
int *hc = ts->hc;
int tilex, dx, ty, cells;
int oldcode = -1, blank = -1; // The tile we know is blank
unsigned int pal = 0, pack = 0, sh;
// Draw tiles across screen:
sh = (lflags & LF_SH) << 6; // shadow
tilex=((-ts->hscroll)>>3)+cellskip;
ty=(ts->line&7)<<1; // Y-Offset into tile
dx=((ts->hscroll-1)&7)+1;
cells = ts->cells - cellskip;
if(dx != 8) cells++; // have hscroll, need to draw 1 cell more
dx+=cellskip<<3;
// int force = (lflags&LF_FORCE) << 13;
for (; cells > 0; dx+=8, tilex++, cells--)
{
u32 code = PicoMem.vram[ts->nametab + (tilex & ts->xmask)];
// code &= ~force; // forced always draw everything
if (code == blank && !((code & 0x8000) && sh))
continue;
if (code!=oldcode) {
oldcode = code;
pack = 0;
if (code != blank) {
// Get tile address/2:
u32 addr = ((code&0x7ff)<<4) + ty;
if (code & 0x1000) addr ^= 0xe; // Y-flip
pal = ((code>>9)&0x30) | sh; // shadow
pack = *(unsigned int *)(PicoMem.vram + addr);
if (!pack)
blank = code;
}
}
if (code & 0x8000) { // (un-forced) high priority tile
int cval = code | (dx<<16) | (ty<<25);
if (code & 0x1000) cval ^= 0xe<<25;
*hc++ = cval, *hc++ = pack; // cache it
} else if (code != blank) {
if (code & 0x0800) TileFlip(pd + dx, pack, pal);
else TileNorm(pd + dx, pack, pal);
}
}
// terminate the cache list
*hc = 0;
// if oldcode wasn't changed, it means all layer is hi priority
if (oldcode == -1) Pico.est.rendstatus |= PDRAW_PLANE_HI_PRIO;
}
// this is messy
static void DrawStripVSRam(struct TileStrip *ts, int plane_sh, int cellskip)
{
unsigned char *pd = Pico.est.HighCol;
int *hc = ts->hc;
int tilex, dx, ty = 0, addr = 0, cell = 0, nametabadd = 0;
int oldcode = -1, blank = -1; // The tile we know is blank
unsigned int pal = 0, scan = Pico.est.DrawScanline, sh, plane;
// Draw tiles across screen:
sh = (plane_sh & LF_SH) << 6; // shadow
plane = (plane_sh & LF_PLANE); // plane to draw
tilex=(-ts->hscroll)>>3;
dx=((ts->hscroll-1)&7)+1;
if (ts->hscroll & 0x0f) {
int adj = ((ts->hscroll ^ dx) >> 3) & 1;
cell -= adj + 1;
ts->cells -= adj;
PicoMem.vsram[0x3e] = PicoMem.vsram[0x3f] = plane_sh >> 16;
}
cell+=cellskip;
tilex+=cellskip;
dx+=cellskip<<3;
// int force = (plane_sh&LF_FORCE) << 13;
if ((cell&1)==1)
{
int line,vscroll;
vscroll = PicoMem.vsram[plane + (cell&0x3e)];
// Find the line in the name table
line=(vscroll+scan)&ts->line&0xffff; // ts->line is really ymask ..
nametabadd=(line>>3)<<(ts->line>>24); // .. and shift[width]
ty=(line&7)<<1; // Y-Offset into tile
}
for (; cell < ts->cells; dx+=8,tilex++,cell++)
{
u32 code, pack;
if ((cell&1)==0)
{
int line,vscroll;
vscroll = PicoMem.vsram[plane + (cell&0x3e)];
// Find the line in the name table
line=(vscroll+scan)&ts->line&0xffff; // ts->line is really ymask ..
nametabadd=(line>>3)<<(ts->line>>24); // .. and shift[width]
ty=(line&7)<<1; // Y-Offset into tile
}
code= PicoMem.vram[ts->nametab + nametabadd + (tilex & ts->xmask)];
// code &= ~force; // forced always draw everything
code |= ty<<16; // add ty since that can change pixel row for every 2nd tile
if (code == blank && !((code & 0x8000) && sh))
continue;
if (code!=oldcode) {
oldcode = code;
// Get tile address/2:
addr = (code&0x7ff)<<4;
pal = ((code>>9)&0x30) | sh; // shadow
}
pack = (code & 0x1000 ? ty^0xe : ty); // Y-flip
pack = *(unsigned int *)(PicoMem.vram + addr+pack);
if (!pack)
blank = code;
if (code & 0x8000) { // (un-forced) high priority tile
int cval = (u16)code | (dx<<16) | (ty<<25);
if (code & 0x1000) cval ^= 0xe<<25;
*hc++ = cval, *hc++ = pack; // cache it
} else if (code != blank) {
if (code & 0x0800) TileFlip(pd + dx, pack, pal);
else TileNorm(pd + dx, pack, pal);
}
}
// terminate the cache list
*hc = 0;
if (oldcode == -1) Pico.est.rendstatus |= PDRAW_PLANE_HI_PRIO;
}
#endif
#ifndef _ASM_DRAW_C
static
#endif
void DrawStripInterlace(struct TileStrip *ts, int plane_sh)
{
unsigned char *pd = Pico.est.HighCol;
int *hc = ts->hc;
int tilex = 0, dx = 0, ty = 0, cells;
int oldcode = -1, blank = -1; // The tile we know is blank
unsigned int pal = 0, pack = 0, sh;
// Draw tiles across screen:
sh = (plane_sh & LF_SH) << 6; // shadow
tilex=(-ts->hscroll)>>3;
ty=(ts->line&15)<<1; // Y-Offset into tile
dx=((ts->hscroll-1)&7)+1;
cells = ts->cells;
if(dx != 8) cells++; // have hscroll, need to draw 1 cell more
// int force = (plane_sh&LF_FORCE) << 13;
for (; cells; dx+=8,tilex++,cells--)
{
u32 code = PicoMem.vram[ts->nametab + (tilex & ts->xmask)];
// code &= ~force; // forced always draw everything
if (code == blank && !(code & 0x8000))
continue;
if (code!=oldcode) {
oldcode = code;
pack = 0;
if (code != blank) {
// Get tile address/2:
u32 addr = ((code&0x3ff)<<5) + ty;
if (code & 0x1000) addr ^= 0x1e; // Y-flip
pal = ((code>>9)&0x30) | sh; // shadow
pack = *(unsigned int *)(PicoMem.vram + addr);
if (!pack)
blank = code;
}
}
if (code & 0x8000) { // high priority tile
if ((plane_sh&LF_SH) | (code!=blank)) {
int cval = (code&0xfc00) | ((code&0x3ff)<<1) | (dx<<16) | (ty<<25);
if (code & 0x1000) cval ^= 0x1e<<25;
*hc++ = cval, *hc++ = pack; // cache it
}
continue;
} else if (code != blank) {
if (code & 0x0800) TileFlip(pd + dx, pack, pal);
else TileNorm(pd + dx, pack, pal);
}
}
// terminate the cache list
*hc = 0;
}
// --------------------------------------------
#ifndef _ASM_DRAW_C
static void DrawLayer(int plane_sh, int *hcache, int cellskip, int maxcells,
struct PicoEState *est)
{
struct PicoVideo *pvid=&Pico.video;
const char shift[4]={5,6,5,7}; // 32,64 or 128 sized tilemaps (2 is invalid)
struct TileStrip ts;
int width, height, ymask;
int vscroll, htab;
ts.hc=hcache;
ts.cells=maxcells;
// Work out the TileStrip to draw
// Work out the name table size: 32 64 or 128 tiles (0-3)
width=pvid->reg[16];
height=(width>>4)&3; width&=3;
ts.xmask=(1<<shift[width])-1; // X Mask in tiles (0x1f-0x7f)
ymask=(height<<8)|0xff; // Y Mask in pixels
switch (width) {
case 1: ymask &= 0x1ff; break;
case 2: ymask = 0x007; break;
case 3: ymask = 0x0ff; break;
}
// Find name table:
if (plane_sh&LF_PLANE) ts.nametab=(pvid->reg[4]&0x07)<<12; // B
else ts.nametab=(pvid->reg[2]&0x38)<< 9; // A
htab=pvid->reg[13]<<9; // Horizontal scroll table address
switch (pvid->reg[11]&3) {
case 1: htab += (est->DrawScanline<<1) & 0x0f; break;
case 2: htab += (est->DrawScanline<<1) & ~0x0f; break; // Offset by tile
case 3: htab += (est->DrawScanline<<1); break; // Offset by line
}
htab+=plane_sh&LF_PLANE; // A or B
// Get horizontal scroll value, will be masked later
ts.hscroll = PicoMem.vram[htab & 0x7fff];
if((pvid->reg[12]&6) == 6) {
// interlace mode 2
vscroll = PicoMem.vsram[plane_sh&LF_PLANE]; // Get vertical scroll value
// Find the line in the name table
ts.line=(vscroll+(est->DrawScanline<<1))&((ymask<<1)|1);
ts.nametab+=(ts.line>>4)<<shift[width];
DrawStripInterlace(&ts, plane_sh);
} else if( pvid->reg[11]&4) {
// shit, we have 2-cell column based vscroll
// luckily this doesn't happen too often
ts.line=ymask|(shift[width]<<24); // save some stuff instead of line
// vscroll value for leftmost cells in case of hscroll not on 16px boundary
// XXX it's unclear what exactly the hw is doing. Continue reading where it
// stopped last seems to work best (H40: 0x50 (wrap->0x00), H32 0x40).
plane_sh |= PicoMem.vsram[(pvid->reg[12]&1?0x00:0x20) + (plane_sh&LF_PLANE)] << 16;
DrawStripVSRam(&ts, plane_sh, cellskip);
} else {
vscroll = PicoMem.vsram[plane_sh&LF_PLANE]; // Get vertical scroll value
// Find the line in the name table
ts.line=(vscroll+est->DrawScanline)&ymask;
ts.nametab+=(ts.line>>3)<<shift[width];
DrawStrip(&ts, plane_sh, cellskip);
}
}
// --------------------------------------------
// tstart & tend are tile pair numbers
static void DrawWindow(int tstart, int tend, int prio, int sh,
struct PicoEState *est)
{
unsigned char *pd = Pico.est.HighCol;
struct PicoVideo *pvid = &Pico.video;
int tilex,ty,nametab,code=0;
int blank=-1; // The tile we know is blank
// Find name table line:
if (pvid->reg[12]&1)
{
nametab=(pvid->reg[3]&0x3c)<<9; // 40-cell mode
nametab+=(est->DrawScanline>>3)<<6;
}
else
{
nametab=(pvid->reg[3]&0x3e)<<9; // 32-cell mode
nametab+=(est->DrawScanline>>3)<<5;
}
tilex=tstart<<1;
if (prio && !(est->rendstatus & PDRAW_WND_DIFF_PRIO)) {
// all tiles processed in low prio pass
return;
}
tend<<=1;
ty=(est->DrawScanline&7)<<1; // Y-Offset into tile
// Draw tiles across screen:
if (!sh)
{
for (; tilex < tend; tilex++)
{
unsigned int pack;
int dx, addr;
int pal;
code = PicoMem.vram[nametab + tilex];
if ((code>>15) != prio) {
est->rendstatus |= PDRAW_WND_DIFF_PRIO;
continue;
}
if (code==blank) continue;
// Get tile address/2:
addr=(code&0x7ff)<<4;
if (code&0x1000) addr+=14-ty; else addr+=ty; // Y-flip
pack = *(unsigned int *)(PicoMem.vram + addr);
if (!pack) {
blank = code;
continue;
}
pal = ((code >> 9) & 0x30);
dx = 8 + (tilex << 3);
if (code & 0x0800) TileFlip(pd + dx, pack, pal);
else TileNorm(pd + dx, pack, pal);
}
}
else
{
for (; tilex < tend; tilex++)
{
unsigned int pack;
int dx, addr;
int pal;
code = PicoMem.vram[nametab + tilex];
if((code>>15) != prio) {
est->rendstatus |= PDRAW_WND_DIFF_PRIO;
continue;
}
pal=((code>>9)&0x30);
if (prio) {
int *zb = (int *)(est->HighCol+8+(tilex<<3));
*zb++ &= 0x7f7f7f7f;
*zb &= 0x7f7f7f7f;
} else {
pal |= 0x80;
}
if(code==blank) continue;
// Get tile address/2:
addr=(code&0x7ff)<<4;
if (code&0x1000) addr+=14-ty; else addr+=ty; // Y-flip
pack = *(unsigned int *)(PicoMem.vram + addr);
if (!pack) {
blank = code;
continue;
}
dx = 8 + (tilex << 3);
if (code & 0x0800) TileFlip(pd + dx, pack, pal);
else TileNorm(pd + dx, pack, pal);
}
}
}
// --------------------------------------------
static void DrawTilesFromCacheShPrep(void)
{
// as some layer has covered whole line with hi priority tiles,
// we can process whole line and then act as if sh/hi mode was off,
// but leave lo pri op sprite markers alone
int c = 320/4, *zb = (int *)(Pico.est.HighCol+8);
Pico.est.rendstatus |= PDRAW_SHHI_DONE;
while (c--)
{
*zb++ &= 0x7f7f7f7f;
}
}
static void DrawTilesFromCache(int *hc, int sh, int rlim, struct PicoEState *est)
{
unsigned char *pd = Pico.est.HighCol;
int code, dx;
unsigned int pack;
int pal;
// *ts->hc++ = code | (dx<<16) | (ty<<25); // cache it
if (sh && (est->rendstatus & (PDRAW_SHHI_DONE|PDRAW_PLANE_HI_PRIO)))
{
if (!(est->rendstatus & PDRAW_SHHI_DONE))
DrawTilesFromCacheShPrep();
sh = 0;
}
if (!sh)
{
while ((code=*hc++)) {
pack = *hc++;
if (!pack)
continue;
dx = (code >> 16) & 0x1ff;
pal = ((code >> 9) & 0x30);
if (rlim-dx < 0)
goto last_cut_tile;
if (code & 0x0800) TileFlip(pd + dx, pack, pal);
else TileNorm(pd + dx, pack, pal);
}
}
else
{
while ((code=*hc++)) {
unsigned char *zb;
dx = (code >> 16) & 0x1ff;
zb = est->HighCol+dx;
*zb++ &= 0x7f; *zb++ &= 0x7f; *zb++ &= 0x7f; *zb++ &= 0x7f;
*zb++ &= 0x7f; *zb++ &= 0x7f; *zb++ &= 0x7f; *zb++ &= 0x7f;
pack = *hc++;
if (!pack)
continue;
pal = ((code >> 9) & 0x30);
if (rlim - dx < 0)
goto last_cut_tile;
if (code & 0x0800) TileFlip(pd + dx, pack, pal);
else TileNorm(pd + dx, pack, pal);
}
}
return;
last_cut_tile:
// for vertical window cutoff
{
unsigned int t;
pd += dx;
if (code&0x0800)
{
switch (rlim-dx+8)
{
case 7: t=pack&0x00000f00; if (t) pd[6]=(unsigned char)(pal|(t>> 8)); // "break" is left out intentionally
case 6: t=pack&0x000000f0; if (t) pd[5]=(unsigned char)(pal|(t>> 4));
case 5: t=pack&0x0000000f; if (t) pd[4]=(unsigned char)(pal|(t ));
case 4: t=pack&0xf0000000; if (t) pd[3]=(unsigned char)(pal|(t>>28));
case 3: t=pack&0x0f000000; if (t) pd[2]=(unsigned char)(pal|(t>>24));
case 2: t=pack&0x00f00000; if (t) pd[1]=(unsigned char)(pal|(t>>20));
case 1: t=pack&0x000f0000; if (t) pd[0]=(unsigned char)(pal|(t>>16));
default: break;
}
}
else
{
switch (rlim-dx+8)
{
case 7: t=pack&0x00f00000; if (t) pd[6]=(unsigned char)(pal|(t>>20));
case 6: t=pack&0x0f000000; if (t) pd[5]=(unsigned char)(pal|(t>>24));
case 5: t=pack&0xf0000000; if (t) pd[4]=(unsigned char)(pal|(t>>28));
case 4: t=pack&0x0000000f; if (t) pd[3]=(unsigned char)(pal|(t ));
case 3: t=pack&0x000000f0; if (t) pd[2]=(unsigned char)(pal|(t>> 4));
case 2: t=pack&0x00000f00; if (t) pd[1]=(unsigned char)(pal|(t>> 8));
case 1: t=pack&0x0000f000; if (t) pd[0]=(unsigned char)(pal|(t>>12));
default: break;
}
}
}
}
// --------------------------------------------
// Index + 0 : hhhhvvvv ab--hhvv yyyyyyyy yyyyyyyy // a: offscreen h, b: offs. v, h: horiz. size
// Index + 4 : xxxxxxxx xxxxxxxx pccvhnnn nnnnnnnn // x: x coord + 8
static void DrawSprite(int *sprite, int sh, int w)
{
void (*fTileFunc)(unsigned char *pd, unsigned int pack, int pal);
unsigned char *pd = Pico.est.HighCol;
int width=0,height=0;
int row=0,code=0;
int pal;
int tile=0,delta=0;
int sx, sy;
// parse the sprite data
sy=sprite[0];
code=sprite[1];
sx=code>>16; // X
width=sy>>28;
height=(sy>>24)&7; // Width and height in tiles
sy=(sy<<16)>>16; // Y
row=Pico.est.DrawScanline-sy; // Row of the sprite we are on
if (code&0x1000) row=(height<<3)-1-row; // Flip Y
tile=code + (row>>3); // Tile number increases going down
delta=height; // Delta to increase tile by going right
if (code&0x0800) { tile+=delta*(width-1); delta=-delta; } // Flip X
tile &= 0x7ff; tile<<=4; tile+=(row&7)<<1; // Tile address
delta<<=4; // Delta of address
pal=(code>>9)&0x30;
pal|=sh<<7; // shadow
if (sh && (code&0x6000) == 0x6000) {
if(code&0x0800) fTileFunc=TileFlipSH_markop;
else fTileFunc=TileNormSH_markop;
} else {
if(code&0x0800) fTileFunc=TileFlip;
else fTileFunc=TileNorm;
}
if (w) width = w; // tile limit
for (; width; width--,sx+=8,tile+=delta)
{
unsigned int pack;
if(sx<=0) continue;
if(sx>=328) break; // Offscreen
pack = *(unsigned int *)(PicoMem.vram + (tile & 0x7fff));
fTileFunc(pd + sx, pack, pal);
}
}
#endif
static void DrawSpriteInterlace(unsigned int *sprite)
{
unsigned char *pd = Pico.est.HighCol;
int width=0,height=0;
int row=0,code=0;
int pal;
int tile=0,delta=0;
int sx, sy;
// parse the sprite data
sy=sprite[0];
height=sy>>24;
sy=(sy&0x3ff)-0x100; // Y
width=(height>>2)&3; height&=3;
width++; height++; // Width and height in tiles
row=(Pico.est.DrawScanline<<1)-sy; // Row of the sprite we are on
code=sprite[1];
sx=((code>>16)&0x1ff)-0x78; // X
if (code&0x1000) row^=(16<<height)-1; // Flip Y
tile=code&0x3ff; // Tile number
tile+=row>>4; // Tile number increases going down
delta=height; // Delta to increase tile by going right
if (code&0x0800) { tile+=delta*(width-1); delta=-delta; } // Flip X
tile<<=5; tile+=(row&15)<<1; // Tile address
delta<<=5; // Delta of address
pal=((code>>9)&0x30); // Get palette pointer
for (; width; width--,sx+=8,tile+=delta)
{
unsigned int pack;
if(sx<=0) continue;
if(sx>=328) break; // Offscreen
pack = *(unsigned int *)(PicoMem.vram + (tile & 0x7fff));
if (code & 0x0800) TileFlip(pd + sx, pack, pal);
else TileNorm(pd + sx, pack, pal);
}
}
static NOINLINE void DrawAllSpritesInterlace(int pri, int sh)
{
struct PicoVideo *pvid=&Pico.video;
int i,u,table,link=0,sline=Pico.est.DrawScanline<<1;
unsigned int *sprites[80]; // Sprite index
int max_sprites = Pico.video.reg[12]&1 ? 80 : 64;
table=pvid->reg[5]&0x7f;
if (pvid->reg[12]&1) table&=0x7e; // Lowest bit 0 in 40-cell mode
table<<=8; // Get sprite table address/2
for (i = u = 0; u < max_sprites && link < max_sprites; u++)
{
unsigned int *sprite;
int code, sx, sy, height;
sprite=(unsigned int *)(PicoMem.vram+((table+(link<<2))&0x7ffc)); // Find sprite
// get sprite info
code = sprite[0];
sx = sprite[1];
if(((sx>>15)&1) != pri) goto nextsprite; // wrong priority sprite
// check if it is on this line
sy = (code&0x3ff)-0x100;
height = (((code>>24)&3)+1)<<4;
if((sline < sy) | (sline >= sy+height)) goto nextsprite; // no
// check if sprite is not hidden offscreen
sx = (sx>>16)&0x1ff;
sx -= 0x78; // Get X coordinate + 8
if((sx <= -8*3) | (sx >= 328)) goto nextsprite;
// sprite is good, save it's pointer
sprites[i++]=sprite;
nextsprite:
// Find next sprite
link=(code>>16)&0x7f;
if(!link) break; // End of sprites
}
// Go through sprites backwards:
for (i-- ;i>=0; i--)
DrawSpriteInterlace(sprites[i]);
}
#ifndef _ASM_DRAW_C
/*
* s/h drawing: lo_layers|40, lo_sprites|40 && mark_op,
* hi_layers&=~40, hi_sprites
*
* Index + 0 : hhhhvvvv ----hhvv yyyyyyyy yyyyyyyy // v, h: vert./horiz. size
* Index + 4 : xxxxxxxx xxxxxxxx pccvhnnn nnnnnnnn // x: x coord + 8
*/
static void DrawSpritesSHi(unsigned char *sprited, const struct PicoEState *est)
{
static void (*tilefuncs[2][2][2])(unsigned char *, unsigned, int) = {
{ {NULL, NULL}, {TileNorm, TileFlip} },
{ {TileNormSH_onlyop_lp, TileFlipSH_onlyop_lp}, {TileNormSH, TileFlipSH} }
}; // [sh?][hi?][flip?]
void (*fTileFunc)(unsigned char *pd, unsigned int pack, int pal);
unsigned char *pd = Pico.est.HighCol;
unsigned char *p;
int cnt, w;
cnt = sprited[0] & 0x7f;
if (cnt == 0) return;
p = &sprited[4];
if ((sprited[1] & (SPRL_TILE_OVFL|SPRL_HAVE_MASK0)) == (SPRL_TILE_OVFL|SPRL_HAVE_MASK0))
return; // masking effective due to tile overflow
// Go through sprites backwards:
w = p[cnt]; // possibly clipped width of last sprite
for (cnt--; cnt >= 0; cnt--, w = 0)
{
int *sprite, code, pal, tile, sx, sy;
int offs, delta, width, height, row;
offs = (p[cnt] & 0x7f) * 2;
sprite = est->HighPreSpr + offs;
code = sprite[1];
pal = (code>>9)&0x30;
fTileFunc = tilefuncs[pal == 0x30][!!(code & 0x8000)][!!(code & 0x800)];
if (fTileFunc == NULL) continue; // non-operator low sprite, already drawn
// parse remaining sprite data
sy=sprite[0];
sx=code>>16; // X
width=sy>>28;
height=(sy>>24)&7; // Width and height in tiles
sy=(sy<<16)>>16; // Y
row=est->DrawScanline-sy; // Row of the sprite we are on
if (code&0x1000) row=(height<<3)-1-row; // Flip Y
tile=code + (row>>3); // Tile number increases going down
delta=height; // Delta to increase tile by going right
if (code&0x0800) { tile+=delta*(width-1); delta=-delta; } // Flip X
tile &= 0x7ff; tile<<=4; tile+=(row&7)<<1; // Tile address
delta<<=4; // Delta of address
if (w) width = w; // tile limit
for (; width; width--,sx+=8,tile+=delta)
{
unsigned int pack;
if(sx<=0) continue;
if(sx>=328) break; // Offscreen
pack = *(unsigned int *)(PicoMem.vram + (tile & 0x7fff));
fTileFunc(pd + sx, pack, pal);
}
}
}
#endif // !_ASM_DRAW_C
static void DrawSpritesHiAS(unsigned char *sprited, int sh)
{
static unsigned (*tilefuncs[2][2][2])(unsigned, unsigned char *, unsigned, int) = {
{ {TileNormAS_onlymark, TileFlipAS_onlymark}, {TileNormAS, TileFlipAS} },
{ {TileNormSH_AS_onlyop_lp, TileFlipSH_AS_onlyop_lp}, {TileNormSH_AS, TileFlipSH_AS} }
}; // [sh?][hi?][flip?]
unsigned (*fTileFunc)(unsigned m, unsigned char *pd, unsigned int pack, int pal);
unsigned char *pd = Pico.est.HighCol;
unsigned char mb[sizeof(DefHighCol)/8];
unsigned char *p, *mp;
unsigned m;
int entry, cnt;
cnt = sprited[0] & 0x7f;
if (cnt == 0) return;
memset(mb, 0xff, sizeof(mb));
p = &sprited[4];
if ((sprited[1] & (SPRL_TILE_OVFL|SPRL_HAVE_MASK0)) == (SPRL_TILE_OVFL|SPRL_HAVE_MASK0))
return; // masking effective due to tile overflow
// Go through sprites:
for (entry = 0; entry < cnt; entry++)
{
int *sprite, code, pal, tile, sx, sy;
int offs, delta, width, height, row;
offs = (p[entry] & 0x7f) * 2;
sprite = HighPreSpr + offs;
code = sprite[1];
pal = (code>>9)&0x30;
fTileFunc = tilefuncs[(sh && pal == 0x30)][!!(code&0x8000)][!!(code&0x800)];
// parse remaining sprite data
sy=sprite[0];
sx=code>>16; // X
width=sy>>28;
height=(sy>>24)&7; // Width and height in tiles
sy=(sy<<16)>>16; // Y
row=Pico.est.DrawScanline-sy; // Row of the sprite we are on
if (code&0x1000) row=(height<<3)-1-row; // Flip Y
tile=code + (row>>3); // Tile number increases going down
delta=height; // Delta to increase tile by going right
if (code&0x0800) { tile+=delta*(width-1); delta=-delta; } // Flip X
tile &= 0x7ff; tile<<=4; tile+=(row&7)<<1; // Tile address
delta<<=4; // Delta of address
if (entry+1 == cnt) width = p[entry+1]; // last sprite width limited?
while (sx <= 0 && width) width--, sx+=8, tile+=delta; // Offscreen
mp = mb+(sx>>3);
for (m = *mp; width; width--, sx+=8, tile+=delta, *mp++ = m, m >>= 8)
{
unsigned int pack;
if(sx>=328) break; // Offscreen
pack = *(unsigned int *)(PicoMem.vram + (tile & 0x7fff));
m |= mp[1] << 8; // next mask byte
// shift mask bits to bits 8-15 for easier load/store handling
m = fTileFunc(m << (8-(sx&0x7)), pd + sx, pack, pal) >> (8-(sx&0x7));
}
*mp = m; // write last mask byte
}
}
#ifdef FORCE
// NB lots of duplicate code, all for the sake of a small performance gain.
static void DrawStripForced(struct TileStrip *ts, int cellskip)
{
unsigned char *pd = Pico.est.HighCol;
int tilex, dx, ty, code=0, addr=0, cells;
int oldcode = -1;
int pal = 0;
// Draw tiles across screen:
tilex=((-ts->hscroll)>>3)+cellskip;
ty=(ts->line&7)<<1; // Y-Offset into tile
dx=((ts->hscroll-1)&7)+1;
cells = ts->cells - cellskip;
if(dx != 8) cells++; // have hscroll, need to draw 1 cell more
dx+=cellskip<<3;
for (; cells > 0; dx+=8, tilex++, cells--)
{
unsigned int pack;
code = PicoMem.vram[ts->nametab + (tilex & ts->xmask)];
if (code!=oldcode) {
oldcode = code;
// Get tile address/2:
addr = ((code&0x7ff)<<4) + ty;
if (code & 0x1000) addr^=0xe; // Y-flip
pal = (code>>9)&0x30;
}
pack = *(unsigned int *)(PicoMem.vram + addr);
if (code & 0x0800) TileFlip_and(pd + dx, pack, pal);
else TileNorm_and(pd + dx, pack, pal);
}
}
static void DrawStripVSRamForced(struct TileStrip *ts, int plane_sh, int cellskip)
{
unsigned char *pd = Pico.est.HighCol;
int tilex, dx, ty=0, code=0, addr=0, cell=0, nametabadd=0;
int oldcode=-1;
int pal=0, scan=Pico.est.DrawScanline, plane;
// Draw tiles across screen:
plane = plane_sh & LF_PLANE;
tilex=(-ts->hscroll)>>3;
dx=((ts->hscroll-1)&7)+1;
if (ts->hscroll & 0x0f) {
int adj = ((ts->hscroll ^ dx) >> 3) & 1;
cell -= adj + 1;
ts->cells -= adj;
PicoMem.vsram[0x3e] = PicoMem.vsram[0x3f] = plane_sh >> 16;
}
cell+=cellskip;
tilex+=cellskip;
dx+=cellskip<<3;
if ((cell&1)==1)
{
int line,vscroll;
vscroll = PicoMem.vsram[plane + (cell&0x3e)];
// Find the line in the name table
line=(vscroll+scan)&ts->line&0xffff; // ts->line is really ymask ..
nametabadd=(line>>3)<<(ts->line>>24); // .. and shift[width]
ty=(line&7)<<1; // Y-Offset into tile
}
for (; cell < ts->cells; dx+=8,tilex++,cell++)
{
unsigned int pack;
if ((cell&1)==0)
{
int line,vscroll;
vscroll = PicoMem.vsram[plane + (cell&0x3e)];
// Find the line in the name table
line=(vscroll+scan)&ts->line&0xffff; // ts->line is really ymask ..
nametabadd=(line>>3)<<(ts->line>>24); // .. and shift[width]
ty=(line&7)<<1; // Y-Offset into tile
}
code=PicoMem.vram[ts->nametab+nametabadd+(tilex&ts->xmask)];
if (code!=oldcode) {
oldcode = code;
// Get tile address/2:
addr=(code&0x7ff)<<4;
pal = (code>>9)&0x30; // shadow
}
pack = code & 0x1000 ? ty^0xe : ty; // Y-flip
pack = *(unsigned int *)(PicoMem.vram + addr+pack);
if (code & 0x0800) TileFlip_and(pd + dx, pack, pal);
else TileNorm_and(pd + dx, pack, pal);
}
}
void DrawStripInterlaceForced(struct TileStrip *ts)
{
unsigned char *pd = Pico.est.HighCol;
int tilex = 0, dx = 0, ty = 0, cells;
int oldcode = -1;
unsigned int pal = 0, pack = 0;
// Draw tiles across screen:
tilex=(-ts->hscroll)>>3;
ty=(ts->line&15)<<1; // Y-Offset into tile
dx=((ts->hscroll-1)&7)+1;
cells = ts->cells;
if(dx != 8) cells++; // have hscroll, need to draw 1 cell more
for (; cells; dx+=8,tilex++,cells--)
{
u32 code = PicoMem.vram[ts->nametab + (tilex & ts->xmask)];
if (code!=oldcode) {
oldcode = code;
// Get tile address/2:
u32 addr = ((code&0x3ff)<<5) + ty;
if (code & 0x1000) addr ^= 0x1e; // Y-flip
pal = (code>>9)&0x30; // shadow
pack = *(unsigned int *)(PicoMem.vram + addr);
}
if (code & 0x0800) TileFlip_and(pd + dx, pack, pal);
else TileNorm_and(pd + dx, pack, pal);
}
}
// XXX only duplicated to avoid ARM asm hassles
static void DrawLayerForced(int plane_sh, int cellskip, int maxcells,
struct PicoEState *est)
{
struct PicoVideo *pvid=&Pico.video;
const char shift[4]={5,6,5,7}; // 32,64 or 128 sized tilemaps (2 is invalid)
struct TileStrip ts;
int width, height, ymask;
int vscroll, htab;
ts.cells=maxcells;
// Work out the TileStrip to draw
// Work out the name table size: 32 64 or 128 tiles (0-3)
width=pvid->reg[16];
height=(width>>4)&3; width&=3;
ts.xmask=(1<<shift[width])-1; // X Mask in tiles (0x1f-0x7f)
ymask=(height<<8)|0xff; // Y Mask in pixels
switch (width) {
case 1: ymask &= 0x1ff; break;
case 2: ymask = 0x007; break;
case 3: ymask = 0x0ff; break;
}
// Find name table:
if (plane_sh&1) ts.nametab=(pvid->reg[4]&0x07)<<12; // B
else ts.nametab=(pvid->reg[2]&0x38)<< 9; // A
htab=pvid->reg[13]<<9; // Horizontal scroll table address
switch (pvid->reg[11]&3) {
case 1: htab += (est->DrawScanline<<1) & 0x0f; break;
case 2: htab += (est->DrawScanline<<1) & ~0x0f; break; // Offset by tile
case 3: htab += (est->DrawScanline<<1); break; // Offset by line
}
htab+=plane_sh&1; // A or B
// Get horizontal scroll value, will be masked later
ts.hscroll = PicoMem.vram[htab & 0x7fff];
if((pvid->reg[12]&6) == 6) {
// interlace mode 2
vscroll = PicoMem.vsram[plane_sh & 1]; // Get vertical scroll value
// Find the line in the name table
ts.line=(vscroll+(est->DrawScanline<<1))&((ymask<<1)|1);
ts.nametab+=(ts.line>>4)<<shift[width];
DrawStripInterlaceForced(&ts);
} else if( pvid->reg[11]&4) {
// shit, we have 2-cell column based vscroll
// luckily this doesn't happen too often
ts.line=ymask|(shift[width]<<24); // save some stuff instead of line
// vscroll value for leftmost cells in case of hscroll not on 16px boundary
// XXX it's unclear what exactly the hw is doing. Continue reading where it
// stopped last seems to work best (H40: 0x50 (wrap->0x00), H32 0x40).
plane_sh |= PicoMem.vsram[(pvid->reg[12]&1?0x00:0x20) + (plane_sh&1)] << 16;
DrawStripVSRamForced(&ts, plane_sh, cellskip);
} else {
vscroll = PicoMem.vsram[plane_sh & 1]; // Get vertical scroll value
// Find the line in the name table
ts.line=(vscroll+est->DrawScanline)&ymask;
ts.nametab+=(ts.line>>3)<<shift[width];
DrawStripForced(&ts, cellskip);
}
}
static void DrawSpritesForced(unsigned char *sprited)
{
unsigned (*fTileFunc)(unsigned m, unsigned char *pd, unsigned int pack, int pal);
unsigned char *pd = Pico.est.HighCol;
unsigned char mb[sizeof(DefHighCol)/8];
unsigned char *p, *mp;
unsigned m;
int entry, cnt;
cnt = sprited[0] & 0x7f;
if (cnt == 0) { memset(pd, 0, sizeof(DefHighCol)); return; }
memset(mb, 0xff, sizeof(mb));
p = &sprited[4];
if ((sprited[1] & (SPRL_TILE_OVFL|SPRL_HAVE_MASK0)) == (SPRL_TILE_OVFL|SPRL_HAVE_MASK0))
return; // masking effective due to tile overflow
// Go through sprites:
for (entry = 0; entry < cnt; entry++)
{
int *sprite, code, pal, tile, sx, sy;
int offs, delta, width, height, row;
offs = (p[entry] & 0x7f) * 2;
sprite = HighPreSpr + offs;
code = sprite[1];
pal = (code>>9)&0x30;
if (code&0x800) fTileFunc = TileFlipSH_AS_and;
else fTileFunc = TileNormSH_AS_and;
// parse remaining sprite data
sy=sprite[0];
sx=code>>16; // X
width=sy>>28;
height=(sy>>24)&7; // Width and height in tiles
sy=(sy<<16)>>16; // Y
row=Pico.est.DrawScanline-sy; // Row of the sprite we are on
if (code&0x1000) row=(height<<3)-1-row; // Flip Y
tile=code + (row>>3); // Tile number increases going down
delta=height; // Delta to increase tile by going right
if (code&0x0800) { tile+=delta*(width-1); delta=-delta; } // Flip X
tile &= 0x7ff; tile<<=4; tile+=(row&7)<<1; // Tile address
delta<<=4; // Delta of address
if (entry+1 == cnt) width = p[entry+1]; // last sprite width limited?
while (sx <= 0 && width) width--, sx+=8, tile+=delta; // Offscreen
mp = mb+(sx>>3);
for (m = *mp; width; width--, sx+=8, tile+=delta, *mp++ = m, m >>= 8)
{
unsigned int pack;
if(sx>=328) break; // Offscreen
pack = *(unsigned int *)(PicoMem.vram + (tile & 0x7fff));
m |= mp[1] << 8; // next mask byte
// shift mask bits to bits 8-15 for easier load/store handling
m = fTileFunc(m << (8-(sx&0x7)), pd + sx, pack, pal) >> (8-(sx&0x7));
}
*mp = m; // write last mask byte
}
// anything not covered by a sprite is off (XXX or bg?)
for (cnt = 1; cnt < sizeof(mb)-1; cnt++)
if (mb[cnt] == 0xff) {
*(u32 *)(pd+8*cnt+0) = 0;
*(u32 *)(pd+8*cnt+4) = 0;
} else if (mb[cnt])
for (m = 0; m < 8; m++)
if (mb[cnt] & (1<<m))
pd[8*cnt+m] = 0;
}
#endif
// Index + 0 : ----hhvv -lllllll -------y yyyyyyyy
// Index + 4 : -------x xxxxxxxx pccvhnnn nnnnnnnn
// v
// Index + 0 : hhhhvvvv ----hhvv yyyyyyyy yyyyyyyy // v, h: vert./horiz. size
// Index + 4 : xxxxxxxx xxxxxxxx pccvhnnn nnnnnnnn // x: x coord + 8
static NOINLINE void PrepareSprites(int max_lines)
{
const struct PicoVideo *pvid=&Pico.video;
const struct PicoEState *est=&Pico.est;
int u,link=0,sh;
int table=0;
int *pd = HighPreSpr;
int max_sprites = 80, max_width = 328;
int max_line_sprites = 20; // 20 sprites, 40 tiles
if (!(Pico.video.reg[12]&1))
max_sprites = 64, max_line_sprites = 16, max_width = 264;
if (PicoIn.opt & POPT_DIS_SPRITE_LIM)
max_line_sprites = MAX_LINE_SPRITES;
sh = Pico.video.reg[0xC]&8; // shadow/hilight?
table=pvid->reg[5]&0x7f;
if (pvid->reg[12]&1) table&=0x7e; // Lowest bit 0 in 40-cell mode
table<<=8; // Get sprite table address/2
for (u = est->DrawScanline; u < max_lines; u++)
*((int *)&HighLnSpr[u][0]) = 0;
for (u = 0; u < max_sprites && link < max_sprites; u++)
{
unsigned int *sprite;
int code, code2, sx, sy, hv, height, width;
sprite=(unsigned int *)(PicoMem.vram+((table+(link<<2))&0x7ffc)); // Find sprite
// parse sprite info. the 1st half comes from the VDPs internal cache,
// the 2nd half is read from VRAM
code = VdpSATCache[link]; // normally but not always equal to sprite[0]
sy = (code&0x1ff)-0x80;
hv = (code>>24)&0xf;
height = (hv&3)+1;
width = (hv>>2)+1;
code2 = sprite[1];
sx = (code2>>16)&0x1ff;
sx -= 0x78; // Get X coordinate + 8
if (sy < max_lines && sy + (height<<3) >= est->DrawScanline) // sprite onscreen (y)?
{
int entry, y, w, sx_min, onscr_x, maybe_op = 0;
sx_min = 8-(width<<3);
onscr_x = sx_min < sx && sx < max_width;
if (sh && (code2 & 0x6000) == 0x6000)
maybe_op = SPRL_MAY_HAVE_OP;
entry = ((pd - HighPreSpr) / 2) | ((code2>>8)&0x80);
y = (sy >= est->DrawScanline) ? sy : est->DrawScanline;
for (; y < sy + (height<<3) && y < max_lines; y++)
{
unsigned char *p = &HighLnSpr[y][0];
int cnt = p[0];
if (p[3] >= max_line_sprites) continue; // sprite limit?
if (p[1] & SPRL_MASKED) continue; // masked?
w = width;
if (p[2] + width > max_line_sprites*2) { // tile limit?
if (y+1 < 240) HighLnSpr[y+1][1] |= SPRL_TILE_OVFL;
if (p[2] >= max_line_sprites*2) continue;
w = max_line_sprites*2 - p[2];
}
p[2] += w;
p[3] ++;
if (sx == -0x78) {
if (p[1] & (SPRL_HAVE_X|SPRL_TILE_OVFL))
p[1] |= SPRL_MASKED; // masked, no more sprites for this line
if (!(p[1] & SPRL_HAVE_X) && cnt == 0)
p[1] |= SPRL_HAVE_MASK0; // 1st sprite is masking
} else
p[1] |= SPRL_HAVE_X;
if (!onscr_x) continue; // offscreen x
p[4+cnt] = entry;
p[5+cnt] = w; // width clipped by tile limit for sprite renderer
p[0] = cnt + 1;
p[1] |= (entry & 0x80) ? SPRL_HAVE_HI : SPRL_HAVE_LO;
p[1] |= maybe_op; // there might be op sprites on this line
if (cnt > 0 && (code2 & 0x8000) && !(p[4+cnt-1]&0x80))
p[1] |= SPRL_LO_ABOVE_HI;
}
}
*pd++ = (width<<28)|(height<<24)|(hv<<16)|((unsigned short)sy);
*pd++ = (sx<<16)|((unsigned short)code2);
// Find next sprite
link=(code>>16)&0x7f;
if (!link) break; // End of sprites
}
*pd = 0;
#if 0
for (u = 0; u < max_lines; u++)
{
int y;
printf("c%03i: f %x c %2i/%2i w %2i: ", u, HighLnSpr[u][1],
HighLnSpr[u][0], HighLnSpr[u][3], HighLnSpr[u][2]);
for (y = 0; y < HighLnSpr[u][0]; y++) {
int *sp = HighPreSpr + (HighLnSpr[u][y+4]&0x7f) * 2;
printf(" %i(%x/%x)", HighLnSpr[u][y+4],sp[0],sp[1]);
}
printf("\n");
}
#endif
}
#ifndef _ASM_DRAW_C
static void DrawAllSprites(unsigned char *sprited, int prio, int sh,
struct PicoEState *est)
{
unsigned char *p;
int cnt, w;
cnt = sprited[0] & 0x7f;
if (cnt == 0) return;
p = &sprited[4];
if ((sprited[1] & (SPRL_TILE_OVFL|SPRL_HAVE_MASK0)) == (SPRL_TILE_OVFL|SPRL_HAVE_MASK0))
return; // masking effective due to tile overflow
// Go through sprites backwards:
w = p[cnt]; // possibly clipped width of last sprite
for (cnt--; cnt >= 0; cnt--, w = 0)
{
int *sp = HighPreSpr + (p[cnt]&0x7f) * 2;
if ((p[cnt] >> 7) != prio) continue;
DrawSprite(sp, sh, w);
}
}
// --------------------------------------------
void BackFill(int reg7, int sh, struct PicoEState *est)
{
unsigned int back;
// Start with a blank scanline (background colour):
back=reg7&0x3f;
back|=sh<<7; // shadow
back|=back<<8;
back|=back<<16;
memset32((int *)(est->HighCol+8), back, 320/4);
}
#endif
// --------------------------------------------
void PicoDoHighPal555_8bit(int sh, int line, struct PicoEState *est)
{
unsigned int *spal, *dpal;
unsigned int cnt = (sh ? 1 : est->SonicPalCount+1);
unsigned int t, i;
// reset dirty only if there are no outstanding changes
if (Pico.m.dirtyPal == 2)
Pico.m.dirtyPal = 0;
// In Sonic render mode palettes were backuped in SonicPal
spal = (void *)est->SonicPal;
dpal = (void *)est->HighPal;
// additional palettes stored after in-frame changes
for (i = 0; i < cnt * 0x40 / 2; i++) {
t = spal[i];
// treat it like it was 4-bit per channel, since in s/h mode it somewhat is that.
// otherwise intensity difference between this and s/h will be wrong
t = PXCONV(t);
t |= (t >> 4) & PXMASKL;
dpal[i] = dpal[0xc0/2 + i] = t;
}
// norm: xxx0, sh: 0xxx, hi: 0xxx + 7
if (sh)
{
// shadowed pixels
for (i = 0; i < 0x40 / 2; i++)
dpal[0x80/2 + i] = (dpal[i] >> 1) & PXMASKH;
// hilighted pixels
for (i = 0; i < 0x40 / 2; i++) {
t = ((dpal[i] >> 1) & PXMASKH) + PXMASKH;
t |= (t >> 4) & PXMASKL;
dpal[0x40/2 + i] = t;
}
// shadowed pixels in color 14 always appear normal (hw bug?)
unsigned short *hpal = est->HighPal;
hpal[0x80 + 0x0e] = hpal[0x0e];
hpal[0x80 + 0x1e] = hpal[0x1e];
hpal[0x80 + 0x2e] = hpal[0x2e];
}
}
#ifndef _ASM_DRAW_C
void PicoDoHighPal555(int sh, int line, struct PicoEState *est)
{
unsigned int *spal, *dpal;
unsigned int t, i;
Pico.m.dirtyPal = 0;
spal = (void *)PicoMem.cram;
dpal = (void *)est->HighPal;
for (i = 0; i < 0x40 / 2; i++) {
t = spal[i];
// treat it like it was 4-bit per channel, since in s/h mode it somewhat is that.
// otherwise intensity difference between this and s/h will be wrong
t = PXCONV(t);
t |= (t >> 4) & PXMASKL;
dpal[i] = dpal[0xc0/2 + i] = t;
}
// norm: xxx0, sh: 0xxx, hi: 0xxx + 7
if (sh)
{
// shadowed pixels
for (i = 0; i < 0x40 / 2; i++)
dpal[0x80/2 + i] = (dpal[i] >> 1) & PXMASKH;
// hilighted pixels
for (i = 0; i < 0x40 / 2; i++) {
t = ((dpal[i] >> 1) & PXMASKH) + PXMASKH;
t |= (t >> 4) & PXMASKL;
dpal[0x40/2 + i] = t;
}
// shadowed pixels in color 14 always appear normal (hw bug?)
unsigned short *hpal = est->HighPal;
hpal[0x80 + 0x0e] = hpal[0x0e];
hpal[0x80 + 0x1e] = hpal[0x1e];
hpal[0x80 + 0x2e] = hpal[0x2e];
}
}
void FinalizeLine555(int sh, int line, struct PicoEState *est)
{
unsigned short *pd=est->DrawLineDest;
unsigned char *ps=est->HighCol+8;
unsigned short *pal=est->HighPal;
int len;
PicoDrawUpdateHighPal();
if (Pico.video.reg[12]&1) {
len = 320;
} else {
if (!(PicoIn.opt&POPT_DIS_32C_BORDER)) pd+=32;
len = 256;
}
{
#if 1
int i;
for (i = len; i > 0; i-=4) {
*pd++ = pal[*ps++];
*pd++ = pal[*ps++];
*pd++ = pal[*ps++];
*pd++ = pal[*ps++];
}
#else
extern void amips_clut(unsigned short *dst, unsigned char *src, unsigned short *pal, int count);
extern void amips_clut_6bit(unsigned short *dst, unsigned char *src, unsigned short *pal, int count);
if (!sh)
amips_clut_6bit(pd, ps, pal, len);
else amips_clut(pd, ps, pal, len);
#endif
}
}
#endif
static void FinalizeLine8bit(int sh, int line, struct PicoEState *est)
{
unsigned char *pd = est->DrawLineDest;
int len;
static int dirty_line;
if (Pico.m.dirtyPal == 1)
{
// a hack for mid-frame palette changes
if (!(est->rendstatus & PDRAW_SONIC_MODE) | (line - dirty_line > 4)) {
// store a maximum of 2 additional palettes in SonicPal
if (est->SonicPalCount < 2)
est->SonicPalCount ++;
dirty_line = line;
est->rendstatus |= PDRAW_SONIC_MODE;
}
blockcpy(est->SonicPal+est->SonicPalCount*0x40, PicoMem.cram, 0x40*2);
Pico.m.dirtyPal = 2;
}
if (Pico.video.reg[12]&1) {
len = 320;
} else {
if (!(PicoIn.opt & POPT_DIS_32C_BORDER))
pd += 32;
len = 256;
}
if (DrawLineDestBase == HighColBase) {
if (!sh && (est->rendstatus & PDRAW_SONIC_MODE))
blockcpy_or(pd+8, est->HighCol+8, len, est->SonicPalCount*0x40);
} else if (!sh && (est->rendstatus & PDRAW_SONIC_MODE)) {
// select active backup palette
blockcpy_or(pd, est->HighCol+8, len, est->SonicPalCount*0x40);
} else {
blockcpy(pd, est->HighCol+8, len);
}
}
static void (*FinalizeLine)(int sh, int line, struct PicoEState *est);
// --------------------------------------------
static int DrawDisplay(int sh)
{
struct PicoEState *est=&Pico.est;
unsigned char *sprited = &HighLnSpr[est->DrawScanline][0];
struct PicoVideo *pvid=&Pico.video;
int win=0, edge=0, hvwind=0, lflags;
int maxw, maxcells;
est->rendstatus &= ~(PDRAW_SHHI_DONE|PDRAW_PLANE_HI_PRIO|PDRAW_WND_DIFF_PRIO);
if (pvid->reg[12]&1) {
maxw = 328; maxcells = 40;
} else {
maxw = 264; maxcells = 32;
}
// Find out if the window is on this line:
win=pvid->reg[0x12];
edge=(win&0x1f)<<3;
if (win&0x80) { if (est->DrawScanline>=edge) hvwind=1; }
else { if (est->DrawScanline< edge) hvwind=1; }
if (!hvwind) // we might have a vertical window here
{
win=pvid->reg[0x11];
edge=win&0x1f;
if (win&0x80) {
if (!edge) hvwind=1;
else if(edge < (maxcells>>1)) hvwind=2;
} else {
if (!edge);
else if(edge < (maxcells>>1)) hvwind=2;
else hvwind=1;
}
}
/* - layer B low - */
if (!(pvid->debug_p & PVD_KILL_B)) {
lflags = LF_PLANE_B | (sh<<1);
DrawLayer(lflags, HighCacheB, 0, maxcells, est);
}
/* - layer A low - */
lflags = LF_PLANE_A | (sh<<1);
if (pvid->debug_p & PVD_KILL_A)
;
else if (hvwind == 1)
DrawWindow(0, maxcells>>1, 0, sh, est);
else if (hvwind == 2) {
DrawLayer(lflags, HighCacheA, (win&0x80) ? 0 : edge<<1, (win&0x80) ? edge<<1 : maxcells, est);
DrawWindow( (win&0x80) ? edge : 0, (win&0x80) ? maxcells>>1 : edge, 0, sh, est);
}
else
DrawLayer(lflags, HighCacheA, 0, maxcells, est);
/* - sprites low - */
if (pvid->debug_p & PVD_KILL_S_LO)
;
else if (est->rendstatus & PDRAW_INTERLACE)
DrawAllSpritesInterlace(0, sh);
else if (sprited[1] & SPRL_HAVE_LO)
DrawAllSprites(sprited, 0, sh, est);
/* - layer B hi - */
if (!(pvid->debug_p & PVD_KILL_B) && HighCacheB[0])
DrawTilesFromCache(HighCacheB, sh, maxw, est);
/* - layer A hi - */
if (pvid->debug_p & PVD_KILL_A)
;
else if (hvwind == 1)
DrawWindow(0, maxcells>>1, 1, sh, est);
else if (hvwind == 2) {
if (HighCacheA[0])
DrawTilesFromCache(HighCacheA, sh, (win&0x80) ? edge<<4 : maxw, est);
DrawWindow((win&0x80) ? edge : 0, (win&0x80) ? maxcells>>1 : edge, 1, sh, est);
} else
if (HighCacheA[0])
DrawTilesFromCache(HighCacheA, sh, maxw, est);
/* - sprites hi - */
if (pvid->debug_p & PVD_KILL_S_HI)
;
else if (est->rendstatus & PDRAW_INTERLACE)
DrawAllSpritesInterlace(1, sh);
// have sprites without layer pri bit ontop of sprites with that bit
else if ((sprited[1] & SPRL_LO_ABOVE_HI) && (PicoIn.opt & POPT_ACC_SPRITES))
DrawSpritesHiAS(sprited, sh);
else if (sh && (sprited[1] & SPRL_MAY_HAVE_OP))
DrawSpritesSHi(sprited, est);
else if (sprited[1] & SPRL_HAVE_HI)
DrawAllSprites(sprited, 1, 0, est);
#ifdef FORCE
if (pvid->debug_p & PVD_FORCE_B) {
lflags = LF_PLANE_B | (sh<<1);
DrawLayerForced(lflags, 0, maxcells, est);
} else if (pvid->debug_p & PVD_FORCE_A) {
lflags = LF_PLANE_A | (sh<<1);
DrawLayerForced(lflags, 0, maxcells, est);
} else if (pvid->debug_p & PVD_FORCE_S)
DrawSpritesForced(sprited);
#endif
#if 0
{
int *c, a, b;
for (a = 0, c = HighCacheA; *c; c+=2, a++);
for (b = 0, c = HighCacheB; *c; c+=2, b++);
printf("%i:%03i: a=%i, b=%i\n", Pico.m.frame_count,
Pico.est.DrawScanline, a, b);
}
#endif
return 0;
}
// MUST be called every frame
PICO_INTERNAL void PicoFrameStart(void)
{
int offs = 8, lines = 224;
int dirty = ((Pico.est.rendstatus & PDRAW_SONIC_MODE) || Pico.m.dirtyPal);
int sprep = Pico.est.rendstatus & (PDRAW_SPRITES_MOVED|PDRAW_DIRTY_SPRITES);
int skipped = Pico.est.rendstatus & PDRAW_SKIP_FRAME;
// prepare to do this frame
Pico.est.rendstatus = 0;
if ((Pico.video.reg[12] & 6) == 6)
Pico.est.rendstatus |= PDRAW_INTERLACE; // interlace mode
if (!(Pico.video.reg[12] & 1))
Pico.est.rendstatus |= PDRAW_32_COLS;
if (Pico.video.reg[1] & 8) {
offs = 0;
lines = 240;
}
if (Pico.est.rendstatus != rendstatus_old || lines != rendlines) {
rendlines = lines;
// mode_change() might reset rendstatus_old by calling SetColorFormat
emu_video_mode_change((lines == 240) ? 0 : 8,
lines, (Pico.video.reg[12] & 1) ? 0 : 1);
rendstatus_old = Pico.est.rendstatus;
}
if (PicoIn.skipFrame) // preserve this until something is rendered at last
Pico.est.rendstatus |= PDRAW_SKIP_FRAME;
if (sprep | skipped)
Pico.est.rendstatus |= PDRAW_PARSE_SPRITES;
Pico.est.HighCol = HighColBase + offs * HighColIncrement;
Pico.est.DrawLineDest = (char *)DrawLineDestBase + offs * DrawLineDestIncrement;
Pico.est.DrawScanline = 0;
skip_next_line = 0;
if (FinalizeLine == FinalizeLine8bit) {
// make a backup of the current palette in case Sonic mode is detected later
Pico.est.SonicPalCount = 0;
Pico.m.dirtyPal = (dirty ? 2 : 0); // mark as dirty but already copied
blockcpy(Pico.est.SonicPal, PicoMem.cram, 0x40*2);
}
if (PicoIn.opt & POPT_ALT_RENDERER)
return;
}
static void DrawBlankedLine(int line, int offs, int sh, int bgc)
{
if (PicoScanBegin != NULL)
PicoScanBegin(line + offs);
BackFill(bgc, sh, &Pico.est);
if (FinalizeLine != NULL)
FinalizeLine(sh, line, &Pico.est);
if (PicoScanEnd != NULL)
PicoScanEnd(line + offs);
Pico.est.HighCol += HighColIncrement;
Pico.est.DrawLineDest = (char *)Pico.est.DrawLineDest + DrawLineDestIncrement;
}
static void PicoLine(int line, int offs, int sh, int bgc)
{
int skip = 0;
if (skip_next_line > 0) {
skip_next_line--;
return;
}
Pico.est.DrawScanline = line;
if (PicoScanBegin != NULL)
skip = PicoScanBegin(line + offs);
if (skip) {
skip_next_line = skip - 1;
return;
}
if (Pico.video.debug_p & (PVD_FORCE_A | PVD_FORCE_B | PVD_FORCE_S))
bgc = 0x3f;
// Draw screen:
BackFill(bgc, sh, &Pico.est);
if (Pico.video.reg[1]&0x40)
DrawDisplay(sh);
if (FinalizeLine != NULL)
FinalizeLine(sh, line, &Pico.est);
if (PicoScanEnd != NULL)
skip_next_line = PicoScanEnd(line + offs);
Pico.est.HighCol += HighColIncrement;
Pico.est.DrawLineDest = (char *)Pico.est.DrawLineDest + DrawLineDestIncrement;
}
void PicoDrawSync(int to, int blank_last_line)
{
struct PicoEState *est = &Pico.est;
int line, offs = 0;
int sh = (Pico.video.reg[0xC] & 8) >> 3; // shadow/hilight?
int bgc = Pico.video.reg[7];
pprof_start(draw);
if (rendlines != 240) {
offs = 8;
if (to > 223)
to = 223;
}
if (est->DrawScanline <= to - blank_last_line && (est->rendstatus &
(PDRAW_SPRITES_MOVED|PDRAW_DIRTY_SPRITES|PDRAW_PARSE_SPRITES)))
PrepareSprites(to - blank_last_line + 1);
for (line = est->DrawScanline; line < to; line++)
PicoLine(line, offs, sh, bgc);
// last line
if (line <= to)
{
if (blank_last_line)
DrawBlankedLine(line, offs, sh, bgc);
else PicoLine(line, offs, sh, bgc);
line++;
}
est->DrawScanline = line;
pprof_end(draw);
}
// also works for fast renderer
void PicoDrawUpdateHighPal(void)
{
struct PicoEState *est = &Pico.est;
if (Pico.m.dirtyPal) {
int sh = (Pico.video.reg[0xC] & 8) >> 3; // shadow/hilight?
if ((PicoIn.opt & POPT_ALT_RENDERER) | (est->rendstatus & PDRAW_SONIC_MODE))
sh = 0; // no s/h support
if (PicoIn.AHW & PAHW_SMS)
PicoDoHighPal555M4();
else if (FinalizeLine == FinalizeLine8bit)
PicoDoHighPal555_8bit(sh, 0, est);
else
PicoDoHighPal555(sh, 0, est);
// cover for sprite priority bits if not in s/h or sonic mode
if (!sh && !(est->rendstatus & PDRAW_SONIC_MODE)) {
blockcpy(est->HighPal+0x40, est->HighPal, 0x40*2);
blockcpy(est->HighPal+0x80, est->HighPal, 0x80*2);
}
}
}
void PicoDrawSetOutFormat(pdso_t which, int use_32x_line_mode)
{
PicoDrawSetInternalBuf(NULL, 0);
switch (which)
{
case PDF_8BIT:
FinalizeLine = FinalizeLine8bit;
break;
case PDF_RGB555:
if ((PicoIn.AHW & PAHW_32X) && use_32x_line_mode)
FinalizeLine = FinalizeLine32xRGB555;
else
FinalizeLine = FinalizeLine555;
break;
default:
FinalizeLine = NULL;
PicoDrawSetOutBufMD(Pico.est.Draw2FB+8, 328);
break;
}
if (PicoIn.AHW & PAHW_32X)
PicoDrawSetOutFormat32x(which, use_32x_line_mode);
PicoDrawSetOutputMode4(which);
rendstatus_old = -1;
}
void PicoDrawSetOutBufMD(void *dest, int increment)
{
if (FinalizeLine == FinalizeLine8bit && increment == 328) {
// kludge for no-copy mode
PicoDrawSetInternalBuf(dest, increment);
}
if (dest != NULL) {
DrawLineDestBase = dest;
DrawLineDestIncrement = increment;
Pico.est.DrawLineDest = (char *)DrawLineDestBase + Pico.est.DrawScanline * increment;
}
else {
DrawLineDestBase = DefOutBuff;
DrawLineDestIncrement = 0;
Pico.est.DrawLineDest = DefOutBuff;
}
}
// note: may be called on the middle of frame
void PicoDrawSetOutBuf(void *dest, int increment)
{
if (PicoIn.AHW & PAHW_32X)
PicoDrawSetOutBuf32X(dest, increment);
else
PicoDrawSetOutBufMD(dest, increment);
}
void PicoDrawSetInternalBuf(void *dest, int increment)
{
if (dest != NULL) {
HighColBase = dest;
HighColIncrement = increment;
Pico.est.HighCol = HighColBase + Pico.est.DrawScanline * increment;
}
else {
HighColBase = DefHighCol;
HighColIncrement = 0;
Pico.est.HighCol = DefHighCol;
}
}
void PicoDrawSetCallbacks(int (*begin)(unsigned int num), int (*end)(unsigned int num))
{
PicoScanBegin = NULL;
PicoScanEnd = NULL;
PicoScan32xBegin = NULL;
PicoScan32xEnd = NULL;
if ((PicoIn.AHW & PAHW_32X) && FinalizeLine != FinalizeLine32xRGB555) {
PicoScan32xBegin = begin;
PicoScan32xEnd = end;
}
else {
PicoScanBegin = begin;
PicoScanEnd = end;
}
}
void PicoDrawInit(void)
{
Pico.est.DrawLineDest = DefOutBuff;
Pico.est.HighCol = HighColBase;
Pico.est.HighPreSpr = HighPreSpr;
rendstatus_old = -1;
}
// vim:ts=2:sw=2:expandtab