mirror of
https://github.com/RaySollium99/picodrive.git
synced 2025-09-05 07:17:45 -04:00
sdl, complete overhaul of hardware/software scaling
This commit is contained in:
parent
6651998e9f
commit
d5d1778252
21 changed files with 1233 additions and 547 deletions
2
Makefile
2
Makefile
|
@ -210,7 +210,7 @@ endif
|
||||||
ifeq "$(USE_FRONTEND)" "1"
|
ifeq "$(USE_FRONTEND)" "1"
|
||||||
|
|
||||||
# common
|
# common
|
||||||
OBJS += platform/common/main.o platform/common/emu.o \
|
OBJS += platform/common/main.o platform/common/emu.o platform/common/upscale.o \
|
||||||
platform/common/menu_pico.o platform/common/config_file.o
|
platform/common/menu_pico.o platform/common/config_file.o
|
||||||
|
|
||||||
# libpicofe
|
# libpicofe
|
||||||
|
|
|
@ -122,7 +122,7 @@ void FinalizeLine32xRGB555(int sh, int line, struct PicoEState *est)
|
||||||
FinalizeLine555(sh, line, est);
|
FinalizeLine555(sh, line, est);
|
||||||
|
|
||||||
if ((Pico32x.vdp_regs[0] & P32XV_Mx) == 0 || // 32x blanking
|
if ((Pico32x.vdp_regs[0] & P32XV_Mx) == 0 || // 32x blanking
|
||||||
// XXX: how is 32col mode hadled by real hardware?
|
// XXX: how is 32col mode handled by real hardware?
|
||||||
!(Pico.video.reg[12] & 1) || // 32col mode
|
!(Pico.video.reg[12] & 1) || // 32col mode
|
||||||
(Pico.video.debug_p & PVD_KILL_32X))
|
(Pico.video.debug_p & PVD_KILL_32X))
|
||||||
{
|
{
|
||||||
|
@ -162,6 +162,7 @@ void FinalizeLine32xRGB555(int sh, int line, struct PicoEState *est)
|
||||||
|
|
||||||
#define PICOSCAN_POST \
|
#define PICOSCAN_POST \
|
||||||
PicoScan32xEnd(l + (lines_sft_offs & 0xff)); \
|
PicoScan32xEnd(l + (lines_sft_offs & 0xff)); \
|
||||||
|
Pico.est.DrawLineDest = (char *)Pico.est.DrawLineDest + DrawLineDestIncrement32x; \
|
||||||
|
|
||||||
#define make_do_loop(name, pre_code, post_code, md_code) \
|
#define make_do_loop(name, pre_code, post_code, md_code) \
|
||||||
/* Direct Color Mode */ \
|
/* Direct Color Mode */ \
|
||||||
|
@ -260,6 +261,7 @@ void PicoDraw32xLayer(int offs, int lines, int md_bg)
|
||||||
int which_func;
|
int which_func;
|
||||||
|
|
||||||
Pico.est.DrawLineDest = (char *)DrawLineDestBase32x + offs * DrawLineDestIncrement32x;
|
Pico.est.DrawLineDest = (char *)DrawLineDestBase32x + offs * DrawLineDestIncrement32x;
|
||||||
|
Pico.est.DrawLineDestIncr = DrawLineDestIncrement32x;
|
||||||
dram = Pico32xMem->dram[Pico32x.vdp_regs[0x0a/2] & P32XV_FS];
|
dram = Pico32xMem->dram[Pico32x.vdp_regs[0x0a/2] & P32XV_FS];
|
||||||
|
|
||||||
if (Pico32xDrawMode == PDM32X_BOTH)
|
if (Pico32xDrawMode == PDM32X_BOTH)
|
||||||
|
@ -330,7 +332,7 @@ void PicoDraw32xLayerMdOnly(int offs, int lines)
|
||||||
dst[p + 2] = pal[*pmd++];
|
dst[p + 2] = pal[*pmd++];
|
||||||
dst[p + 3] = pal[*pmd++];
|
dst[p + 3] = pal[*pmd++];
|
||||||
}
|
}
|
||||||
dst = (void *)((char *)dst + DrawLineDestIncrement32x);
|
dst = Pico.est.DrawLineDest = (char *)dst + DrawLineDestIncrement32x;
|
||||||
pmd += 328 - plen;
|
pmd += 328 - plen;
|
||||||
if (have_scan)
|
if (have_scan)
|
||||||
PicoScan32xEnd(l + offs);
|
PicoScan32xEnd(l + offs);
|
||||||
|
|
|
@ -20,11 +20,11 @@
|
||||||
|
|
||||||
PIC_LDR_INIT()
|
PIC_LDR_INIT()
|
||||||
|
|
||||||
.macro call_scan_prep cond est @ &Pico.est
|
.macro call_scan_prep cond pico @ &Pico
|
||||||
.if \cond
|
.if \cond
|
||||||
PIC_LDR(r4, r6, PicoScan32xBegin)
|
PIC_LDR(r4, r6, PicoScan32xBegin)
|
||||||
PIC_LDR(r5, r6, PicoScan32xEnd)
|
PIC_LDR(r5, r6, PicoScan32xEnd)
|
||||||
ldr r6, [\est, #OFS_EST_DrawLineDest]
|
add r6, \pico, #OFS_Pico_est
|
||||||
ldr r4, [r4]
|
ldr r4, [r4]
|
||||||
ldr r5, [r5]
|
ldr r5, [r5]
|
||||||
stmfd sp!, {r4,r5,r6}
|
stmfd sp!, {r4,r5,r6}
|
||||||
|
@ -44,9 +44,9 @@
|
||||||
add r0, r0, r4
|
add r0, r0, r4
|
||||||
mov lr, pc
|
mov lr, pc
|
||||||
ldr pc, [sp, #(3+0)*4]
|
ldr pc, [sp, #(3+0)*4]
|
||||||
ldr r0, [sp, #(3+2)*4] @ &DrawLineDest
|
ldr r0, [sp, #(3+2)*4] @ &Pico.est
|
||||||
ldmfd sp!, {r1-r3}
|
ldmfd sp!, {r1-r3}
|
||||||
ldr r0, [r0]
|
ldr r0, [r0, #OFS_EST_DrawLineDest]
|
||||||
.endif
|
.endif
|
||||||
.endm
|
.endm
|
||||||
|
|
||||||
|
@ -57,6 +57,11 @@
|
||||||
add r0, r0, r4
|
add r0, r0, r4
|
||||||
mov lr, pc
|
mov lr, pc
|
||||||
ldr pc, [sp, #(4+1)*4]
|
ldr pc, [sp, #(4+1)*4]
|
||||||
|
ldr r1, [sp, #(3+2)*4] @ &Pico.est
|
||||||
|
ldr r0, [r1, #OFS_EST_DrawLineDest]
|
||||||
|
ldr r2, [r1, #OFS_EST_DrawLineDestIncr]
|
||||||
|
add r0, r0, r2
|
||||||
|
str r0, [r1]
|
||||||
ldmfd sp!, {r0-r3}
|
ldmfd sp!, {r0-r3}
|
||||||
.endif
|
.endif
|
||||||
.endm
|
.endm
|
||||||
|
@ -71,6 +76,7 @@
|
||||||
PIC_LDR(lr, r9, Pico)
|
PIC_LDR(lr, r9, Pico)
|
||||||
PIC_LDR(r10,r9, Pico32x)
|
PIC_LDR(r10,r9, Pico32x)
|
||||||
ldr r11, [lr, #OFS_Pico_est+OFS_EST_Draw2FB]
|
ldr r11, [lr, #OFS_Pico_est+OFS_EST_Draw2FB]
|
||||||
|
ldr r12, [lr, #OFS_Pico_est+OFS_EST_DrawLineDestIncr]
|
||||||
ldrh r10,[r10, #0x40] @ Pico32x.vdp_regs[0]
|
ldrh r10,[r10, #0x40] @ Pico32x.vdp_regs[0]
|
||||||
add r9, lr, #OFS_Pico_est+OFS_EST_HighPal @ palmd
|
add r9, lr, #OFS_Pico_est+OFS_EST_HighPal @ palmd
|
||||||
|
|
||||||
|
@ -88,6 +94,9 @@
|
||||||
|
|
||||||
0: @ loop_outer:
|
0: @ loop_outer:
|
||||||
call_scan_end \call_scan
|
call_scan_end \call_scan
|
||||||
|
ldr r12, [r9, #OFS_EST_DrawLineDestIncr-OFS_EST_HighPal]
|
||||||
|
sub r0, r0, #320*2
|
||||||
|
add r0, r0, r12
|
||||||
add r4, r4, #1
|
add r4, r4, #1
|
||||||
cmp r4, r2, lsr #16
|
cmp r4, r2, lsr #16
|
||||||
call_scan_fin_ge \call_scan
|
call_scan_fin_ge \call_scan
|
||||||
|
@ -248,6 +257,9 @@
|
||||||
|
|
||||||
0: @ loop_outer:
|
0: @ loop_outer:
|
||||||
call_scan_end \call_scan
|
call_scan_end \call_scan
|
||||||
|
ldr r12, [r9, #OFS_EST_DrawLineDestIncr-OFS_EST_HighPal]
|
||||||
|
sub r0, r0, #320*2
|
||||||
|
add r0, r0, r12
|
||||||
add r4, r4, #1
|
add r4, r4, #1
|
||||||
cmp r4, r2, lsr #16
|
cmp r4, r2, lsr #16
|
||||||
call_scan_fin_ge \call_scan
|
call_scan_fin_ge \call_scan
|
||||||
|
@ -417,6 +429,9 @@
|
||||||
|
|
||||||
0: @ loop_outer:
|
0: @ loop_outer:
|
||||||
call_scan_end \call_scan
|
call_scan_end \call_scan
|
||||||
|
ldr r12, [r9, #OFS_EST_DrawLineDestIncr-OFS_EST_HighPal]
|
||||||
|
sub r0, r0, #320*2
|
||||||
|
add r0, r0, r12
|
||||||
add r4, r4, #1
|
add r4, r4, #1
|
||||||
cmp r4, r2, lsr #16
|
cmp r4, r2, lsr #16
|
||||||
call_scan_fin_ge \call_scan
|
call_scan_fin_ge \call_scan
|
||||||
|
|
67
pico/draw.c
67
pico/draw.c
|
@ -44,6 +44,8 @@
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#include "pico_int.h"
|
#include "pico_int.h"
|
||||||
|
#include <platform/common/upscale.h>
|
||||||
|
|
||||||
#define FORCE // layer forcing via debug register?
|
#define FORCE // layer forcing via debug register?
|
||||||
|
|
||||||
int (*PicoScanBegin)(unsigned int num) = NULL;
|
int (*PicoScanBegin)(unsigned int num) = NULL;
|
||||||
|
@ -1407,7 +1409,7 @@ static NOINLINE void PrepareSprites(int max_lines)
|
||||||
|
|
||||||
if (!(Pico.video.reg[12]&1))
|
if (!(Pico.video.reg[12]&1))
|
||||||
max_sprites = 64, max_line_sprites = 16, max_width = 264;
|
max_sprites = 64, max_line_sprites = 16, max_width = 264;
|
||||||
if (PicoIn.opt & POPT_DIS_SPRITE_LIM)
|
if (*est->PicoOpt & POPT_DIS_SPRITE_LIM)
|
||||||
max_line_sprites = MAX_LINE_SPRITES;
|
max_line_sprites = MAX_LINE_SPRITES;
|
||||||
|
|
||||||
sh = Pico.video.reg[0xC]&8; // shadow/hilight?
|
sh = Pico.video.reg[0xC]&8; // shadow/hilight?
|
||||||
|
@ -1643,20 +1645,20 @@ void FinalizeLine555(int sh, int line, struct PicoEState *est)
|
||||||
if (Pico.video.reg[12]&1) {
|
if (Pico.video.reg[12]&1) {
|
||||||
len = 320;
|
len = 320;
|
||||||
} else {
|
} else {
|
||||||
if (!(PicoIn.opt&POPT_DIS_32C_BORDER)) pd+=32;
|
|
||||||
len = 256;
|
len = 256;
|
||||||
}
|
}
|
||||||
|
|
||||||
{
|
if ((*est->PicoOpt & POPT_EN_SOFTSCALE) && len == 256) {
|
||||||
#if 1
|
switch (PicoIn.filter) {
|
||||||
int i;
|
case 3: h_upscale_bl4_4_5(pd, 320, ps, 256, 256, f_pal); break;
|
||||||
|
case 2: h_upscale_bl2_4_5(pd, 320, ps, 256, 256, f_pal); break;
|
||||||
for (i = len; i > 0; i-=4) {
|
case 1: h_upscale_snn_4_5(pd, 320, ps, 256, 256, f_pal); break;
|
||||||
*pd++ = pal[*ps++];
|
default: h_upscale_nn_4_5(pd, 320, ps, 256, 256, f_pal); break;
|
||||||
*pd++ = pal[*ps++];
|
|
||||||
*pd++ = pal[*ps++];
|
|
||||||
*pd++ = pal[*ps++];
|
|
||||||
}
|
}
|
||||||
|
} else {
|
||||||
|
if (!(*est->PicoOpt & POPT_DIS_32C_BORDER) && len == 256) pd += 32;
|
||||||
|
#if 1
|
||||||
|
h_copy(pd, 320, ps, 320, len, f_pal);
|
||||||
#else
|
#else
|
||||||
extern void amips_clut(unsigned short *dst, unsigned char *src, unsigned short *pal, int count);
|
extern void amips_clut(unsigned short *dst, unsigned char *src, unsigned short *pal, int count);
|
||||||
extern void amips_clut_6bit(unsigned short *dst, unsigned char *src, unsigned short *pal, int count);
|
extern void amips_clut_6bit(unsigned short *dst, unsigned char *src, unsigned short *pal, int count);
|
||||||
|
@ -1691,21 +1693,34 @@ static void FinalizeLine8bit(int sh, int line, struct PicoEState *est)
|
||||||
if (Pico.video.reg[12]&1) {
|
if (Pico.video.reg[12]&1) {
|
||||||
len = 320;
|
len = 320;
|
||||||
} else {
|
} else {
|
||||||
if (!(PicoIn.opt & POPT_DIS_32C_BORDER))
|
|
||||||
pd += 32;
|
|
||||||
len = 256;
|
len = 256;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (DrawLineDestIncrement == 0) {
|
if ((PicoIn.opt & POPT_EN_SOFTSCALE) && len == 256) {
|
||||||
|
unsigned char *ps = est->HighCol+8;
|
||||||
|
unsigned char pal = 0;
|
||||||
|
|
||||||
if (!sh && (est->rendstatus & PDRAW_SONIC_MODE))
|
if (!sh && (est->rendstatus & PDRAW_SONIC_MODE))
|
||||||
blockcpy_or(pd+8, est->HighCol+8, len, est->SonicPalCount*0x40);
|
pal = est->SonicPalCount*0x40;
|
||||||
} else if (!sh && (est->rendstatus & PDRAW_SONIC_MODE)) {
|
if (DrawLineDestIncrement == 0)
|
||||||
|
pd = est->HighCol+8;
|
||||||
|
// Smoothing can't be used with CLUT, hence it's always Nearest Neighbour.
|
||||||
|
// use reverse version since src and dest ptr may be the same.
|
||||||
|
rh_upscale_nn_4_5(pd, 320, ps, 256, len, f_or);
|
||||||
|
} else if (DrawLineDestIncrement == 0) {
|
||||||
|
if (!sh && (est->rendstatus & PDRAW_SONIC_MODE))
|
||||||
|
blockcpy_or(est->HighCol+8, est->HighCol+8, len, est->SonicPalCount*0x40);
|
||||||
|
} else {
|
||||||
|
if (!(PicoIn.opt & POPT_DIS_32C_BORDER))
|
||||||
|
pd += 32;
|
||||||
|
if (!sh && (est->rendstatus & PDRAW_SONIC_MODE)) {
|
||||||
// select active backup palette
|
// select active backup palette
|
||||||
blockcpy_or(pd, est->HighCol+8, len, est->SonicPalCount*0x40);
|
blockcpy_or(pd, est->HighCol+8, len, est->SonicPalCount*0x40);
|
||||||
} else {
|
} else {
|
||||||
blockcpy(pd, est->HighCol+8, len);
|
blockcpy(pd, est->HighCol+8, len);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
static void (*FinalizeLine)(int sh, int line, struct PicoEState *est);
|
static void (*FinalizeLine)(int sh, int line, struct PicoEState *est);
|
||||||
|
|
||||||
|
@ -1828,7 +1843,7 @@ static int DrawDisplay(int sh)
|
||||||
// MUST be called every frame
|
// MUST be called every frame
|
||||||
PICO_INTERNAL void PicoFrameStart(void)
|
PICO_INTERNAL void PicoFrameStart(void)
|
||||||
{
|
{
|
||||||
int offs = 8, lines = 224;
|
int loffs = 8, lines = 224, coffs = 0, columns = 320;
|
||||||
int dirty = ((Pico.est.rendstatus & PDRAW_SONIC_MODE) || Pico.m.dirtyPal);
|
int dirty = ((Pico.est.rendstatus & PDRAW_SONIC_MODE) || Pico.m.dirtyPal);
|
||||||
int sprep = Pico.est.rendstatus & (PDRAW_SPRITES_MOVED|PDRAW_DIRTY_SPRITES);
|
int sprep = Pico.est.rendstatus & (PDRAW_SPRITES_MOVED|PDRAW_DIRTY_SPRITES);
|
||||||
int skipped = Pico.est.rendstatus & PDRAW_SKIP_FRAME;
|
int skipped = Pico.est.rendstatus & PDRAW_SKIP_FRAME;
|
||||||
|
@ -1837,19 +1852,25 @@ PICO_INTERNAL void PicoFrameStart(void)
|
||||||
Pico.est.rendstatus = 0;
|
Pico.est.rendstatus = 0;
|
||||||
if ((Pico.video.reg[12] & 6) == 6)
|
if ((Pico.video.reg[12] & 6) == 6)
|
||||||
Pico.est.rendstatus |= PDRAW_INTERLACE; // interlace mode
|
Pico.est.rendstatus |= PDRAW_INTERLACE; // interlace mode
|
||||||
if (!(Pico.video.reg[12] & 1))
|
if (!(Pico.video.reg[12] & 1)) {
|
||||||
Pico.est.rendstatus |= PDRAW_32_COLS;
|
Pico.est.rendstatus |= PDRAW_32_COLS;
|
||||||
|
if (!(PicoIn.opt & POPT_EN_SOFTSCALE)) {
|
||||||
|
columns = 256;
|
||||||
|
coffs = 32;
|
||||||
|
}
|
||||||
|
}
|
||||||
if (Pico.video.reg[1] & 8) {
|
if (Pico.video.reg[1] & 8) {
|
||||||
Pico.est.rendstatus |= PDRAW_30_ROWS;
|
Pico.est.rendstatus |= PDRAW_30_ROWS;
|
||||||
offs = 0;
|
|
||||||
lines = 240;
|
lines = 240;
|
||||||
|
loffs = 0;
|
||||||
}
|
}
|
||||||
|
if (PicoIn.opt & POPT_DIS_32C_BORDER)
|
||||||
|
coffs = 0;
|
||||||
|
|
||||||
if (Pico.est.rendstatus != rendstatus_old || lines != rendlines) {
|
if (Pico.est.rendstatus != rendstatus_old || lines != rendlines) {
|
||||||
rendlines = lines;
|
rendlines = lines;
|
||||||
// mode_change() might reset rendstatus_old by calling SetColorFormat
|
// mode_change() might reset rendstatus_old by calling SetColorFormat
|
||||||
emu_video_mode_change((lines == 240) ? 0 : 8,
|
emu_video_mode_change(loffs, lines, coffs, columns);
|
||||||
lines, (Pico.video.reg[12] & 1) ? 0 : 1);
|
|
||||||
rendstatus_old = Pico.est.rendstatus;
|
rendstatus_old = Pico.est.rendstatus;
|
||||||
}
|
}
|
||||||
if (PicoIn.skipFrame) // preserve this until something is rendered at last
|
if (PicoIn.skipFrame) // preserve this until something is rendered at last
|
||||||
|
@ -1857,8 +1878,8 @@ PICO_INTERNAL void PicoFrameStart(void)
|
||||||
if (sprep | skipped)
|
if (sprep | skipped)
|
||||||
Pico.est.rendstatus |= PDRAW_PARSE_SPRITES;
|
Pico.est.rendstatus |= PDRAW_PARSE_SPRITES;
|
||||||
|
|
||||||
Pico.est.HighCol = HighColBase + offs * HighColIncrement;
|
Pico.est.HighCol = HighColBase + loffs * HighColIncrement;
|
||||||
Pico.est.DrawLineDest = (char *)DrawLineDestBase + offs * DrawLineDestIncrement;
|
Pico.est.DrawLineDest = (char *)DrawLineDestBase + loffs * DrawLineDestIncrement;
|
||||||
Pico.est.DrawScanline = 0;
|
Pico.est.DrawScanline = 0;
|
||||||
skip_next_line = 0;
|
skip_next_line = 0;
|
||||||
|
|
||||||
|
|
207
pico/draw_arm.S
207
pico/draw_arm.S
|
@ -1653,9 +1653,9 @@ FinalizeLine555:
|
||||||
tst r12, #1
|
tst r12, #1
|
||||||
movne r2, #320/8 @ len
|
movne r2, #320/8 @ len
|
||||||
bne .fl_no32colRGB555
|
bne .fl_no32colRGB555
|
||||||
ldr r4, [r10, #OFS_EST_PicoOpt]
|
ldr r5, [r10, #OFS_EST_PicoOpt]
|
||||||
mov r2, #256/8
|
mov r2, #256/8
|
||||||
ldr r4, [r4]
|
ldr r4, [r5]
|
||||||
tst r4, #0x4000
|
tst r4, #0x4000
|
||||||
bne .fl_32scale_RGB555
|
bne .fl_32scale_RGB555
|
||||||
tst r4, #0x0100
|
tst r4, #0x0100
|
||||||
|
@ -1705,15 +1705,25 @@ FinalizeLine555:
|
||||||
|
|
||||||
|
|
||||||
.fl_32scale_RGB555:
|
.fl_32scale_RGB555:
|
||||||
mov r9, #0x3900 @ f800 07e0 001f | e000 0780 001c | 3800 01e0 0007
|
ldr r5, [r5, #OFS_PicoIn_filter-OFS_PicoIn_opt]
|
||||||
orr r9, r9, #0x00e7
|
|
||||||
|
mov r9, #0xf700 @ f800 07e0 001f | e000 0780 001c | 3800 01e0 0007
|
||||||
|
orr r9, r9, #0x00de
|
||||||
|
|
||||||
#ifdef UNALIGNED_DRAWLINEDEST
|
#ifdef UNALIGNED_DRAWLINEDEST
|
||||||
tst r0, #2
|
tst r0, #2
|
||||||
bne .fl_32scale_RGB555u
|
bne .fl_32scale_RGB555u
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
.fl_loop32scale_RGB555:
|
ands r5, r5, #0x3
|
||||||
|
addne pc, pc, r5, lsl #2
|
||||||
|
b .fl_32scale_nn
|
||||||
|
b .fl_32scale_nn
|
||||||
|
b .fl_32scale_snn
|
||||||
|
b .fl_32scale_bl2
|
||||||
|
b .fl_32scale_bl4
|
||||||
|
|
||||||
|
.fl_32scale_nn:
|
||||||
ldr r12, [r1], #4
|
ldr r12, [r1], #4
|
||||||
ldr r7, [r1], #4
|
ldr r7, [r1], #4
|
||||||
|
|
||||||
|
@ -1721,16 +1731,163 @@ FinalizeLine555:
|
||||||
ldrh r4, [r3, r4]
|
ldrh r4, [r3, r4]
|
||||||
and r5, lr, r12, lsr #7
|
and r5, lr, r12, lsr #7
|
||||||
ldrh r5, [r3, r5]
|
ldrh r5, [r3, r5]
|
||||||
and r4, r4, r9, lsl #2
|
and r6, lr, r12, lsr #15
|
||||||
|
ldrh r6, [r3, r6]
|
||||||
|
and r10,lr, r12, lsr #23
|
||||||
|
ldrh r10,[r3, r10]
|
||||||
|
|
||||||
|
orr r4, r4, r5, lsl #16
|
||||||
|
orr r5, r6, r6, lsl #16
|
||||||
|
|
||||||
|
and r6, lr, r7, lsl #1
|
||||||
|
ldrh r6, [r3, r6]
|
||||||
|
and r8, lr, r7, lsr #7
|
||||||
|
ldrh r8, [r3, r8]
|
||||||
|
and r12,lr, r7, lsr #15
|
||||||
|
ldrh r12,[r3, r12]
|
||||||
|
and r7, lr, r7, lsr #23
|
||||||
|
ldrh r7, [r3, r7]
|
||||||
|
|
||||||
|
orr r6, r10,r6, lsl #16
|
||||||
|
orr r8, r8,r12, lsl #16
|
||||||
|
|
||||||
|
subs r2, r2, #1
|
||||||
|
|
||||||
|
orr r10,r12,r7, lsl #16
|
||||||
|
|
||||||
|
stmia r0!, {r4,r5,r6,r8,r10}
|
||||||
|
bne .fl_32scale_nn
|
||||||
|
|
||||||
|
ldmfd sp!, {r4-r10,pc}
|
||||||
|
|
||||||
|
.fl_32scale_snn:
|
||||||
|
ldr r12, [r1], #4
|
||||||
|
ldr r7, [r1], #4
|
||||||
|
|
||||||
|
and r4, lr, r12, lsl #1
|
||||||
|
ldrh r4, [r3, r4]
|
||||||
|
and r5, lr, r12, lsr #7
|
||||||
|
ldrh r5, [r3, r5]
|
||||||
|
and r6, lr, r12, lsr #15
|
||||||
|
ldrh r6, [r3, r6]
|
||||||
|
and r10,lr, r12, lsr #23
|
||||||
|
ldrh r10,[r3, r10]
|
||||||
|
|
||||||
|
and r4, r4, r9
|
||||||
|
and r5, r5, r9
|
||||||
|
orr r4, r4, r5, lsl #16
|
||||||
|
and r6, r6, r9
|
||||||
|
add r5, r5, r6
|
||||||
|
mov r5, r5, lsr #1
|
||||||
|
orr r5, r5, r6, lsl #16
|
||||||
|
|
||||||
|
and r6, lr, r7, lsl #1
|
||||||
|
ldrh r6, [r3, r6]
|
||||||
|
and r8, lr, r7, lsr #7
|
||||||
|
ldrh r8, [r3, r8]
|
||||||
|
and r12,lr, r7, lsr #15
|
||||||
|
ldrh r12,[r3, r12]
|
||||||
|
and r7, lr, r7, lsr #23
|
||||||
|
ldrh r7, [r3, r7]
|
||||||
|
|
||||||
|
and r6, r6, r9
|
||||||
|
and r10,r10,r9
|
||||||
|
orr r6, r10,r6, lsl #16
|
||||||
|
and r12,r12,r9
|
||||||
|
and r7, r7, r9
|
||||||
|
orr r10,r12,r7, lsl #16
|
||||||
|
|
||||||
|
and r8, r8, r9
|
||||||
|
add r12,r12,r8
|
||||||
|
mov r12,r12,lsr #1
|
||||||
|
orr r8, r8,r12, lsl #16
|
||||||
|
|
||||||
|
subs r2, r2, #1
|
||||||
|
|
||||||
|
stmia r0!, {r4,r5,r6,r8,r10}
|
||||||
|
bne .fl_32scale_snn
|
||||||
|
|
||||||
|
ldmfd sp!, {r4-r10,pc}
|
||||||
|
|
||||||
|
.fl_32scale_bl2:
|
||||||
|
ldr r12, [r1], #4
|
||||||
|
ldr r7, [r1], #4
|
||||||
|
|
||||||
|
and r4, lr, r12, lsl #1
|
||||||
|
ldrh r4, [r3, r4]
|
||||||
|
and r5, lr, r12, lsr #7
|
||||||
|
ldrh r5, [r3, r5]
|
||||||
|
and r6, lr, r12, lsr #15
|
||||||
|
ldrh r6, [r3, r6]
|
||||||
|
|
||||||
|
and r4, r4, r9
|
||||||
|
and r5, r5, r9
|
||||||
|
add r10,r4, r5
|
||||||
|
mov r10,r10,lsr #1
|
||||||
|
orr r4, r4, r10,lsl #16 @ px0 | (px0+px1)/2
|
||||||
|
|
||||||
|
and r6, r6, r9
|
||||||
|
add r5, r5, r6
|
||||||
|
mov r5, r5, lsr #1
|
||||||
|
orr r5, r5, r6, lsl #16 @ (px1+px2)/2 | px2
|
||||||
|
|
||||||
|
and r10,lr, r12, lsr #23
|
||||||
|
ldrh r10,[r3, r10]
|
||||||
|
and r8, lr, r7, lsl #1
|
||||||
|
ldrh r8, [r3, r8]
|
||||||
|
|
||||||
|
and r10,r10,r9
|
||||||
|
and r8, r8, r9
|
||||||
|
orr r6, r10,r8, lsl #16 @ px3 | px4
|
||||||
|
|
||||||
|
and r12,lr, r7, lsr #15
|
||||||
|
ldrh r12,[r3, r12]
|
||||||
|
and r10, lr, r7, lsr #23
|
||||||
|
ldrh r10, [r3, r10]
|
||||||
|
and r7, lr, r7, lsr #7
|
||||||
|
ldrh r7, [r3, r7]
|
||||||
|
|
||||||
|
and r12,r12,r9
|
||||||
|
and r10,r10,r9
|
||||||
|
orr r10,r12,r10, lsl #16 @ px6 | px7
|
||||||
|
|
||||||
|
and r7, r7, r9
|
||||||
|
add r12,r12,r7
|
||||||
|
add r8, r8, r7
|
||||||
|
mov r8, r8, lsr #1
|
||||||
|
mov r12,r12,lsr #1
|
||||||
|
orr r8, r8,r12, lsl #16 @ (px4+px5)/2 | (px5+px6)/2
|
||||||
|
|
||||||
|
subs r2, r2, #1
|
||||||
|
|
||||||
|
stmia r0!, {r4,r5,r6,r8,r10}
|
||||||
|
bne .fl_32scale_bl2
|
||||||
|
|
||||||
|
ldmfd sp!, {r4-r10,pc}
|
||||||
|
|
||||||
|
.fl_32scale_bl4:
|
||||||
|
ldr r12, [r1], #4
|
||||||
|
ldr r7, [r1], #4
|
||||||
|
|
||||||
|
and r4, lr, r12,lsl #1
|
||||||
|
ldrh r4, [r3, r4]
|
||||||
|
and r5, lr, r12,lsr #7
|
||||||
|
ldrh r5, [r3, r5]
|
||||||
|
|
||||||
|
@ r4 = 1/4px0+3/4px1 : px0
|
||||||
|
and r4, r4, r9
|
||||||
orr r4, r4, r4, lsl #14 @ r4[31:16] = 1/4 pix_s 0
|
orr r4, r4, r4, lsl #14 @ r4[31:16] = 1/4 pix_s 0
|
||||||
and r5, r5, r9, lsl #2
|
and r5, r5, r9
|
||||||
sub r6, r5, r5, lsr #2 @ r6 = 3/4 pix_s 1
|
sub r6, r5, r5, lsr #2 @ r6 = 3/4 pix_s 1
|
||||||
add r4, r4, r6, lsl #16 @ pix_d 0, 1
|
add r4, r4, r6, lsl #16 @ pix_d 0, 1
|
||||||
|
|
||||||
and r6, lr, r12,lsr #15
|
and r6, lr, r12,lsr #15
|
||||||
ldrh r6, [r3, r6]
|
ldrh r6, [r3, r6]
|
||||||
and r12,lr, r12,lsr #23
|
and r12,lr, r12,lsr #23
|
||||||
ldrh r12,[r3, r12]
|
ldrh r12,[r3, r12]
|
||||||
and r6, r6, r9, lsl #2
|
|
||||||
|
@ r5 = 3/4px2+1/4px3 : (px1+px2)/2
|
||||||
|
and r6, r6, r9
|
||||||
add r5, r5, r6
|
add r5, r5, r6
|
||||||
mov r5, r5, lsr #1
|
mov r5, r5, lsr #1
|
||||||
sub r6, r6, r6, lsr #2 @ r6 = 3/4 pix_s 2
|
sub r6, r6, r6, lsr #2 @ r6 = 3/4 pix_s 2
|
||||||
|
@ -1738,32 +1895,38 @@ FinalizeLine555:
|
||||||
|
|
||||||
and r6, lr, r7, lsl #1
|
and r6, lr, r7, lsl #1
|
||||||
ldrh r6, [r3, r6]
|
ldrh r6, [r3, r6]
|
||||||
and r12,r12,r9, lsl #2
|
and r12,r12,r9
|
||||||
add r5, r5, r12,lsl #14 @ pix_d 2, 3
|
add r5, r5, r12,lsl #14 @ pix_d 2, 3
|
||||||
and r6, r6, r9, lsl #2
|
|
||||||
|
@ r6 = px4 : px3
|
||||||
|
and r6, r6, r9
|
||||||
orr r6, r12,r6, lsl #16 @ pix_d 4, 5
|
orr r6, r12,r6, lsl #16 @ pix_d 4, 5
|
||||||
|
|
||||||
|
@ r8 = (px5+px6)/2 : 1/4px4+3/4px5
|
||||||
and r12,lr, r7, lsr #7
|
and r12,lr, r7, lsr #7
|
||||||
ldrh r12,[r3, r12]
|
ldrh r12,[r3, r12]
|
||||||
and r10,lr, r7, lsr #15
|
and r10,lr, r7, lsr #15
|
||||||
ldrh r10,[r3, r10]
|
ldrh r10,[r3, r10]
|
||||||
and r12,r12,r9, lsl #2
|
and r12,r12,r9
|
||||||
sub r8, r12,r12,lsr #2 @ r8 = 3/4 pix_s 1
|
sub r8, r12,r12,lsr #2 @ r8 = 3/4 pix_s 1
|
||||||
add r8, r8, r6, lsr #18
|
add r8, r8, r6, lsr #18
|
||||||
|
|
||||||
and r7, lr, r7, lsr #23
|
and r7, lr, r7, lsr #23
|
||||||
ldrh r7, [r3, r7]
|
ldrh r7, [r3, r7]
|
||||||
and r10,r10,r9, lsl #2
|
and r10,r10,r9
|
||||||
orr r8, r8, r10,lsl #15
|
orr r8, r8, r10,lsl #15
|
||||||
add r8, r8, r12,lsl #15 @ pix_d 6, 7
|
add r8, r8, r12,lsl #15 @ pix_d 6, 7
|
||||||
|
|
||||||
|
@ r10 = px7 : 3/4px6+1/4px7
|
||||||
sub r10,r10,r10,lsr #2 @ r10= 3/4 pix_s 2
|
sub r10,r10,r10,lsr #2 @ r10= 3/4 pix_s 2
|
||||||
and r7, r7, r9, lsl #2
|
and r7, r7, r9
|
||||||
add r10,r10,r7, lsr #2 @ += 1/4 pix_s 3
|
add r10,r10,r7, lsr #2 @ += 1/4 pix_s 3
|
||||||
orr r10,r10,r7, lsl #16 @ pix_d 8, 9
|
orr r10,r10,r7, lsl #16 @ pix_d 8, 9
|
||||||
|
|
||||||
subs r2, r2, #1
|
subs r2, r2, #1
|
||||||
|
|
||||||
stmia r0!, {r4,r5,r6,r8,r10}
|
stmia r0!, {r4,r5,r6,r8,r10}
|
||||||
bne .fl_loop32scale_RGB555
|
bne .fl_32scale_bl4
|
||||||
|
|
||||||
ldmfd sp!, {r4-r10,pc}
|
ldmfd sp!, {r4-r10,pc}
|
||||||
|
|
||||||
|
@ -1826,10 +1989,10 @@ FinalizeLine555:
|
||||||
ldrh r6, [r3, r6]
|
ldrh r6, [r3, r6]
|
||||||
and r5, lr, r12,lsr #7
|
and r5, lr, r12,lsr #7
|
||||||
ldrh r5, [r3, r5]
|
ldrh r5, [r3, r5]
|
||||||
and r6, r6, r9, lsl #2
|
and r6, r6, r9
|
||||||
orr r4, r4, r6, lsl #16 @ r4 = pix_d -1, 0
|
orr r4, r4, r6, lsl #16 @ r4 = pix_d -1, 0
|
||||||
|
|
||||||
and r5, r5, r9, lsl #2
|
and r5, r5, r9
|
||||||
sub r8, r5, r5, lsr #2 @ r8 = 3/4 pix_s 1
|
sub r8, r5, r5, lsr #2 @ r8 = 3/4 pix_s 1
|
||||||
add r6, r8, r6, lsr #2 @ r6 = (1/4 pix_s 0) + (3/4 pix_s 1)
|
add r6, r8, r6, lsr #2 @ r6 = (1/4 pix_s 0) + (3/4 pix_s 1)
|
||||||
orr r5, r6, r5, lsl #15
|
orr r5, r6, r5, lsl #15
|
||||||
|
@ -1838,20 +2001,20 @@ FinalizeLine555:
|
||||||
ldrh r6, [r3, r6]
|
ldrh r6, [r3, r6]
|
||||||
and r12,lr, r12,lsr #23
|
and r12,lr, r12,lsr #23
|
||||||
ldrh r12,[r3, r12]
|
ldrh r12,[r3, r12]
|
||||||
and r6, r6, r9, lsl #2
|
and r6, r6, r9
|
||||||
add r5, r5, r6, lsl #15 @ r5 = pix_d 1, 2
|
add r5, r5, r6, lsl #15 @ r5 = pix_d 1, 2
|
||||||
|
|
||||||
and r8, lr, r7, lsl #1
|
and r8, lr, r7, lsl #1
|
||||||
ldrh r8, [r3, r8]
|
ldrh r8, [r3, r8]
|
||||||
and r10,lr, r7, lsr #7
|
and r10,lr, r7, lsr #7
|
||||||
ldrh r10,[r3, r10]
|
ldrh r10,[r3, r10]
|
||||||
and r12,r12,r9, lsl #2
|
and r12,r12,r9
|
||||||
sub r6, r6, r6, lsr #2 @ r6 = 3/4 pix_s 2
|
sub r6, r6, r6, lsr #2 @ r6 = 3/4 pix_s 2
|
||||||
add r6, r6, r12,lsr #2
|
add r6, r6, r12,lsr #2
|
||||||
orr r6, r6, r12,lsl #16 @ r6 = pix_d 3, 4
|
orr r6, r6, r12,lsl #16 @ r6 = pix_d 3, 4
|
||||||
|
|
||||||
and r8, r8, r9, lsl #2
|
and r8, r8, r9
|
||||||
and r10,r10,r9, lsl #2
|
and r10,r10,r9
|
||||||
sub r12,r10,r10,lsr #2 @ r12 = 3/4 pix_s 5
|
sub r12,r10,r10,lsr #2 @ r12 = 3/4 pix_s 5
|
||||||
orr r8, r8, r8, lsl #14
|
orr r8, r8, r8, lsl #14
|
||||||
add r8, r8, r12,lsl #16 @ r8 = pix_d 5, 6
|
add r8, r8, r12,lsl #16 @ r8 = pix_d 5, 6
|
||||||
|
@ -1859,12 +2022,12 @@ FinalizeLine555:
|
||||||
ldrh r12,[r3, r12]
|
ldrh r12,[r3, r12]
|
||||||
and r7, lr, r7, lsr #23
|
and r7, lr, r7, lsr #23
|
||||||
ldrh r7, [r3, r7]
|
ldrh r7, [r3, r7]
|
||||||
and r12,r12,r9, lsl #2
|
and r12,r12,r9
|
||||||
add r10,r10,r12
|
add r10,r10,r12
|
||||||
mov r10,r10, lsr #1
|
mov r10,r10, lsr #1
|
||||||
sub r12,r12,r12,lsr #2 @ r12 = 3/4 pix_s 6
|
sub r12,r12,r12,lsr #2 @ r12 = 3/4 pix_s 6
|
||||||
orr r10,r10,r12,lsl #16
|
orr r10,r10,r12,lsl #16
|
||||||
and r7, r7, r9, lsl #2
|
and r7, r7, r9
|
||||||
add r10,r10,r7, lsl #14 @ r10 = pix_d 7, 8
|
add r10,r10,r7, lsl #14 @ r10 = pix_d 7, 8
|
||||||
|
|
||||||
subs r2, r2, #1
|
subs r2, r2, #1
|
||||||
|
|
17
pico/mode4.c
17
pico/mode4.c
|
@ -291,7 +291,7 @@ void PicoFrameStartMode4(void)
|
||||||
}
|
}
|
||||||
|
|
||||||
if (Pico.est.rendstatus != rendstatus_old || lines != rendlines) {
|
if (Pico.est.rendstatus != rendstatus_old || lines != rendlines) {
|
||||||
emu_video_mode_change(screen_offset, lines, 1);
|
emu_video_mode_change(screen_offset, lines, line_offset, 256);
|
||||||
rendstatus_old = Pico.est.rendstatus;
|
rendstatus_old = Pico.est.rendstatus;
|
||||||
rendlines = lines;
|
rendlines = lines;
|
||||||
}
|
}
|
||||||
|
@ -352,6 +352,8 @@ void PicoDoHighPal555M4(void)
|
||||||
Pico.est.HighPal[0xe0] = 0;
|
Pico.est.HighPal[0xe0] = 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#include <platform/common/upscale.h>
|
||||||
|
|
||||||
static void FinalizeLineRGB555M4(int line)
|
static void FinalizeLineRGB555M4(int line)
|
||||||
{
|
{
|
||||||
if (Pico.m.dirtyPal)
|
if (Pico.m.dirtyPal)
|
||||||
|
@ -364,15 +366,20 @@ static void FinalizeLineRGB555M4(int line)
|
||||||
|
|
||||||
static void FinalizeLine8bitM4(int line)
|
static void FinalizeLine8bitM4(int line)
|
||||||
{
|
{
|
||||||
unsigned char *pd = Pico.est.DrawLineDest;
|
unsigned char *pd = Pico.est.DrawLineDest + line_offset;
|
||||||
|
unsigned char *ps = Pico.est.HighCol + line_offset + 8;
|
||||||
|
|
||||||
if (DrawLineDestIncrement)
|
if (DrawLineDestIncrement) {
|
||||||
memcpy(pd + line_offset, Pico.est.HighCol + line_offset + 8, 256);
|
if (PicoIn.opt & POPT_EN_SOFTSCALE)
|
||||||
|
rh_upscale_nn_4_5(pd, 320, ps, 256, 256, f_nop);
|
||||||
|
else
|
||||||
|
memcpy(pd, ps, 256);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void PicoDrawSetOutputMode4(pdso_t which)
|
void PicoDrawSetOutputMode4(pdso_t which)
|
||||||
{
|
{
|
||||||
line_offset = PicoIn.opt & POPT_DIS_32C_BORDER ? 0 : 32;
|
line_offset = PicoIn.opt & (POPT_DIS_32C_BORDER|POPT_EN_SOFTSCALE) ? 0 : 32;
|
||||||
switch (which)
|
switch (which)
|
||||||
{
|
{
|
||||||
case PDF_8BIT: FinalizeLineM4 = FinalizeLine8bitM4; break;
|
case PDF_8BIT: FinalizeLineM4 = FinalizeLine8bitM4; break;
|
||||||
|
|
|
@ -41,7 +41,7 @@ extern void *plat_mem_get_for_drc(size_t size);
|
||||||
extern int plat_mem_set_exec(void *ptr, size_t size);
|
extern int plat_mem_set_exec(void *ptr, size_t size);
|
||||||
|
|
||||||
// this one should handle display mode changes
|
// this one should handle display mode changes
|
||||||
extern void emu_video_mode_change(int start_line, int line_count, int is_32cols);
|
extern void emu_video_mode_change(int start_line, int line_count, int start_col, int col_count);
|
||||||
|
|
||||||
// this must switch to 16bpp mode
|
// this must switch to 16bpp mode
|
||||||
extern void emu_32x_startup(void);
|
extern void emu_32x_startup(void);
|
||||||
|
@ -86,7 +86,7 @@ extern void *p32x_bios_g, *p32x_bios_m, *p32x_bios_s;
|
||||||
|
|
||||||
// the emulator is configured and some status is reported
|
// the emulator is configured and some status is reported
|
||||||
// through this global state (not saved in savestates)
|
// through this global state (not saved in savestates)
|
||||||
typedef struct
|
typedef struct PicoInterface
|
||||||
{
|
{
|
||||||
unsigned int opt; // POPT_* bitfield
|
unsigned int opt; // POPT_* bitfield
|
||||||
|
|
||||||
|
@ -101,6 +101,8 @@ typedef struct
|
||||||
unsigned short quirks; // game-specific quirks: PQUIRK_*
|
unsigned short quirks; // game-specific quirks: PQUIRK_*
|
||||||
unsigned short overclockM68k; // overclock the emulated 68k, in %
|
unsigned short overclockM68k; // overclock the emulated 68k, in %
|
||||||
|
|
||||||
|
unsigned short filter; // softscale filter type
|
||||||
|
|
||||||
int sndRate; // rate in Hz
|
int sndRate; // rate in Hz
|
||||||
int sndFilterAlpha; // Low pass sound filter alpha (Q16)
|
int sndFilterAlpha; // Low pass sound filter alpha (Q16)
|
||||||
short *sndOut; // PCM output buffer
|
short *sndOut; // PCM output buffer
|
||||||
|
|
|
@ -356,6 +356,7 @@ struct PicoEState
|
||||||
int DrawScanline;
|
int DrawScanline;
|
||||||
int rendstatus;
|
int rendstatus;
|
||||||
void *DrawLineDest; // draw destination
|
void *DrawLineDest; // draw destination
|
||||||
|
int DrawLineDestIncr;
|
||||||
unsigned char *HighCol;
|
unsigned char *HighCol;
|
||||||
s32 *HighPreSpr;
|
s32 *HighPreSpr;
|
||||||
struct Pico *Pico;
|
struct Pico *Pico;
|
||||||
|
|
|
@ -1219,7 +1219,7 @@ void emu_cmn_forced_frame(int no_scale, int do_emu, void *buf)
|
||||||
memset32((short *)g_screen_ptr + g_screen_ppitch * y, 0,
|
memset32((short *)g_screen_ptr + g_screen_ppitch * y, 0,
|
||||||
g_screen_width * 2 / 4);
|
g_screen_width * 2 / 4);
|
||||||
|
|
||||||
PicoIn.opt &= ~POPT_ALT_RENDERER;
|
PicoIn.opt &= ~(POPT_ALT_RENDERER|POPT_EN_SOFTSCALE);
|
||||||
PicoIn.opt |= POPT_ACC_SPRITES;
|
PicoIn.opt |= POPT_ACC_SPRITES;
|
||||||
if (!no_scale && currentConfig.scaling)
|
if (!no_scale && currentConfig.scaling)
|
||||||
PicoIn.opt |= POPT_EN_SOFTSCALE;
|
PicoIn.opt |= POPT_EN_SOFTSCALE;
|
||||||
|
|
|
@ -37,10 +37,19 @@ extern int g_screen_ppitch; // pitch in pixels
|
||||||
|
|
||||||
enum {
|
enum {
|
||||||
EOPT_SCALE_NONE = 0,
|
EOPT_SCALE_NONE = 0,
|
||||||
EOPT_SCALE_SW,
|
// linux, GP2X:
|
||||||
|
EOPT_SCALE_SW = 1,
|
||||||
EOPT_SCALE_HW,
|
EOPT_SCALE_HW,
|
||||||
};
|
};
|
||||||
|
|
||||||
|
enum {
|
||||||
|
EOPT_FILTER_NONE = 0,
|
||||||
|
// software scalers
|
||||||
|
EOPT_FILTER_SMOOTHER = 1,
|
||||||
|
EOPT_FILTER_BILINEAR1,
|
||||||
|
EOPT_FILTER_BILINEAR2,
|
||||||
|
};
|
||||||
|
|
||||||
enum {
|
enum {
|
||||||
EOPT_CONFIRM_NONE = 0,
|
EOPT_CONFIRM_NONE = 0,
|
||||||
EOPT_CONFIRM_SAVE = 1,
|
EOPT_CONFIRM_SAVE = 1,
|
||||||
|
@ -63,7 +72,7 @@ typedef struct _currentConfig_t {
|
||||||
int CPUclock;
|
int CPUclock;
|
||||||
int volume;
|
int volume;
|
||||||
int gamma;
|
int gamma;
|
||||||
int scaling; // gp2x: EOPT_SCALE_*; psp: bilinear filtering
|
int scaling; // EOPT_SCALE_*
|
||||||
int vscaling;
|
int vscaling;
|
||||||
int rotation; // for UIQ
|
int rotation; // for UIQ
|
||||||
float scale; // psp: screen scale
|
float scale; // psp: screen scale
|
||||||
|
@ -72,7 +81,7 @@ typedef struct _currentConfig_t {
|
||||||
int turbo_rate;
|
int turbo_rate;
|
||||||
int renderer;
|
int renderer;
|
||||||
int renderer32x;
|
int renderer32x;
|
||||||
int filter; // pandora
|
int filter; // EOPT_FILTER_* video filter
|
||||||
int analog_deadzone;
|
int analog_deadzone;
|
||||||
int msh2_khz;
|
int msh2_khz;
|
||||||
int ssh2_khz;
|
int ssh2_khz;
|
||||||
|
@ -180,6 +189,7 @@ void plat_update_volume(int has_changed, int is_up);
|
||||||
/* should be in libpicofe/plat.h */
|
/* should be in libpicofe/plat.h */
|
||||||
void plat_video_clear_status(void);
|
void plat_video_clear_status(void);
|
||||||
void plat_video_clear_buffers(void);
|
void plat_video_clear_buffers(void);
|
||||||
|
void plat_video_set_size(int w, int h);
|
||||||
|
|
||||||
#ifdef __cplusplus
|
#ifdef __cplusplus
|
||||||
} // extern "C"
|
} // extern "C"
|
||||||
|
|
|
@ -22,6 +22,7 @@
|
||||||
#include <pico/pico_int.h>
|
#include <pico/pico_int.h>
|
||||||
|
|
||||||
static void *shadow_fb;
|
static void *shadow_fb;
|
||||||
|
static struct area { int w, h; } area;
|
||||||
|
|
||||||
static struct in_pdata in_sdl_platform_data = {
|
static struct in_pdata in_sdl_platform_data = {
|
||||||
.defbinds = in_sdl_defbinds,
|
.defbinds = in_sdl_defbinds,
|
||||||
|
@ -81,13 +82,14 @@ void bgr_to_uyvy_init(void)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void rgb565_to_uyvy(void *d, const void *s, int pixels, int x2)
|
void rgb565_to_uyvy(void *d, const void *s, int w, int h, int pitch, int x2)
|
||||||
{
|
{
|
||||||
uint32_t *dst = d;
|
uint32_t *dst = d;
|
||||||
const uint16_t *src = s;
|
const uint16_t *src = s;
|
||||||
|
int i;
|
||||||
|
|
||||||
if (x2)
|
if (x2) while (h--) {
|
||||||
for (; pixels > 0; src += 4, dst += 4, pixels -= 4)
|
for (i = w; i > 0; src += 4, dst += 4, i -= 4)
|
||||||
{
|
{
|
||||||
struct uyvy *uyvy0 = yuv_uyvy + src[0], *uyvy1 = yuv_uyvy + src[1];
|
struct uyvy *uyvy0 = yuv_uyvy + src[0], *uyvy1 = yuv_uyvy + src[1];
|
||||||
struct uyvy *uyvy2 = yuv_uyvy + src[2], *uyvy3 = yuv_uyvy + src[3];
|
struct uyvy *uyvy2 = yuv_uyvy + src[2], *uyvy3 = yuv_uyvy + src[3];
|
||||||
|
@ -102,8 +104,10 @@ void rgb565_to_uyvy(void *d, const void *s, int pixels, int x2)
|
||||||
dst[2] = uyvy2->y | (uyvy2->vyu << 8);
|
dst[2] = uyvy2->y | (uyvy2->vyu << 8);
|
||||||
dst[3] = uyvy3->y | (uyvy3->vyu << 8);
|
dst[3] = uyvy3->y | (uyvy3->vyu << 8);
|
||||||
#endif
|
#endif
|
||||||
} else
|
}
|
||||||
for (; pixels > 0; src += 4, dst += 2, pixels -= 4)
|
src += pitch - w;
|
||||||
|
} else while (h--) {
|
||||||
|
for (i = w; i > 0; src += 4, dst += 2, i -= 4)
|
||||||
{
|
{
|
||||||
struct uyvy *uyvy0 = yuv_uyvy + src[0], *uyvy1 = yuv_uyvy + src[1];
|
struct uyvy *uyvy0 = yuv_uyvy + src[0], *uyvy1 = yuv_uyvy + src[1];
|
||||||
struct uyvy *uyvy2 = yuv_uyvy + src[2], *uyvy3 = yuv_uyvy + src[3];
|
struct uyvy *uyvy2 = yuv_uyvy + src[2], *uyvy3 = yuv_uyvy + src[3];
|
||||||
|
@ -115,20 +119,40 @@ void rgb565_to_uyvy(void *d, const void *s, int pixels, int x2)
|
||||||
dst[1] = uyvy3->y | (uyvy2->vyu << 8);
|
dst[1] = uyvy3->y | (uyvy2->vyu << 8);
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
src += pitch - w;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static int clear_buf_cnt, clear_stat_cnt;
|
static int clear_buf_cnt, clear_stat_cnt;
|
||||||
|
|
||||||
|
void plat_video_set_size(int w, int h)
|
||||||
|
{
|
||||||
|
if (area.w != w || area.h != h) {
|
||||||
|
area = (struct area) { w, h };
|
||||||
|
|
||||||
|
if (plat_sdl_change_video_mode(w, h, 0) < 0) {
|
||||||
|
// failed, revert to original resolution
|
||||||
|
plat_sdl_change_video_mode(g_screen_width, g_screen_height, 0);
|
||||||
|
w = g_screen_width, h = g_screen_height;
|
||||||
|
}
|
||||||
|
if (!plat_sdl_overlay && !plat_sdl_gl_active) {
|
||||||
|
g_screen_width = w;
|
||||||
|
g_screen_height = h;
|
||||||
|
g_screen_ppitch = w;
|
||||||
|
g_screen_ptr = plat_sdl_screen->pixels;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
void plat_video_flip(void)
|
void plat_video_flip(void)
|
||||||
{
|
{
|
||||||
if (plat_sdl_overlay != NULL) {
|
if (plat_sdl_overlay != NULL) {
|
||||||
SDL_Rect dstrect =
|
SDL_Rect dstrect =
|
||||||
{ 0, 0, plat_sdl_screen->w, plat_sdl_screen->h };
|
{ 0, 0, plat_sdl_screen->w, plat_sdl_screen->h };
|
||||||
|
|
||||||
SDL_LockYUVOverlay(plat_sdl_overlay);
|
SDL_LockYUVOverlay(plat_sdl_overlay);
|
||||||
rgb565_to_uyvy(plat_sdl_overlay->pixels[0], shadow_fb,
|
rgb565_to_uyvy(plat_sdl_overlay->pixels[0], shadow_fb,
|
||||||
g_screen_ppitch * g_screen_height,
|
area.w, area.h, g_screen_ppitch,
|
||||||
plat_sdl_overlay->w > 2*plat_sdl_overlay->h);
|
plat_sdl_overlay->w >= 2*area.w);
|
||||||
SDL_UnlockYUVOverlay(plat_sdl_overlay);
|
SDL_UnlockYUVOverlay(plat_sdl_overlay);
|
||||||
SDL_DisplayYUVOverlay(plat_sdl_overlay, &dstrect);
|
SDL_DisplayYUVOverlay(plat_sdl_overlay, &dstrect);
|
||||||
}
|
}
|
||||||
|
@ -205,7 +229,7 @@ void plat_video_menu_end(void)
|
||||||
|
|
||||||
SDL_LockYUVOverlay(plat_sdl_overlay);
|
SDL_LockYUVOverlay(plat_sdl_overlay);
|
||||||
rgb565_to_uyvy(plat_sdl_overlay->pixels[0], shadow_fb,
|
rgb565_to_uyvy(plat_sdl_overlay->pixels[0], shadow_fb,
|
||||||
g_menuscreen_pp * g_menuscreen_h, 0);
|
g_menuscreen_w, g_menuscreen_h, g_menuscreen_pp, 0);
|
||||||
SDL_UnlockYUVOverlay(plat_sdl_overlay);
|
SDL_UnlockYUVOverlay(plat_sdl_overlay);
|
||||||
|
|
||||||
SDL_DisplayYUVOverlay(plat_sdl_overlay, &dstrect);
|
SDL_DisplayYUVOverlay(plat_sdl_overlay, &dstrect);
|
||||||
|
@ -227,10 +251,10 @@ void plat_video_menu_leave(void)
|
||||||
|
|
||||||
void plat_video_loop_prepare(void)
|
void plat_video_loop_prepare(void)
|
||||||
{
|
{
|
||||||
// take over any new vout settings XXX ask plat_sdl for scaling instead!
|
// take over any new vout settings
|
||||||
plat_sdl_change_video_mode(g_menuscreen_w, g_menuscreen_h, 0);
|
plat_sdl_change_video_mode(g_menuscreen_w, g_menuscreen_h, 0);
|
||||||
// switch over to scaled output if available
|
// switch over to scaled output if available
|
||||||
if (plat_sdl_overlay != NULL || plat_sdl_gl_active || currentConfig.scaling != EOPT_SCALE_NONE) {
|
if (plat_sdl_overlay != NULL || plat_sdl_gl_active) {
|
||||||
g_screen_width = 320;
|
g_screen_width = 320;
|
||||||
g_screen_height = 240;
|
g_screen_height = 240;
|
||||||
g_screen_ppitch = g_screen_width;
|
g_screen_ppitch = g_screen_width;
|
||||||
|
@ -246,6 +270,7 @@ void plat_video_loop_prepare(void)
|
||||||
g_screen_ptr = plat_sdl_screen->pixels;
|
g_screen_ptr = plat_sdl_screen->pixels;
|
||||||
}
|
}
|
||||||
plat_video_set_buffer(g_screen_ptr);
|
plat_video_set_buffer(g_screen_ptr);
|
||||||
|
plat_video_set_size(g_screen_width, g_screen_height);
|
||||||
}
|
}
|
||||||
|
|
||||||
void plat_early_init(void)
|
void plat_early_init(void)
|
||||||
|
|
|
@ -7,7 +7,7 @@
|
||||||
* nn: nearest neighbour
|
* nn: nearest neighbour
|
||||||
* snn: "smoothed" nearest neighbour (see below)
|
* snn: "smoothed" nearest neighbour (see below)
|
||||||
* bln: n-level-bilinear with n quantized weights
|
* bln: n-level-bilinear with n quantized weights
|
||||||
* quantization: 0: a<1/2*n, 1/n: 1/2*n<=a<3/2*n, etc
|
* quantization: 0: a<1/(2*n), 1/n: 1/(2*n)<=a<3/(2*n), etc
|
||||||
* currently n=2, n=4 are implemented (there's n=8 mixing, but no filters)
|
* currently n=2, n=4 are implemented (there's n=8 mixing, but no filters)
|
||||||
* [NB this has been brought to my attn, which is probably the same as bl2:
|
* [NB this has been brought to my attn, which is probably the same as bl2:
|
||||||
* https://www.drdobbs.com/image-scaling-with-bresenham/184405045?pgno=1]
|
* https://www.drdobbs.com/image-scaling-with-bresenham/184405045?pgno=1]
|
||||||
|
@ -18,490 +18,586 @@
|
||||||
* a sharper look than a bilinear filter, at the price of some visible jags
|
* a sharper look than a bilinear filter, at the price of some visible jags
|
||||||
* on diagonal edges.
|
* on diagonal edges.
|
||||||
*
|
*
|
||||||
* scaling modes:
|
* example scaling modes:
|
||||||
* 256x___ -> 320x___ only horizontal scaling. Produces an aspect error of
|
* 256x_Y_ -> 320x_Y_, H32/mode 4, PAR 5:4, for PAL DAR 4:3 (NTSC 7% aspect err)
|
||||||
* ~7% for NTSC 224 line modes, but is correct for PAL
|
* 256x224 -> 320x240, H32/mode 4, PAR 5:4, for NTSC DAR 4:3 (PAL 7% aspect err)
|
||||||
* 256/320x224/240
|
* 320x224 -> 320x240, PAR 1:1, for NTSC, DAR 4:3 (PAL 7% etc etc...)
|
||||||
* -> 320x240 always produces 320x240 at DAR 4:3
|
* 160x144 -> 320x240: GG, PAR 6:5, scaling to 320x240 for DAR 4:3
|
||||||
* 160x144 -> 320x240 game gear (currently unused)
|
|
||||||
*
|
*
|
||||||
* (C) 2021 kub <derkub@gmail.com>
|
* (C) 2021 kub <derkub@gmail.com>
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#include "upscale.h"
|
#include "upscale.h"
|
||||||
|
|
||||||
/* 256x___ -> 320x___, H32/mode 4, PAR 5:4, for PAL DAR 4:3 (wrong for NTSC) */
|
/* X x Y -> X*5/4 x Y */
|
||||||
void upscale_clut_nn_256_320x___(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int height)
|
void upscale_clut_nn_x_4_5(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height)
|
||||||
{
|
{
|
||||||
int y;
|
int y;
|
||||||
|
|
||||||
for (y = 0; y < height; y++) {
|
for (y = 0; y < height; y++) {
|
||||||
h_upscale_nn_4_5(di, ds, si, ss, 256, f_nop);
|
h_upscale_nn_4_5(di, ds, si, ss, width, f_nop);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_nn_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal)
|
void upscale_rgb_nn_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
int y;
|
int y;
|
||||||
|
|
||||||
for (y = 0; y < height; y++) {
|
for (y = 0; y < height; y++) {
|
||||||
h_upscale_nn_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_nn_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_snn_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal)
|
void upscale_rgb_snn_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
int y;
|
int y;
|
||||||
|
|
||||||
for (y = 0; y < height; y++) {
|
for (y = 0; y < height; y++) {
|
||||||
h_upscale_snn_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_snn_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bl2_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal)
|
void upscale_rgb_bl2_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
int y;
|
int y;
|
||||||
|
|
||||||
for (y = 0; y < height; y++) {
|
for (y = 0; y < height; y++) {
|
||||||
h_upscale_bl2_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_bl2_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bl4_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal)
|
void upscale_rgb_bl4_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
int y;
|
int y;
|
||||||
|
|
||||||
for (y = 0; y < height; y++) {
|
for (y = 0; y < height; y++) {
|
||||||
h_upscale_bl4_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_bl4_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/* 256x224 -> 320x240, H32/mode 4, PAR 5:4, for NTSC DAR 4:3 (wrong for PAL) */
|
/* X x Y -> X*5/4 x Y*17/16 */
|
||||||
void upscale_clut_nn_256_320x224_240(u8 *__restrict di, int ds, u8 *__restrict si, int ss)
|
void upscale_clut_nn_x_4_5_y_16_17(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 5/4;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 14:15, 0 1 2 3 4 5 6 6 7 8 9 10 11 12 13 */
|
for (y = 0; y < height; y += 16) {
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (j = 0; j < 8; j++) {
|
||||||
/* lines 0-6 */
|
h_upscale_nn_4_5(di, ds, si, ss, width, f_nop);
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
h_upscale_nn_4_5(di, ds, si, ss, 256, f_nop);
|
|
||||||
}
|
}
|
||||||
/* lines 8-14 */
|
|
||||||
di += ds;
|
di += ds;
|
||||||
for (j = 0; j < 7; j++) {
|
for (j = 0; j < 8; j++) {
|
||||||
h_upscale_nn_4_5(di, ds, si, ss, 256, f_nop);
|
h_upscale_nn_4_5(di, ds, si, ss, width, f_nop);
|
||||||
}
|
}
|
||||||
/* line 7 */
|
|
||||||
di -= 8*ds;
|
di -= 9*ds;
|
||||||
v_copy(&di[0], &di[-ds], 320, f_nop);
|
v_copy(&di[0], &di[-ds], swidth, f_nop);
|
||||||
di += 8*ds;
|
di += 9*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_nn_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_nn_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 5/4;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (y = 0; y < height; y += 16) {
|
||||||
for (j = 0; j < 7; j++) {
|
for (j = 0; j < 8; j++) {
|
||||||
h_upscale_nn_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_nn_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
di += ds;
|
di += ds;
|
||||||
for (j = 0; j < 7; j++) {
|
for (j = 0; j < 8; j++) {
|
||||||
h_upscale_nn_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_nn_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
|
|
||||||
di -= 8*ds;
|
di -= 9*ds;
|
||||||
v_copy(&di[0], &di[-ds], 320, f_nop);
|
v_copy(&di[0], &di[-ds], swidth, f_nop);
|
||||||
di += 8*ds;
|
di += 9*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_snn_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_snn_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 5/4;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 14:15, 0 1 2 3 4 5 5+6 6+7 7+8 8 9 10 11 12 13 */
|
for (y = 0; y < height; y += 16) {
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (j = 0; j < 8; j++) {
|
||||||
for (j = 0; j < 7; j++) {
|
h_upscale_snn_4_5(di, ds, si, ss, width, f_pal);
|
||||||
h_upscale_snn_4_5(di, ds, si, ss, 256, f_pal);
|
|
||||||
}
|
}
|
||||||
di += ds;
|
di += ds;
|
||||||
for (j = 0; j < 7; j++) {
|
for (j = 0; j < 8; j++) {
|
||||||
h_upscale_snn_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_snn_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* mix lines 6-8 */
|
/* mix lines 6-8 */
|
||||||
di -= 8*ds;
|
di -= 9*ds;
|
||||||
v_mix(&di[0], &di[-ds], &di[ds], 320, p_05, f_nop);
|
v_mix(&di[0], &di[-ds], &di[ds], swidth, p_05, f_nop);
|
||||||
v_mix(&di[-ds], &di[-2*ds], &di[-ds], 320, p_05, f_nop);
|
v_mix(&di[-ds], &di[-2*ds], &di[-ds], swidth, p_05, f_nop);
|
||||||
v_mix(&di[ ds], &di[ ds], &di[ 2*ds], 320, p_05, f_nop);
|
v_mix(&di[ ds], &di[ ds], &di[ 2*ds], swidth, p_05, f_nop);
|
||||||
di += 8*ds;
|
di += 9*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bln_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_bl2_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 5/4;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 14:15, 0 1 2 2+3 3+4 4+5 5+6 6+7 7+8 8+9 9+10 10+11 11 12 13 */
|
for (y = 0; y < height; y += 16) {
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (j = 0; j < 4; j++) {
|
||||||
/* lines 0-2 */
|
h_upscale_bl2_4_5(di, ds, si, ss, width, f_pal);
|
||||||
for (j = 0; j < 3; j++) {
|
|
||||||
h_upscale_bln_4_5(di, ds, si, ss, 256, f_pal);
|
|
||||||
}
|
}
|
||||||
/* lines 3-11 mixing prep */
|
|
||||||
di += ds;
|
di += ds;
|
||||||
for (j = 0; j < 11; j++) {
|
for (j = 0; j < 12; j++) {
|
||||||
h_upscale_bln_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_bl2_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
di -= 12*ds;
|
/* mix lines 3-10 */
|
||||||
/* mixing line 3: line 2 = -ds, line 3 = +ds */
|
di -= 13*ds;
|
||||||
v_mix(&di[0], &di[-ds], &di[ds], 320, p_025, f_nop);
|
v_mix(&di[0], &di[-ds], &di[ds], swidth, p_05, f_nop);
|
||||||
|
for (j = 0; j < 7; j++) {
|
||||||
di += ds;
|
di += ds;
|
||||||
/* mixing lines 4-5: line n-1 = 0, line n = +ds */
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_05, f_nop);
|
||||||
|
}
|
||||||
|
di += 6*ds;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_bl4_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int swidth = width * 5/4;
|
||||||
|
int y, j;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y += 16) {
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_025, f_nop);
|
h_upscale_bl4_4_5(di, ds, si, ss, width, f_pal);
|
||||||
di += ds;
|
|
||||||
}
|
}
|
||||||
/* mixing line 6-8 */
|
di += ds;
|
||||||
|
for (j = 0; j < 14; j++) {
|
||||||
|
h_upscale_bl4_4_5(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
di -= 15*ds;
|
||||||
|
/* mixing line 2: line 1 = -ds, line 2 = +ds */
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], swidth, p_025, f_nop);
|
||||||
|
di += ds;
|
||||||
|
/* mixing lines 3-5: line n-1 = 0, line n = +ds */
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 3; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_05, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_025, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* mixing lines 9-11 */
|
/* mixing lines 6-9 */
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 4; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_075, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_05, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* lines 12-14, already in place */
|
/* mixing lines 10-13 */
|
||||||
|
for (j = 0; j < 4; j++) {
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_075, f_nop);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
/* lines 14-16, already in place */
|
||||||
di += 3*ds;
|
di += 3*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bl2_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
/* "classic" upscaler as found in several emulators. It's really more like a
|
||||||
|
* x*4/3, y*16/15 upscaler, with an additional 5th row/17th line just inserted
|
||||||
|
* from the source image. That gives nice n/4,n/16 alpha values plus better
|
||||||
|
* symmetry in each block and avoids "borrowing" a row/line between blocks.
|
||||||
|
*/
|
||||||
|
void upscale_rgb_bln_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 5/4;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 14:15, 0 1 2 2+3 3+4 4+5 5+6 6+7 7+8 8+9 9+10 10 11 12 13 */
|
for (y = 0; y < height; y += 16) {
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (j = 0; j < 4; j++) {
|
||||||
|
h_upscale_bln_4_5(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
di += ds;
|
||||||
|
for (j = 0; j < 12; j++) {
|
||||||
|
h_upscale_bln_4_5(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
di -= 13*ds;
|
||||||
|
/* mixing line 4: line 3 = -ds, line 4 = +ds */
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], swidth, p_025, f_nop);
|
||||||
|
di += ds;
|
||||||
|
/* mixing lines 5-6: line n-1 = 0, line n = +ds */
|
||||||
|
for (j = 0; j < 2; j++) {
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_025, f_nop);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
/* mixing line 7-9 */
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 3; j++) {
|
||||||
h_upscale_bl2_4_5(di, ds, si, ss, 256, f_pal);
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_05, f_nop);
|
||||||
}
|
|
||||||
di += ds;
|
di += ds;
|
||||||
for (j = 0; j < 11; j++) {
|
|
||||||
h_upscale_bl2_4_5(di, ds, si, ss, 256, f_pal);
|
|
||||||
}
|
}
|
||||||
/* mix lines 3-10 */
|
/* mixing lines 10-12 */
|
||||||
di -= 12*ds;
|
for (j = 0; j < 3; j++) {
|
||||||
v_mix(&di[0], &di[-ds], &di[ds], 320, p_05, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_075, f_nop);
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
di += ds;
|
di += ds;
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_05, f_nop);
|
|
||||||
}
|
}
|
||||||
di += 5*ds;
|
/* lines 13-16, already in place */
|
||||||
|
di += 4*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bl4_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
/* experimental 8 level bilinear for quality assessment */
|
||||||
|
void upscale_rgb_bl8_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 5/4;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 14:15, 0 0+1 1+2 2+3 3+4 4+5 5+6 6+7 7+8 8+9 9+10 10+11 11+12 12 13 */
|
for (y = 0; y < 224; y += 16) {
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (j = 0; j < 2; j++) {
|
||||||
/* line 0 */
|
h_upscale_bl8_4_5(di, ds, si, ss, width, f_pal);
|
||||||
h_upscale_bl4_4_5(di, ds, si, ss, 256, f_pal);
|
|
||||||
/* lines 1-14 mixing prep */
|
|
||||||
di += ds;
|
|
||||||
for (j = 0; j < 13; j++) {
|
|
||||||
h_upscale_bl4_4_5(di, ds, si, ss, 256, f_pal);
|
|
||||||
}
|
}
|
||||||
di -= 14*ds;
|
|
||||||
/* mixing line 1: line 0 = -ds, line 1 = +ds */
|
|
||||||
v_mix(&di[0], &di[-ds], &di[ds], 320, p_025, f_nop);
|
|
||||||
di += ds;
|
|
||||||
/* mixing lines 2-4: line n-1 = 0, line n = +ds */
|
|
||||||
for (j = 0; j < 3; j++) {
|
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_025, f_nop);
|
|
||||||
di += ds;
|
|
||||||
}
|
|
||||||
/* mixing lines 5-8 */
|
|
||||||
for (j = 0; j < 4; j++) {
|
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_05, f_nop);
|
|
||||||
di += ds;
|
|
||||||
}
|
|
||||||
/* mixing lines 9-12 */
|
|
||||||
for (j = 0; j < 4; j++) {
|
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_075, f_nop);
|
|
||||||
di += ds;
|
|
||||||
}
|
|
||||||
/* lines 13-14, already in place */
|
|
||||||
di += 2*ds;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
void upscale_rgb_bl8_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
|
||||||
{
|
|
||||||
int y, j, d;
|
|
||||||
|
|
||||||
/* 14:15, -1+0 0+1 1+2 2+3 3+4 4+5 5+6 6+7 7+8 8+9 9+10 10+11 11+12 12+13 13 */
|
|
||||||
for (y = 0, d = ds; y < 224; y += 14, d = -ds) {
|
|
||||||
/* lines 0-14 mixing prep */
|
|
||||||
di += ds;
|
di += ds;
|
||||||
for (j = 0; j < 14; j++) {
|
for (j = 0; j < 14; j++) {
|
||||||
h_upscale_bl8_4_5(di, ds, si, ss, 256, f_pal);
|
h_upscale_bl8_4_5(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
di -= 15*ds;
|
di -= 15*ds;
|
||||||
/* mixing line 0: line 0 = -ds, line 1 = +ds */
|
/* mixing line 2: line 2 = -ds, line 3 = +ds */
|
||||||
v_mix(&di[0], &di[d], &di[ds], 320, p_0125, f_nop);
|
v_mix(&di[0], &di[-ds], &di[ds], swidth, p_0125, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
/* mixing line 1: line 1 = 0, line 2 = +ds */
|
/* mixing line 3: line 3 = 0, line 4 = +ds */
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_0125, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_0125, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
/* mixing lines 2-3: line n-1 = 0, line n = +ds */
|
/* mixing lines 4-5: line n-1 = 0, line n = +ds */
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_025, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], swidth, p_025, f_nop);
|
||||||
di += ds;
|
|
||||||
}
|
|
||||||
/* mixing lines 4-5 */
|
|
||||||
for (j = 0; j < 2; j++) {
|
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_0375, f_nop);
|
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* mixing lines 6-7 */
|
/* mixing lines 6-7 */
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_05, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], 320, p_0375, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* mixing lines 8-9 */
|
/* mixing lines 8-9 */
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_0625, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], 320, p_05, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* mixing lines 10-11 */
|
/* mixing lines 10-11 */
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_075, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], 320, p_0625, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* mixing lines 12-13 */
|
/* mixing lines 12-13 */
|
||||||
|
for (j = 0; j < 2; j++) {
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], 320, p_075, f_nop);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
/* mixing lines 14-15 */
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[0], &di[ds], 320, p_0875, f_nop);
|
v_mix(&di[0], &di[0], &di[ds], 320, p_0875, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* line 14, already in place */
|
/* line 16, already in place */
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/* 320x224 -> 320x240, PAR 1:1, for NTSC, DAR 4:3 (wrong for PAL) */
|
/* X x Y -> X x Y*17/16 */
|
||||||
void upscale_clut_nn_320x224_240(u8 *__restrict di, int ds, u8 *__restrict si, int ss)
|
void upscale_clut_nn_y_16_17(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height)
|
||||||
{
|
{
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (y = 0; y < height; y += 16) {
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_nop);
|
|
||||||
}
|
|
||||||
di += ds;
|
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_nop);
|
|
||||||
}
|
|
||||||
|
|
||||||
di -= 8*ds;
|
|
||||||
v_copy(&di[0], &di[-ds], 320, f_nop);
|
|
||||||
di += 8*ds;
|
|
||||||
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
void upscale_rgb_nn_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
|
||||||
{
|
|
||||||
int y, j;
|
|
||||||
|
|
||||||
for (y = 0; y < 224; y += 14) {
|
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
|
||||||
}
|
|
||||||
di += ds;
|
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
|
||||||
}
|
|
||||||
|
|
||||||
di -= 8*ds;
|
|
||||||
v_copy(&di[0], &di[-ds], 320, f_nop);
|
|
||||||
di += 8*ds;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
void upscale_rgb_snn_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
|
||||||
{
|
|
||||||
int y, j;
|
|
||||||
|
|
||||||
for (y = 0; y < 224; y += 14) {
|
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
|
||||||
}
|
|
||||||
di += ds;
|
|
||||||
for (j = 0; j < 7; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
|
||||||
}
|
|
||||||
|
|
||||||
di -= 8*ds;
|
|
||||||
v_mix(&di[ 0], &di[-ds], &di[ds], 320, p_05, f_nop);
|
|
||||||
v_mix(&di[-ds], &di[-2*ds], &di[-ds], 320, p_05, f_nop);
|
|
||||||
v_mix(&di[ ds], &di[ ds], &di[ 2*ds], 320, p_05, f_nop);
|
|
||||||
di += 8*ds;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
void upscale_rgb_bl2_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
|
||||||
{
|
|
||||||
int y, j;
|
|
||||||
|
|
||||||
for (y = 0; y < 224; y += 14) {
|
|
||||||
for (j = 0; j < 3; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
|
||||||
}
|
|
||||||
for (j = 0; j < 8; j++) {
|
for (j = 0; j < 8; j++) {
|
||||||
v_mix(&di[0], &si[-ss], &si[0], 320, p_05, f_pal);
|
h_copy(di, ds, si, ss, width, f_nop);
|
||||||
|
}
|
||||||
di += ds;
|
di += ds;
|
||||||
si += ss;
|
for (j = 0; j < 8; j++) {
|
||||||
}
|
h_copy(di, ds, si, ss, width, f_nop);
|
||||||
si -= ss;
|
|
||||||
for (j = 0; j < 4; j++) {
|
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
di -= 9*ds;
|
||||||
|
v_copy(&di[0], &di[-ds], width, f_nop);
|
||||||
|
di += 9*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bl4_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_nn_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
for (y = 0; y < 224; y += 14) {
|
for (y = 0; y < height; y += 16) {
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
for (j = 0; j < 8; j++) {
|
||||||
for (j = 0; j < 4; j++) {
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
v_mix(&di[0], &si[-ss], &si[0], 320, p_025, f_pal);
|
|
||||||
di += ds;
|
|
||||||
si += ss;
|
|
||||||
}
|
}
|
||||||
for (j = 0; j < 4; j++) {
|
|
||||||
v_mix(&di[0], &si[-ss], &si[0], 320, p_05, f_pal);
|
|
||||||
di += ds;
|
di += ds;
|
||||||
si += ss;
|
for (j = 0; j < 8; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
|
||||||
|
di -= 9*ds;
|
||||||
|
v_copy(&di[0], &di[-ds], width, f_nop);
|
||||||
|
di += 9*ds;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_snn_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int y, j;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y += 16) {
|
||||||
|
for (j = 0; j < 8; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
for (j = 0; j < 4; j++) {
|
|
||||||
v_mix(&di[0], &si[-ss], &si[0], 320, p_075, f_pal);
|
|
||||||
di += ds;
|
di += ds;
|
||||||
si += ss;
|
for (j = 0; j < 8; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
si -= ss;
|
|
||||||
|
/* mix lines 6-8 */
|
||||||
|
di -= 9*ds;
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], width, p_05, f_nop);
|
||||||
|
v_mix(&di[-ds], &di[-2*ds], &di[-ds], width, p_05, f_nop);
|
||||||
|
v_mix(&di[ ds], &di[ ds], &di[ 2*ds], width, p_05, f_nop);
|
||||||
|
di += 9*ds;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_bl2_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int y, j;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y += 16) {
|
||||||
|
for (j = 0; j < 4; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
di += ds;
|
||||||
|
for (j = 0; j < 12; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
/* mix lines 3-10 */
|
||||||
|
di -= 13*ds;
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], width, p_05, f_nop);
|
||||||
|
for (j = 0; j < 7; j++) {
|
||||||
|
di += ds;
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], width, p_05, f_nop);
|
||||||
|
}
|
||||||
|
di += 6*ds;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_bl4_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int y, j;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y += 16) {
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
h_copy(di, ds, si, ss, 320, f_pal);
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
|
di += ds;
|
||||||
|
for (j = 0; j < 14; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
di -= 15*ds;
|
||||||
|
/* mixing line 2: line 1 = -ds, line 2 = +ds */
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], width, p_025, f_nop);
|
||||||
|
di += ds;
|
||||||
|
/* mixing lines 3-5: line n-1 = 0, line n = +ds */
|
||||||
|
for (j = 0; j < 3; j++) {
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], width, p_025, f_nop);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
/* mixing lines 6-9 */
|
||||||
|
for (j = 0; j < 4; j++) {
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], width, p_05, f_nop);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
/* mixing lines 10-13 */
|
||||||
|
for (j = 0; j < 4; j++) {
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], width, p_075, f_nop);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
/* lines 14-16, already in place */
|
||||||
|
di += 3*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/* 160x144 -> 320x240: GG, PAR 6:5, scaling to 320x240 for DAR 4:3 */
|
/* X x Y -> X*2/1 x Y, e.g. for X 160->320 (GG) */
|
||||||
/* NB for smoother image could scale to 288x216, x*9/5, y*3/2 ?
|
void upscale_clut_nn_x_1_2(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height)
|
||||||
* h: 11111 11112 22222 22233 33333 33444 44444 45555 55555
|
|
||||||
* 1 1 2 2+3 3 3+4 4 5 5
|
|
||||||
* v: 11 12 22
|
|
||||||
* 1 1+2 2
|
|
||||||
*/
|
|
||||||
void upscale_clut_nn_160_320x144_240(u8 *__restrict di, int ds, u8 *__restrict si, int ss)
|
|
||||||
{
|
{
|
||||||
|
int y;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y++) {
|
||||||
|
h_upscale_nn_1_2(di, ds, si, ss, width, f_nop);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_nn_x_1_2(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int y;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y++) {
|
||||||
|
h_upscale_nn_1_2(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_bl2_x_1_2(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int y;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y++) {
|
||||||
|
h_upscale_bl2_1_2(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/* X x Y -> X*2/1 x Y*5/3 (GG) */
|
||||||
|
void upscale_clut_nn_x_1_2_y_3_5(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height)
|
||||||
|
{
|
||||||
|
int swidth = width * 2;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 3:5, 0 0 1 1 2 */
|
for (y = 0; y < height; y += 3) {
|
||||||
for (y = 0; y < 144; y += 3) {
|
|
||||||
/* lines 0,2,4 */
|
/* lines 0,2,4 */
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 3; j++) {
|
||||||
h_upscale_nn_1_2(di, ds, si, ss, 160, f_nop);
|
h_upscale_nn_1_2(di, ds, si, ss, width, f_nop);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
/* lines 1,3 */
|
/* lines 1,3 */
|
||||||
di -= 5*ds;
|
di -= 5*ds;
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_copy(&di[0], &di[-ds], 320, f_nop);
|
v_copy(&di[0], &di[-ds], swidth, f_nop);
|
||||||
di += 2*ds;
|
di += 2*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_nn_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_nn_x_1_2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 2;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
for (y = 0; y < 144; y += 3) {
|
for (y = 0; y < height; y += 3) {
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 3; j++) {
|
||||||
h_upscale_nn_1_2(di, ds, si, ss, 160, f_pal);
|
h_upscale_nn_1_2(di, ds, si, ss, width, f_pal);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
di -= 5*ds;
|
di -= 5*ds;
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_copy(&di[0], &di[-ds], 320, f_nop);
|
v_copy(&di[0], &di[-ds], swidth, f_nop);
|
||||||
di += 2*ds;
|
di += 2*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_snn_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_bl2_x_1_2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
|
int swidth = width * 2;
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 3:5, 0 0+1 1 1+2 2 */
|
for (y = 0; y < height; y += 3) {
|
||||||
for (y = 0; y < 144; y += 3) {
|
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 3; j++) {
|
||||||
h_upscale_nn_1_2(di, ds, si, ss, 160, f_pal);
|
h_upscale_bl2_1_2(di, ds, si, ss, width, f_pal);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
di -= 5*ds;
|
di -= 5*ds;
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[-ds], &di[ds], 320, p_05, f_nop);
|
v_mix(&di[0], &di[-ds], &di[ds], swidth, p_05, f_nop);
|
||||||
di += 2*ds;
|
di += 2*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bl2_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_bl4_x_1_2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int swidth = width * 2;
|
||||||
|
int y, j, d;
|
||||||
|
|
||||||
|
/* for 1st block backwards reference virtually duplicate source line 0 */
|
||||||
|
for (y = 0, d = 2*ds; y < height; y += 3, d = -ds) {
|
||||||
|
di += 2*ds;
|
||||||
|
for (j = 0; j < 3; j++) {
|
||||||
|
h_upscale_bl2_1_2(di, ds, si, ss, width, f_pal);
|
||||||
|
}
|
||||||
|
di -= 5*ds;
|
||||||
|
v_mix(&di[0], &di[d ], &di[2*ds], swidth, p_05, f_nop); /*-1+0 */
|
||||||
|
di += ds;
|
||||||
|
v_mix(&di[0], &di[ds], &di[2*ds], swidth, p_075, f_nop);/* 0+1 */
|
||||||
|
di += ds;
|
||||||
|
v_mix(&di[0], &di[ 0], &di[ ds], swidth, p_025, f_nop);/* 0+1 */
|
||||||
|
di += ds;
|
||||||
|
v_mix(&di[0], &di[ 0], &di[ ds], swidth, p_05, f_nop); /* 1+2 */
|
||||||
|
di += 2*ds;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/* X x Y -> X x Y*5/3, e.g. for Y 144->240 (GG) */
|
||||||
|
void upscale_clut_nn_y_3_5(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height)
|
||||||
{
|
{
|
||||||
int y, j;
|
int y, j;
|
||||||
|
|
||||||
/* 3:5, 0 0+1 1 1+2 2 */
|
for (y = 0; y < height; y += 3) {
|
||||||
for (y = 0; y < 144; y += 3) {
|
/* lines 0,2,4 */
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 3; j++) {
|
||||||
h_upscale_bl2_1_2(di, ds, si, ss, 160, f_pal);
|
h_copy(di, ds, si, ss, width, f_nop);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
/* lines 1,3 */
|
||||||
|
di -= 5*ds;
|
||||||
|
for (j = 0; j < 2; j++) {
|
||||||
|
v_copy(&di[0], &di[-ds], width, f_nop);
|
||||||
|
di += 2*ds;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_nn_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int y, j;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y += 3) {
|
||||||
|
for (j = 0; j < 3; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
di += ds;
|
di += ds;
|
||||||
}
|
}
|
||||||
di -= 5*ds;
|
di -= 5*ds;
|
||||||
for (j = 0; j < 2; j++) {
|
for (j = 0; j < 2; j++) {
|
||||||
v_mix(&di[0], &di[-ds], &di[ds], 320, p_05, f_nop);
|
v_copy(&di[0], &di[-ds], width, f_nop);
|
||||||
di += 2*ds;
|
di += 2*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void upscale_rgb_bl4_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal)
|
void upscale_rgb_bl2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
|
{
|
||||||
|
int y, j;
|
||||||
|
|
||||||
|
for (y = 0; y < height; y += 3) {
|
||||||
|
for (j = 0; j < 3; j++) {
|
||||||
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
|
di += ds;
|
||||||
|
}
|
||||||
|
di -= 5*ds;
|
||||||
|
for (j = 0; j < 2; j++) {
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], width, p_05, f_nop);
|
||||||
|
di += 2*ds;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void upscale_rgb_bl4_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal)
|
||||||
{
|
{
|
||||||
int y, j, d;
|
int y, j, d;
|
||||||
|
|
||||||
/* 3:5, -1+0, 0+1 0+1 1+2 2
|
/* for 1st block backwards reference virtually duplicate source line 0 */
|
||||||
* for 1st block backwards reference virtually duplicate source line 0 */
|
for (y = 0, d = 2*ds; y < height; y += 3, d = -ds) {
|
||||||
for (y = 0, d = 2*ds; y < 144; y += 3, d = -ds) {
|
|
||||||
di += 2*ds;
|
di += 2*ds;
|
||||||
for (j = 0; j < 3; j++) {
|
for (j = 0; j < 3; j++) {
|
||||||
h_upscale_bl2_1_2(di, ds, si, ss, 160, f_pal);
|
h_copy(di, ds, si, ss, width, f_pal);
|
||||||
}
|
}
|
||||||
di -= 5*ds;
|
di -= 5*ds;
|
||||||
v_mix(&di[0], &di[d ], &di[2*ds], 320, p_05, f_nop); /*-1+0 */
|
v_mix(&di[0], &di[d ], &di[2*ds], width, p_05, f_nop); /*-1+0 */
|
||||||
di += ds;
|
di += ds;
|
||||||
v_mix(&di[0], &di[ds], &di[2*ds], 320, p_075, f_nop); /* 0+1 */
|
v_mix(&di[0], &di[ds], &di[2*ds], width, p_075, f_nop);/* 0+1 */
|
||||||
di += ds;
|
di += ds;
|
||||||
v_mix(&di[0], &di[ 0], &di[ ds], 320, p_025, f_nop); /* 0+1 */
|
v_mix(&di[0], &di[ 0], &di[ ds], width, p_025, f_nop);/* 0+1 */
|
||||||
di += ds;
|
di += ds;
|
||||||
v_mix(&di[0], &di[ 0], &di[ ds], 320, p_05, f_nop); /* 1+2 */
|
v_mix(&di[0], &di[ 0], &di[ ds], width, p_05, f_nop); /* 1+2 */
|
||||||
di += 2*ds;
|
di += 2*ds;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -7,7 +7,7 @@
|
||||||
* nn: nearest neighbour
|
* nn: nearest neighbour
|
||||||
* snn: "smoothed" nearest neighbour (see below)
|
* snn: "smoothed" nearest neighbour (see below)
|
||||||
* bln: n-level-bilinear with n quantized weights
|
* bln: n-level-bilinear with n quantized weights
|
||||||
* quantization: 0: a<1/2*n, 1/n: 1/2*n<=a<3/2*n, etc
|
* quantization: 0: a<1/(2*n), 1/n: 1/(2*n)<=a<3/(2*n), etc
|
||||||
* currently n=2, n=4 are implemented (there's n=8 mixing, but no filters)
|
* currently n=2, n=4 are implemented (there's n=8 mixing, but no filters)
|
||||||
* [NB this has been brought to my attn, which is probably the same as bl2:
|
* [NB this has been brought to my attn, which is probably the same as bl2:
|
||||||
* https://www.drdobbs.com/image-scaling-with-bresenham/184405045?pgno=1]
|
* https://www.drdobbs.com/image-scaling-with-bresenham/184405045?pgno=1]
|
||||||
|
@ -18,34 +18,37 @@
|
||||||
* a sharper look than a bilinear filter, at the price of some visible jags
|
* a sharper look than a bilinear filter, at the price of some visible jags
|
||||||
* on diagonal edges.
|
* on diagonal edges.
|
||||||
*
|
*
|
||||||
* scaling modes:
|
* example scaling modes:
|
||||||
* 256x___ -> 320x___ only horizontal scaling. Produces an aspect error of
|
* 256x_Y_ -> 320x_Y_, H32/mode 4, PAR 5:4, for PAL DAR 4:3 (NTSC 7% aspect err)
|
||||||
* ~7% for NTSC 224 line modes, but is correct for PAL
|
* 256x224 -> 320x240, H32/mode 4, PAR 5:4, for NTSC DAR 4:3 (PAL 7% aspect err)
|
||||||
* 256/320x224/240
|
* 320x224 -> 320x240, PAR 1:1, for NTSC, DAR 4:3 (PAL 7% etc etc...)
|
||||||
* -> 320x240 always produces 320x240 at DAR 4:3
|
* 160x144 -> 320x240: GG, PAR 6:5, scaling to 320x240 for DAR 4:3
|
||||||
* 160x144 -> 320x240 game gear (currently unused)
|
*
|
||||||
*
|
*
|
||||||
* (C) 2021 kub <derkub@gmail.com>
|
* (C) 2021 kub <derkub@gmail.com>
|
||||||
|
*
|
||||||
|
* This work is licensed under the terms of MAME license.
|
||||||
|
* See COPYING file in the top-level directory.
|
||||||
*/
|
*/
|
||||||
#include <pico/pico_types.h>
|
#include <pico/pico_types.h>
|
||||||
|
|
||||||
/* RGB565 pixel mixing, see https://www.compuphase.com/graphic/scale3.htm and
|
/* RGB565 pixel mixing, see https://www.compuphase.com/graphic/scale3.htm and
|
||||||
http://blargg.8bitalley.com/info/rgb_mixing.html */
|
http://blargg.8bitalley.com/info/rgb_mixing.html */
|
||||||
/* 2-level mixing */
|
/* 2-level mixing */
|
||||||
//#define p_05(p1,p2) (((p1)+(p2) + ( ((p1)^(p2))&0x0821))>>1) // round up
|
//#define p_05(d,p1,p2) d=(((p1)+(p2) + ( ((p1)^(p2))&0x0821))>>1) // round up
|
||||||
//#define p_05(p1,p2) (((p1)+(p2) - ( ((p1)^(p2))&0x0821))>>1) // round down
|
//#define p_05(d,p1,p2) d=(((p1)+(p2) - ( ((p1)^(p2))&0x0821))>>1) // round down
|
||||||
#define p_05(p1,p2) (((p1)&(p2)) + ((((p1)^(p2))&~0x0821)>>1))
|
#define p_05(d,p1,p2) d=(((p1)&(p2)) + ((((p1)^(p2))&~0x0821)>>1))
|
||||||
/* 4-level mixing, 2 times slower */
|
/* 4-level mixing, 2 times slower */
|
||||||
// 1/4*p1 + 3/4*p2 = 1/2*(1/2*(p1+p2) + p2)
|
// 1/4*p1 + 3/4*p2 = 1/2*(1/2*(p1+p2) + p2)
|
||||||
#define p_025(p1,p2) (t=p_05(p1, p2), p_05( t, p2))
|
#define p_025(d,p1,p2) p_05(t, p1, p2); p_05( d, t, p2)
|
||||||
#define p_075(p1,p2) p_025(p2,p1)
|
#define p_075(d,p1,p2) p_025(d,p2,p1)
|
||||||
/* 8-level mixing, 3 times slower */
|
/* 8-level mixing, 3 times slower */
|
||||||
// 1/8*p1 + 7/8*p2 = 1/2*(1/2*(1/2*(p1+p2) + p2) + p2)
|
// 1/8*p1 + 7/8*p2 = 1/2*(1/2*(1/2*(p1+p2) + p2) + p2)
|
||||||
#define p_0125(p1,p2) (t=p_05(p1, p2), u=p_05( t, p2), p_05( u, p2))
|
#define p_0125(d,p1,p2) p_05(t, p1, p2); p_05( u, t, p2); p_05( d, u, p2)
|
||||||
// 3/8*p1 + 5/8*p2 = 1/2*(1/2*(1/2*(p1+p2) + p2) + 1/2*(p1+p2))
|
// 3/8*p1 + 5/8*p2 = 1/2*(1/2*(1/2*(p1+p2) + p2) + 1/2*(p1+p2))
|
||||||
#define p_0375(p1,p2) (t=p_05(p1, p2), u=p_05( t, p2), p_05( u, t))
|
#define p_0375(d,p1,p2) p_05(t, p1, p2); p_05( u, t, p2); p_05( d, u, t)
|
||||||
#define p_0625(p1,p2) p_0375(p2,p1)
|
#define p_0625(d,p1,p2) p_0375(d,p2,p1)
|
||||||
#define p_0875(p1,p2) p_0125(p2,p1)
|
#define p_0875(d,p1,p2) p_0125(d,p2,p1)
|
||||||
|
|
||||||
/* pixel transforms */
|
/* pixel transforms */
|
||||||
#define f_pal(v) pal[v] // convert CLUT index -> RGB565
|
#define f_pal(v) pal[v] // convert CLUT index -> RGB565
|
||||||
|
@ -55,7 +58,7 @@
|
||||||
/*
|
/*
|
||||||
scalers h:
|
scalers h:
|
||||||
256->320: - (4:5) (256x224/240 -> 320x224/240)
|
256->320: - (4:5) (256x224/240 -> 320x224/240)
|
||||||
256->299: - (6:7) (256x224 -> 299x224, DAR 4:3, 10.5 px border )
|
256->299: - (6:7) (256x224 -> 299x224, alt?)
|
||||||
160->320: - (1:2) 2x (160x144 -> 320x240, GG)
|
160->320: - (1:2) 2x (160x144 -> 320x240, GG)
|
||||||
160->288: - (5:9) (160x144 -> 288x216, GG alt?)
|
160->288: - (5:9) (160x144 -> 288x216, GG alt?)
|
||||||
*/
|
*/
|
||||||
|
@ -95,7 +98,7 @@ scalers h:
|
||||||
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
||||||
di[0] = f(si[0]); \
|
di[0] = f(si[0]); \
|
||||||
di[1] = f(si[1]); \
|
di[1] = f(si[1]); \
|
||||||
di[2] = p_05(f(si[1]),f(si[2])); \
|
p_05(di[2], f(si[1]),f(si[2])); \
|
||||||
di[3] = f(si[2]); \
|
di[3] = f(si[2]); \
|
||||||
di[4] = f(si[3]); \
|
di[4] = f(si[3]); \
|
||||||
} \
|
} \
|
||||||
|
@ -104,12 +107,12 @@ scalers h:
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
#define h_upscale_bln_4_5(di,ds,si,ss,w,f) do { \
|
#define h_upscale_bln_4_5(di,ds,si,ss,w,f) do { \
|
||||||
int i, t; \
|
int i; u16 t; \
|
||||||
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
||||||
di[0] = f(si[0]); \
|
di[0] = f(si[0]); \
|
||||||
di[1] = p_025(f(si[0]),f(si[1])); \
|
p_025(di[1], f(si[0]),f(si[1])); \
|
||||||
di[2] = p_05 (f(si[1]),f(si[2])); \
|
p_05 (di[2], f(si[1]),f(si[2])); \
|
||||||
di[3] = p_075(f(si[2]),f(si[3])); \
|
p_075(di[3], f(si[2]),f(si[3])); \
|
||||||
di[4] = f(si[3]); \
|
di[4] = f(si[3]); \
|
||||||
} \
|
} \
|
||||||
di += ds - w/4*5; \
|
di += ds - w/4*5; \
|
||||||
|
@ -120,8 +123,8 @@ scalers h:
|
||||||
int i; \
|
int i; \
|
||||||
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
||||||
di[0] = f(si[0]); \
|
di[0] = f(si[0]); \
|
||||||
di[1] = p_05(f(si[0]),f(si[1])); \
|
p_05(di[1], f(si[0]),f(si[1])); \
|
||||||
di[2] = p_05(f(si[1]),f(si[2])); \
|
p_05(di[2], f(si[1]),f(si[2])); \
|
||||||
di[3] = f(si[2]); \
|
di[3] = f(si[2]); \
|
||||||
di[4] = f(si[3]); \
|
di[4] = f(si[3]); \
|
||||||
} \
|
} \
|
||||||
|
@ -130,12 +133,12 @@ scalers h:
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
#define h_upscale_bl4_4_5(di,ds,si,ss,w,f) do { \
|
#define h_upscale_bl4_4_5(di,ds,si,ss,w,f) do { \
|
||||||
int i, t; uint p = f(si[0]); \
|
int i; u16 t, p = f(si[0]); \
|
||||||
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
||||||
di[0] = p_025(p, f(si[0])); \
|
p_025(di[0], p, f(si[0])); \
|
||||||
di[1] = p_05 (f(si[0]),f(si[1])); \
|
p_05 (di[1], f(si[0]),f(si[1])); \
|
||||||
di[2] = p_05 (f(si[1]),f(si[2])); \
|
p_05 (di[2], f(si[1]),f(si[2])); \
|
||||||
di[3] = p_075(f(si[2]),f(si[3])); \
|
p_075(di[3], f(si[2]),f(si[3])); \
|
||||||
di[4] = p = f(si[3]); \
|
di[4] = p = f(si[3]); \
|
||||||
} \
|
} \
|
||||||
di += ds - w/4*5; \
|
di += ds - w/4*5; \
|
||||||
|
@ -143,12 +146,12 @@ scalers h:
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
#define h_upscale_bl8_4_5(di,ds,si,ss,w,f) do { \
|
#define h_upscale_bl8_4_5(di,ds,si,ss,w,f) do { \
|
||||||
int i, t, u; uint p = f(si[0]); \
|
int i; u16 t, u, p = f(si[0]); \
|
||||||
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
for (i = w/4; i > 0; i--, si += 4, di += 5) { \
|
||||||
di[0] = p_025(p, f(si[0])); \
|
p_025 (di[0], p, f(si[0])); \
|
||||||
di[1] = p_0375(f(si[0]),f(si[1])); \
|
p_0375(di[1], f(si[0]),f(si[1])); \
|
||||||
di[2] = p_0625(f(si[1]),f(si[2])); \
|
p_0625(di[2], f(si[1]),f(si[2])); \
|
||||||
di[3] = p_075(f(si[2]),f(si[3])); \
|
p_075 (di[3], f(si[2]),f(si[3])); \
|
||||||
di[4] = p = f(si[3]); \
|
di[4] = p = f(si[3]); \
|
||||||
} \
|
} \
|
||||||
di += ds - w/4*5; \
|
di += ds - w/4*5; \
|
||||||
|
@ -195,7 +198,7 @@ scalers h:
|
||||||
di[0] = f(si[0]); \
|
di[0] = f(si[0]); \
|
||||||
di[1] = f(si[1]); \
|
di[1] = f(si[1]); \
|
||||||
di[2] = f(si[2]); \
|
di[2] = f(si[2]); \
|
||||||
di[3] = p_05(f(si[2]),f(si[3])); \
|
p_05(di[3], f(si[2]),f(si[3])); \
|
||||||
di[4] = f(si[3]); \
|
di[4] = f(si[3]); \
|
||||||
di[5] = f(si[4]); \
|
di[5] = f(si[4]); \
|
||||||
di[6] = f(si[5]); \
|
di[6] = f(si[5]); \
|
||||||
|
@ -208,10 +211,10 @@ scalers h:
|
||||||
int i; \
|
int i; \
|
||||||
for (i = w/6; i > 0; i--, si += 6, di += 7) { \
|
for (i = w/6; i > 0; i--, si += 6, di += 7) { \
|
||||||
di[0] = f(si[0]); \
|
di[0] = f(si[0]); \
|
||||||
di[1] = p_05(f(si[0]),f(si[1])); \
|
p_05(di[1], f(si[0]),f(si[1])); \
|
||||||
di[2] = p_05(f(si[1]),f(si[2])); \
|
p_05(di[2], f(si[1]),f(si[2])); \
|
||||||
di[3] = p_05(f(si[2]),f(si[3])); \
|
p_05(di[3], f(si[2]),f(si[3])); \
|
||||||
di[4] = p_05(f(si[3]),f(si[4])); \
|
p_05(di[4], f(si[3]),f(si[4])); \
|
||||||
di[5] = f(si[4]); \
|
di[5] = f(si[4]); \
|
||||||
di[6] = f(si[5]); \
|
di[6] = f(si[5]); \
|
||||||
} \
|
} \
|
||||||
|
@ -220,14 +223,14 @@ scalers h:
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
#define h_upscale_bl4_6_7(di,ds,si,ss,w,f) do { \
|
#define h_upscale_bl4_6_7(di,ds,si,ss,w,f) do { \
|
||||||
int i, t; uint p = f(si[0]); \
|
int i; u16 t p = f(si[0]); \
|
||||||
for (i = w/6; i > 0; i--, si += 6, di += 7) { \
|
for (i = w/6; i > 0; i--, si += 6, di += 7) { \
|
||||||
di[0] = p_025(p,f(si[0])); \
|
p_025(di[0], p, f(si[0])); \
|
||||||
di[1] = p_025(f(si[0]),f(si[1])); \
|
p_025(di[1], f(si[0]),f(si[1])); \
|
||||||
di[2] = p_05 (f(si[1]),f(si[2])); \
|
p_05 (di[2], f(si[1]),f(si[2])); \
|
||||||
di[3] = p_05 (f(si[2]),f(si[3])); \
|
p_05 (di[3], f(si[2]),f(si[3])); \
|
||||||
di[4] = p_075(f(si[3]),f(si[4])); \
|
p_075(di[4], f(si[3]),f(si[4])); \
|
||||||
di[5] = p_075(f(si[4]),f(si[5])); \
|
p_075(di[5], f(si[4]),f(si[5])); \
|
||||||
di[6] = p = f(si[5]); \
|
di[6] = p = f(si[5]); \
|
||||||
} \
|
} \
|
||||||
di += ds - w/6*7; \
|
di += ds - w/6*7; \
|
||||||
|
@ -258,9 +261,9 @@ scalers h:
|
||||||
di[0] = f(si[0]); \
|
di[0] = f(si[0]); \
|
||||||
di[1] = f(si[0]); \
|
di[1] = f(si[0]); \
|
||||||
di[2] = f(si[1]); \
|
di[2] = f(si[1]); \
|
||||||
di[3] = p_05(f(si[1]),f(si[2])); \
|
p_05(di[3], f(si[1]),f(si[2])); \
|
||||||
di[4] = f(si[2]); \
|
di[4] = f(si[2]); \
|
||||||
di[5] = p_05(f(si[2]),f(si[3])); \
|
p_05(di[5], f(si[2]),f(si[3])); \
|
||||||
di[6] = f(si[3]); \
|
di[6] = f(si[3]); \
|
||||||
di[7] = f(si[4]); \
|
di[7] = f(si[4]); \
|
||||||
di[8] = f(si[4]); \
|
di[8] = f(si[4]); \
|
||||||
|
@ -273,13 +276,13 @@ scalers h:
|
||||||
int i; \
|
int i; \
|
||||||
for (i = w/5; i > 0; i--, si += 5, di += 9) { \
|
for (i = w/5; i > 0; i--, si += 5, di += 9) { \
|
||||||
di[0] = f(si[0]); \
|
di[0] = f(si[0]); \
|
||||||
di[1] = p_05(f(si[0]),f(si[1])); \
|
p_05(di[1], f(si[0]),f(si[1])); \
|
||||||
di[2] = f(si[1]); \
|
di[2] = f(si[1]); \
|
||||||
di[3] = p_05(f(si[1]),f(si[2])); \
|
p_05(di[3], f(si[1]),f(si[2])); \
|
||||||
di[4] = f(si[2]); \
|
di[4] = f(si[2]); \
|
||||||
di[5] = p_05(f(si[2]),f(si[3])); \
|
p_05(di[5], f(si[2]),f(si[3])); \
|
||||||
di[6] = f(si[3]); \
|
di[6] = f(si[3]); \
|
||||||
di[7] = p_05(f(si[3]),f(si[4])); \
|
p_05(di[7], f(si[3]),f(si[4])); \
|
||||||
di[8] = f(si[4]); \
|
di[8] = f(si[4]); \
|
||||||
} \
|
} \
|
||||||
di += ds - w/5*9; \
|
di += ds - w/5*9; \
|
||||||
|
@ -287,16 +290,16 @@ scalers h:
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
#define h_upscale_bl4_5_9(di,ds,si,ss,w,f) do { \
|
#define h_upscale_bl4_5_9(di,ds,si,ss,w,f) do { \
|
||||||
int i, t; uint p = f(si[0]); \
|
int i; u16 t, p = f(si[0]); \
|
||||||
for (i = w/5; i > 0; i--, si += 5, di += 9) { \
|
for (i = w/5; i > 0; i--, si += 5, di += 9) { \
|
||||||
di[0] = p_05 (p,f(si[0])); \
|
p_05 (di[0], p, f(si[0])); \
|
||||||
di[1] = f(si[0]); \
|
di[1] = f(si[0]); \
|
||||||
di[2] = p_025(f(si[0]),f(si[1])); \
|
p_025(di[2], f(si[0]),f(si[1])); \
|
||||||
di[3] = p_075(f(si[1]),f(si[2])); \
|
p_075(di[3], f(si[1]),f(si[2])); \
|
||||||
di[4] = p_025(f(si[1]),f(si[2])); \
|
p_025(di[4], f(si[1]),f(si[2])); \
|
||||||
di[5] = p_075(f(si[2]),f(si[3])); \
|
p_075(di[5], f(si[2]),f(si[3])); \
|
||||||
di[6] = f(si[3]); \
|
di[6] = f(si[3]); \
|
||||||
di[7] = p_05 (f(si[3]),f(si[4])); \
|
p_05 (di[7], f(si[3]),f(si[4])); \
|
||||||
di[8] = p = f(si[4]); \
|
di[8] = p = f(si[4]); \
|
||||||
} \
|
} \
|
||||||
di += ds - w/5*9; \
|
di += ds - w/5*9; \
|
||||||
|
@ -319,9 +322,9 @@ scalers h:
|
||||||
#define h_upscale_bl2_1_2(di,ds,si,ss,w,f) do { \
|
#define h_upscale_bl2_1_2(di,ds,si,ss,w,f) do { \
|
||||||
int i; uint p = f(si[0]); \
|
int i; uint p = f(si[0]); \
|
||||||
for (i = w/2; i > 0; i--, si += 2, di += 4) { \
|
for (i = w/2; i > 0; i--, si += 2, di += 4) { \
|
||||||
di[0] = p_05 (p, f(si[0])); \
|
p_05 (di[0], p, f(si[0])); \
|
||||||
di[1] = f(si[0]); \
|
di[1] = f(si[0]); \
|
||||||
di[2] = p_05 (f(si[0]), f(si[1])); \
|
p_05 (di[2], f(si[0]),f(si[1])); \
|
||||||
di[3] = p = f(si[1]); \
|
di[3] = p = f(si[1]); \
|
||||||
} \
|
} \
|
||||||
di += ds - w*2; \
|
di += ds - w*2; \
|
||||||
|
@ -350,12 +353,12 @@ scalers v:
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#define v_mix(di,li,ri,w,p_mix,f) do { \
|
#define v_mix(di,li,ri,w,p_mix,f) do { \
|
||||||
int i, t, u; (void)t, (void)u; \
|
u16 i, t, u; (void)t, (void)u; \
|
||||||
for (i = 0; i < w; i += 4) { \
|
for (i = 0; i < w; i += 4) { \
|
||||||
(di)[i ] = p_mix(f((li)[i ]), f((ri)[i ])); \
|
p_mix((di)[i ], f((li)[i ]),f((ri)[i ])); \
|
||||||
(di)[i+1] = p_mix(f((li)[i+1]), f((ri)[i+1])); \
|
p_mix((di)[i+1], f((li)[i+1]),f((ri)[i+1])); \
|
||||||
(di)[i+2] = p_mix(f((li)[i+2]), f((ri)[i+2])); \
|
p_mix((di)[i+2], f((li)[i+2]),f((ri)[i+2])); \
|
||||||
(di)[i+3] = p_mix(f((li)[i+3]), f((ri)[i+3])); \
|
p_mix((di)[i+3], f((li)[i+3]),f((ri)[i+3])); \
|
||||||
} \
|
} \
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
|
@ -369,32 +372,222 @@ scalers v:
|
||||||
} \
|
} \
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
|
/* scale 14:15 */
|
||||||
|
#define v_upscale_nn_14_15(di,ds,w,l) do { \
|
||||||
|
if (++l == 7) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 14) { \
|
||||||
|
l = 0; \
|
||||||
|
di -= 7*ds; \
|
||||||
|
v_copy(&di[0], &di[-ds], w, f_nop); \
|
||||||
|
di += 7*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_snn_14_15(di,ds,w,l) do { \
|
||||||
|
if (++l == 7) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 14) { \
|
||||||
|
l = 0; \
|
||||||
|
di -= 7*ds; \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_05, f_nop); \
|
||||||
|
v_mix(&di[-ds], &di[-2*ds], &di[-ds], w, p_05, f_nop); \
|
||||||
|
v_mix(&di[ ds], &di[ ds], &di[ 2*ds], w, p_05, f_nop); \
|
||||||
|
di += 7*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_bl2_14_15(di,ds,w,l) do { \
|
||||||
|
if (++l == 3) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 14) { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 11*ds; \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_05, f_nop); \
|
||||||
|
for (j = 0; j < 7; j++) { \
|
||||||
|
di += ds; \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_05, f_nop); \
|
||||||
|
} \
|
||||||
|
di += 4*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_bl4_14_15(di,ds,w,l) do { \
|
||||||
|
if (++l == 1) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 14) { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 13*ds; \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_025, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
for (j = 0; j < 3; j++) { \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_025, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
} \
|
||||||
|
for (j = 0; j < 4; j++) { \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_05, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
} \
|
||||||
|
for (j = 0; j < 4; j++) { \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_075, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
} \
|
||||||
|
di += 1*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
/* scale 16:17 */
|
||||||
|
#define v_upscale_nn_16_17(di,ds,w,l) do { \
|
||||||
|
if (++l == 8) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 16) { \
|
||||||
|
l = 0; \
|
||||||
|
di -= 8*ds; \
|
||||||
|
v_copy(&di[0], &di[-ds], w, f_nop); \
|
||||||
|
di += 8*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_snn_16_17(di,ds,w,l) do { \
|
||||||
|
if (++l == 8) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 16) { \
|
||||||
|
l = 0; \
|
||||||
|
di -= 8*ds; \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_05, f_nop); \
|
||||||
|
v_mix(&di[-ds], &di[-2*ds], &di[-ds], w, p_05, f_nop); \
|
||||||
|
v_mix(&di[ ds], &di[ ds], &di[ 2*ds], w, p_05, f_nop); \
|
||||||
|
di += 8*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_bl2_16_17(di,ds,w,l) do { \
|
||||||
|
if (++l == 4) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 16) { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 12*ds; \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_05, f_nop); \
|
||||||
|
for (j = 0; j < 7; j++) { \
|
||||||
|
di += ds; \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_05, f_nop); \
|
||||||
|
} \
|
||||||
|
di += 5*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_bl4_16_17(di,ds,w,l) do { \
|
||||||
|
if (++l == 2) { \
|
||||||
|
di += ds; \
|
||||||
|
} else if (l >= 16) { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 14*ds; \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_025, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
for (j = 0; j < 3; j++) { \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_025, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
} \
|
||||||
|
for (j = 0; j < 4; j++) { \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_05, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
} \
|
||||||
|
for (j = 0; j < 4; j++) { \
|
||||||
|
v_mix(&di[0], &di[0], &di[ds], w, p_075, f_nop); \
|
||||||
|
di += ds; \
|
||||||
|
} \
|
||||||
|
di += 2*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
/* scale 3:5 */
|
||||||
|
#define v_upscale_nn_3_5(di,ds,w,l) do { \
|
||||||
|
if (++l < 3) { \
|
||||||
|
di += ds; \
|
||||||
|
} else { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 4*ds; \
|
||||||
|
for (j = 0; j < 2; j++) { \
|
||||||
|
v_copy(&di[0], &di[-ds], w, f_nop); \
|
||||||
|
di += 2*ds; \
|
||||||
|
} \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_snn_3_5(di,ds,w,l) do { \
|
||||||
|
if (++l < 3) { \
|
||||||
|
di += ds; \
|
||||||
|
} else { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 4*ds; \
|
||||||
|
for (j = 0; j < 2; j++) { \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_05, f_nop); \
|
||||||
|
di += 2*ds; \
|
||||||
|
} \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
/* scale 2:3 */
|
||||||
|
#define v_upscale_nn_2_3(di,ds,w,l) do { \
|
||||||
|
if (++l < 2) { \
|
||||||
|
di += ds; \
|
||||||
|
} else { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 2*ds; \
|
||||||
|
v_copy(&di[0], &di[-ds], w, f_nop); \
|
||||||
|
di += 2*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
#define v_upscale_snn_2_3(di,ds,w,l) do { \
|
||||||
|
if (++l < 2) { \
|
||||||
|
di += ds; \
|
||||||
|
} else { \
|
||||||
|
int j; \
|
||||||
|
l = 0; \
|
||||||
|
di -= 2*ds; \
|
||||||
|
v_mix(&di[0], &di[-ds], &di[ds], w, p_05, f_nop); \
|
||||||
|
di += 2*ds; \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
|
|
||||||
/* 256x___ -> 320x___, H32/mode 4, PAR 5:4, for PAL DAR 4:3 (wrong for NTSC) */
|
/* X x Y -> X*5/4 x Y, for X 256->320 */
|
||||||
void upscale_clut_nn_256_320x___(u8 *__restrict di, int ds, u8 *__restrict si, int ss, int height);
|
void upscale_rgb_nn_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_nn_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal);
|
void upscale_rgb_snn_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_snn_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal);
|
void upscale_rgb_bl2_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_bl2_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal);
|
void upscale_rgb_bl4_x_4_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_bl4_256_320x___(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int height, u16 *pal);
|
|
||||||
|
|
||||||
/* 256x224 -> 320x240, H32/mode 4, PAR 5:4, for NTSC DAR 4:3 (wrong for PAL) */
|
/* X x Y -> X x Y*17/16, for Y 224->238 or 192->204 (SMS) */
|
||||||
void upscale_clut_nn_256_320x224_240(u8 *__restrict di, int ds, u8 *__restrict si, int ss);
|
void upscale_rgb_nn_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_nn_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
void upscale_rgb_snn_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_snn_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
void upscale_rgb_bl2_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_bl2_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
void upscale_rgb_bl4_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_bl4_256_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
|
||||||
|
|
||||||
/* 320x224 -> 320x240, PAR 1:1, for NTSC, DAR 4:3 (wrong for PAL) */
|
/* X x Y -> X*5/4 x Y*17/16 */
|
||||||
void upscale_clut_nn_320x224_240(u8 *__restrict di, int ds, u8 *__restrict si, int ss);
|
void upscale_rgb_nn_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_nn_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
void upscale_rgb_snn_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_snn_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
void upscale_rgb_bl2_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_bl2_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
void upscale_rgb_bl4_x_4_5_y_16_17(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
void upscale_rgb_bl4_320x224_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
|
||||||
|
/* X x Y -> X*2/1 x Y, e.g. for X 160->320 (GG) */
|
||||||
|
void upscale_rgb_nn_x_1_2(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
void upscale_rgb_bl2_x_1_2(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
|
||||||
|
/* X x Y -> X x Y*5/3, e.g. for Y 144->240 (GG) */
|
||||||
|
void upscale_rgb_nn_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
void upscale_rgb_bl2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
void upscale_rgb_bl4_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
|
||||||
|
/* X x Y -> X*2/1 x Y*5/3 (GG) */
|
||||||
|
void upscale_rgb_nn_x_1_2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
void upscale_rgb_bl2_x_1_2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
void upscale_rgb_bl4_x_1_2_y_3_5(u16 *__restrict di, int ds, u8 *__restrict si, int ss, int width, int height, u16 *pal);
|
||||||
|
|
||||||
/* 160x144 -> 320x240: GG, PAR 6:5, scaling to 320x240 for DAR 4:3 */
|
|
||||||
void upscale_clut_nn_160_320x144_240(u8 *__restrict di, int ds, u8 *__restrict si, int ss);
|
|
||||||
void upscale_rgb_nn_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
|
||||||
void upscale_rgb_snn_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
|
||||||
void upscale_rgb_bl2_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
|
||||||
void upscale_rgb_bl4_160_320x144_240(u16 *__restrict di, int ds, u8 *__restrict si, int ss, u16 *pal);
|
|
||||||
|
|
|
@ -558,14 +558,16 @@ static void vid_reset_mode(void)
|
||||||
Pico.m.dirtyPal = 1;
|
Pico.m.dirtyPal = 1;
|
||||||
|
|
||||||
PicoIn.opt &= ~POPT_EN_SOFTSCALE;
|
PicoIn.opt &= ~POPT_EN_SOFTSCALE;
|
||||||
if (currentConfig.scaling == EOPT_SCALE_SW)
|
if (currentConfig.scaling == EOPT_SCALE_SW) {
|
||||||
PicoIn.opt |= POPT_EN_SOFTSCALE;
|
PicoIn.opt |= POPT_EN_SOFTSCALE;
|
||||||
|
PicoIn.filter = EOPT_FILTER_BILINEAR2;
|
||||||
|
}
|
||||||
|
|
||||||
// palette converters for 8bit modes
|
// palette converters for 8bit modes
|
||||||
make_local_pal = (PicoIn.AHW & PAHW_SMS) ? make_local_pal_sms : make_local_pal_md;
|
make_local_pal = (PicoIn.AHW & PAHW_SMS) ? make_local_pal_sms : make_local_pal_md;
|
||||||
}
|
}
|
||||||
|
|
||||||
void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
void emu_video_mode_change(int start_line, int line_count, int start_col, int col_count)
|
||||||
{
|
{
|
||||||
int scalex = 320, scaley = 240;
|
int scalex = 320, scaley = 240;
|
||||||
int ln_offs = 0;
|
int ln_offs = 0;
|
||||||
|
@ -578,10 +580,10 @@ void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
||||||
|
|
||||||
/* set up hwscaling here */
|
/* set up hwscaling here */
|
||||||
PicoIn.opt &= ~POPT_DIS_32C_BORDER;
|
PicoIn.opt &= ~POPT_DIS_32C_BORDER;
|
||||||
if (is_32cols && currentConfig.scaling == EOPT_SCALE_HW) {
|
if (col_count < 320 && currentConfig.scaling == EOPT_SCALE_HW) {
|
||||||
scalex = 256;
|
scalex = col_count;
|
||||||
PicoIn.opt |= POPT_DIS_32C_BORDER;
|
PicoIn.opt |= POPT_DIS_32C_BORDER;
|
||||||
osd_fps_x = OSD_FPS_X - 64;
|
osd_fps_x = col_count - (320-OSD_FPS_X);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (currentConfig.vscaling == EOPT_SCALE_HW) {
|
if (currentConfig.vscaling == EOPT_SCALE_HW) {
|
||||||
|
|
|
@ -84,7 +84,6 @@ static retro_environment_t environ_cb;
|
||||||
static retro_audio_sample_batch_t audio_batch_cb;
|
static retro_audio_sample_batch_t audio_batch_cb;
|
||||||
|
|
||||||
#define VOUT_MAX_WIDTH 320
|
#define VOUT_MAX_WIDTH 320
|
||||||
#define VOUT_32COL_WIDTH 256
|
|
||||||
#define VOUT_MAX_HEIGHT 240
|
#define VOUT_MAX_HEIGHT 240
|
||||||
|
|
||||||
#define INITIAL_SND_RATE 44100
|
#define INITIAL_SND_RATE 44100
|
||||||
|
@ -99,7 +98,8 @@ static bool old_show_overscan = false;
|
||||||
/* Required to allow on the fly changes to 'show overscan' */
|
/* Required to allow on the fly changes to 'show overscan' */
|
||||||
static int vm_current_start_line = -1;
|
static int vm_current_start_line = -1;
|
||||||
static int vm_current_line_count = -1;
|
static int vm_current_line_count = -1;
|
||||||
static int vm_current_is_32cols = -1;
|
static int vm_current_start_col = -1;
|
||||||
|
static int vm_current_col_count = -1;
|
||||||
|
|
||||||
static int vout_16bit = 1;
|
static int vout_16bit = 1;
|
||||||
static int vout_format = PDF_RGB555;
|
static int vout_format = PDF_RGB555;
|
||||||
|
@ -615,13 +615,14 @@ int plat_mem_set_exec(void *ptr, size_t size)
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
||||||
void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
void emu_video_mode_change(int start_line, int line_count, int start_col, int col_count)
|
||||||
{
|
{
|
||||||
struct retro_system_av_info av_info;
|
struct retro_system_av_info av_info;
|
||||||
|
|
||||||
vm_current_start_line = start_line;
|
vm_current_start_line = start_line;
|
||||||
vm_current_line_count = line_count;
|
vm_current_line_count = line_count;
|
||||||
vm_current_is_32cols = is_32cols;
|
vm_current_start_col = start_col;
|
||||||
|
vm_current_col_count = col_count;
|
||||||
|
|
||||||
// 8bit renderes create a 328x256 CLUT image, while 16bit creates 320x240 RGB
|
// 8bit renderes create a 328x256 CLUT image, while 16bit creates 320x240 RGB
|
||||||
vout_16bit = vout_format == PDF_RGB555 || (PicoIn.AHW & PAHW_32X);
|
vout_16bit = vout_format == PDF_RGB555 || (PicoIn.AHW & PAHW_32X);
|
||||||
|
@ -631,13 +632,7 @@ void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
||||||
vout_width = (vout_16bit ? VOUT_MAX_WIDTH : VOUT_8BIT_WIDTH);
|
vout_width = (vout_16bit ? VOUT_MAX_WIDTH : VOUT_8BIT_WIDTH);
|
||||||
vout_height = (vout_16bit ? VOUT_MAX_HEIGHT : VOUT_8BIT_HEIGHT);
|
vout_height = (vout_16bit ? VOUT_MAX_HEIGHT : VOUT_8BIT_HEIGHT);
|
||||||
vout_offset = (vout_16bit ? 0 : 8); // 8bit has 8 px overlap area on the left
|
vout_offset = (vout_16bit ? 0 : 8); // 8bit has 8 px overlap area on the left
|
||||||
if (is_32cols) {
|
padding = (struct retro_hw_ps2_insets){start_line, vout_offset, vout_height - line_count - start_line, vout_width - col_count - vout_offset};
|
||||||
// 256x240, with or w/o overlap on the left and 64 px on the right
|
|
||||||
padding = (struct retro_hw_ps2_insets){start_line, vout_offset, vout_height - line_count - start_line, vout_width - 256.0f - vout_offset};
|
|
||||||
} else {
|
|
||||||
// 320x240, with or w/o overlap on the left and none on the right
|
|
||||||
padding = (struct retro_hw_ps2_insets){start_line, vout_offset, vout_height - line_count - start_line, vout_width - 320.0f - vout_offset};
|
|
||||||
}
|
|
||||||
|
|
||||||
int pxsz = (vout_16bit ? 2 : 1); // pixel size: RGB = 16 bits, CLUT = 8 bits
|
int pxsz = (vout_16bit ? 2 : 1); // pixel size: RGB = 16 bits, CLUT = 8 bits
|
||||||
memset(vout_buf, 0, pxsz * vout_width * vout_height);
|
memset(vout_buf, 0, pxsz * vout_width * vout_height);
|
||||||
|
@ -651,7 +646,7 @@ void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
||||||
ps2->padding = padding;
|
ps2->padding = padding;
|
||||||
}
|
}
|
||||||
#else
|
#else
|
||||||
vout_width = is_32cols ? VOUT_32COL_WIDTH : VOUT_MAX_WIDTH;
|
vout_width = col_count;
|
||||||
memset(vout_buf, 0, VOUT_MAX_WIDTH * VOUT_MAX_HEIGHT * 2);
|
memset(vout_buf, 0, VOUT_MAX_WIDTH * VOUT_MAX_HEIGHT * 2);
|
||||||
if (vout_16bit)
|
if (vout_16bit)
|
||||||
PicoDrawSetOutBuf(vout_buf, vout_width * 2);
|
PicoDrawSetOutBuf(vout_buf, vout_width * 2);
|
||||||
|
@ -686,11 +681,11 @@ void emu_32x_startup(void)
|
||||||
PicoDrawSetOutFormat(vout_format, 0);
|
PicoDrawSetOutFormat(vout_format, 0);
|
||||||
if ((vm_current_start_line != -1) &&
|
if ((vm_current_start_line != -1) &&
|
||||||
(vm_current_line_count != -1) &&
|
(vm_current_line_count != -1) &&
|
||||||
(vm_current_is_32cols != -1))
|
(vm_current_start_col != -1) &&
|
||||||
|
(vm_current_col_count != -1))
|
||||||
emu_video_mode_change(
|
emu_video_mode_change(
|
||||||
vm_current_start_line,
|
vm_current_start_line, vm_current_line_count,
|
||||||
vm_current_line_count,
|
vm_current_start_col, vm_current_col_count);
|
||||||
vm_current_is_32cols);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void lprintf(const char *fmt, ...)
|
void lprintf(const char *fmt, ...)
|
||||||
|
@ -1621,11 +1616,11 @@ static void update_variables(bool first_run)
|
||||||
{
|
{
|
||||||
if ((vm_current_start_line != -1) &&
|
if ((vm_current_start_line != -1) &&
|
||||||
(vm_current_line_count != -1) &&
|
(vm_current_line_count != -1) &&
|
||||||
(vm_current_is_32cols != -1))
|
(vm_current_start_col != -1) &&
|
||||||
|
(vm_current_col_count != -1))
|
||||||
emu_video_mode_change(
|
emu_video_mode_change(
|
||||||
vm_current_start_line,
|
vm_current_start_line, vm_current_line_count,
|
||||||
vm_current_line_count,
|
vm_current_start_col, vm_current_col_count);
|
||||||
vm_current_is_32cols);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Reinitialise frameskipping, if required */
|
/* Reinitialise frameskipping, if required */
|
||||||
|
|
|
@ -14,6 +14,7 @@
|
||||||
#include "../libpicofe/plat.h"
|
#include "../libpicofe/plat.h"
|
||||||
#include "../common/emu.h"
|
#include "../common/emu.h"
|
||||||
#include "../common/arm_utils.h"
|
#include "../common/arm_utils.h"
|
||||||
|
#include "../common/upscale.h"
|
||||||
#include "../common/version.h"
|
#include "../common/version.h"
|
||||||
|
|
||||||
#include <pico/pico_int.h>
|
#include <pico/pico_int.h>
|
||||||
|
@ -23,8 +24,9 @@ const char *renderer_names[] = { "16bit accurate", " 8bit accurate", " 8bit fast
|
||||||
const char *renderer_names32x[] = { "accurate", "faster", "fastest", NULL };
|
const char *renderer_names32x[] = { "accurate", "faster", "fastest", NULL };
|
||||||
enum renderer_types { RT_16BIT, RT_8BIT_ACC, RT_8BIT_FAST, RT_COUNT };
|
enum renderer_types { RT_16BIT, RT_8BIT_ACC, RT_8BIT_FAST, RT_COUNT };
|
||||||
|
|
||||||
static int out_x, out_y;
|
static int out_x, out_y, out_w, out_h; // renderer output in render buffer
|
||||||
static int out_w, out_h;
|
static int screen_x, screen_y, screen_w, screen_h; // final render destination
|
||||||
|
static int render_bg; // force 16bit mode for bg render
|
||||||
|
|
||||||
void pemu_prep_defconfig(void)
|
void pemu_prep_defconfig(void)
|
||||||
{
|
{
|
||||||
|
@ -38,7 +40,7 @@ void pemu_validate_config(void)
|
||||||
}
|
}
|
||||||
|
|
||||||
#define is_16bit_mode() \
|
#define is_16bit_mode() \
|
||||||
(currentConfig.renderer == RT_16BIT || (PicoIn.AHW & PAHW_32X))
|
(currentConfig.renderer == RT_16BIT || (PicoIn.AHW & PAHW_32X) || render_bg)
|
||||||
|
|
||||||
static int get_renderer(void)
|
static int get_renderer(void)
|
||||||
{
|
{
|
||||||
|
@ -82,31 +84,79 @@ static void draw_cd_leds(void)
|
||||||
#undef p
|
#undef p
|
||||||
}
|
}
|
||||||
|
|
||||||
static unsigned short *get_16bit_start(unsigned short *buf)
|
/* render/screen buffer handling:
|
||||||
|
* In 16 bit mode, render output is directly placed in the screen buffer.
|
||||||
|
* SW scaling is handled in renderer (x) and in vscaling callbacks here (y).
|
||||||
|
* In 8 bit modes, output goes to the internal Draw2FB buffer in alternate
|
||||||
|
* renderer format (8 pix overscan at left/top/bottom), left aligned (DIS_32C).
|
||||||
|
* It is converted to 16 bit and SW scaled in pemu_finalize_frame.
|
||||||
|
*
|
||||||
|
* HW scaling always aligns the image to the left/top, since selecting an area
|
||||||
|
* for display isn't always possible.
|
||||||
|
*/
|
||||||
|
|
||||||
|
static u16 *screen_buffer(u16 *buf)
|
||||||
{
|
{
|
||||||
// center the output on the screen
|
// center the emulator display on the screen if screen is larger
|
||||||
int offs = (g_screen_height-240)/2 * g_screen_ppitch + (g_screen_width-320)/2;
|
if (currentConfig.scaling != EOPT_SCALE_HW)
|
||||||
return buf + offs;
|
buf += (g_screen_width-320)/2;
|
||||||
|
if (currentConfig.vscaling != EOPT_SCALE_HW)
|
||||||
|
buf += (g_screen_height-240)/2 * g_screen_ppitch;
|
||||||
|
return buf;
|
||||||
|
}
|
||||||
|
|
||||||
|
void screen_blit(u16 *pd, int pp, u8* ps, int ss, u16 *pal)
|
||||||
|
{
|
||||||
|
typedef void (*upscale_t)
|
||||||
|
(u16 *di,int ds, u8 *si,int ss, int w,int h, u16 *pal);
|
||||||
|
upscale_t upscale_hv[] = {
|
||||||
|
upscale_rgb_nn_x_4_5_y_16_17, upscale_rgb_snn_x_4_5_y_16_17,
|
||||||
|
upscale_rgb_bl2_x_4_5_y_16_17, upscale_rgb_bl4_x_4_5_y_16_17,
|
||||||
|
};
|
||||||
|
upscale_t upscale_h[] = {
|
||||||
|
upscale_rgb_nn_x_4_5, upscale_rgb_snn_x_4_5,
|
||||||
|
upscale_rgb_bl2_x_4_5, upscale_rgb_bl4_x_4_5,
|
||||||
|
};
|
||||||
|
upscale_t upscale_v[] = {
|
||||||
|
upscale_rgb_nn_y_16_17, upscale_rgb_snn_y_16_17,
|
||||||
|
upscale_rgb_bl2_y_16_17, upscale_rgb_bl4_y_16_17,
|
||||||
|
};
|
||||||
|
upscale_t *upscale;
|
||||||
|
int y;
|
||||||
|
|
||||||
|
// handle software upscaling
|
||||||
|
upscale = NULL;
|
||||||
|
if (currentConfig.scaling == EOPT_SCALE_SW && out_w == 256) {
|
||||||
|
if (currentConfig.vscaling == EOPT_SCALE_SW && out_h <= 224)
|
||||||
|
// h+v scaling
|
||||||
|
upscale = upscale_hv;
|
||||||
|
else
|
||||||
|
// h scaling
|
||||||
|
upscale = upscale_h;
|
||||||
|
} else if (currentConfig.vscaling == EOPT_SCALE_SW && out_h <= 224) {
|
||||||
|
// v scaling
|
||||||
|
upscale = upscale_v;
|
||||||
|
} else {
|
||||||
|
// no scaling
|
||||||
|
for (y = 0; y < out_h; y++)
|
||||||
|
h_copy(pd, pp, ps, 328, out_w, f_pal);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
upscale[currentConfig.filter & 0x3](pd, pp, ps, ss, out_w, out_h, pal);
|
||||||
}
|
}
|
||||||
|
|
||||||
void pemu_finalize_frame(const char *fps, const char *notice)
|
void pemu_finalize_frame(const char *fps, const char *notice)
|
||||||
{
|
{
|
||||||
if (!is_16bit_mode()) {
|
if (!is_16bit_mode()) {
|
||||||
// convert the 8 bit CLUT output to 16 bit RGB
|
// convert the 8 bit CLUT output to 16 bit RGB
|
||||||
unsigned short *pd = (unsigned short *)g_screen_ptr +
|
u16 *pd = screen_buffer(g_screen_ptr) +
|
||||||
out_y * g_screen_ppitch + out_x;
|
screen_y * g_screen_ppitch + screen_x;
|
||||||
unsigned char *ps = Pico.est.Draw2FB + 328*out_y + 8;
|
u8 *ps = Pico.est.Draw2FB + 328*out_y + out_x + 8;
|
||||||
unsigned short *pal = Pico.est.HighPal;
|
|
||||||
int i, x;
|
|
||||||
|
|
||||||
pd = get_16bit_start(pd);
|
|
||||||
PicoDrawUpdateHighPal();
|
PicoDrawUpdateHighPal();
|
||||||
for (i = 0; i < out_h; i++, ps += 8) {
|
|
||||||
for (x = 0; x < out_w; x++)
|
screen_blit(pd, g_screen_ppitch, ps, 328, Pico.est.HighPal);
|
||||||
*pd++ = pal[*ps++];
|
|
||||||
pd += g_screen_ppitch - out_w;
|
|
||||||
ps += 320 - out_w;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (notice)
|
if (notice)
|
||||||
|
@ -120,33 +170,44 @@ void pemu_finalize_frame(const char *fps, const char *notice)
|
||||||
void plat_video_set_buffer(void *buf)
|
void plat_video_set_buffer(void *buf)
|
||||||
{
|
{
|
||||||
if (is_16bit_mode())
|
if (is_16bit_mode())
|
||||||
PicoDrawSetOutBuf(get_16bit_start(buf), g_screen_ppitch * 2);
|
PicoDrawSetOutBuf(screen_buffer(buf), g_screen_ppitch * 2);
|
||||||
}
|
}
|
||||||
|
|
||||||
static void apply_renderer(void)
|
static void apply_renderer(void)
|
||||||
{
|
{
|
||||||
|
PicoIn.opt &= ~(POPT_ALT_RENDERER|POPT_EN_SOFTSCALE|POPT_DIS_32C_BORDER);
|
||||||
switch (get_renderer()) {
|
switch (get_renderer()) {
|
||||||
case RT_16BIT:
|
case RT_16BIT:
|
||||||
PicoIn.opt &= ~POPT_ALT_RENDERER;
|
// 32X uses line mode for vscaling with accurate renderer, since
|
||||||
PicoIn.opt &= ~POPT_DIS_32C_BORDER;
|
// the MD VDP layer must be unscaled and merging the scaled 32X
|
||||||
PicoDrawSetOutFormat(PDF_RGB555, 0);
|
// image data will fail.
|
||||||
PicoDrawSetOutBuf(get_16bit_start(g_screen_ptr), g_screen_ppitch * 2);
|
PicoDrawSetOutFormat(PDF_RGB555,
|
||||||
|
(PicoIn.AHW & PAHW_32X) && currentConfig.vscaling);
|
||||||
|
PicoDrawSetOutBuf(screen_buffer(g_screen_ptr), g_screen_ppitch * 2);
|
||||||
break;
|
break;
|
||||||
case RT_8BIT_ACC:
|
case RT_8BIT_ACC:
|
||||||
PicoIn.opt &= ~POPT_ALT_RENDERER;
|
// for simplification the 8 bit accurate renderer uses the same
|
||||||
PicoIn.opt |= POPT_DIS_32C_BORDER;
|
// storage format as the fast renderer
|
||||||
PicoDrawSetOutFormat(PDF_8BIT, 0);
|
PicoDrawSetOutFormat(PDF_8BIT, 0);
|
||||||
PicoDrawSetOutBuf(Pico.est.Draw2FB, 328);
|
PicoDrawSetOutBuf(Pico.est.Draw2FB, 328);
|
||||||
break;
|
break;
|
||||||
case RT_8BIT_FAST:
|
case RT_8BIT_FAST:
|
||||||
PicoIn.opt |= POPT_ALT_RENDERER;
|
PicoIn.opt |= POPT_ALT_RENDERER;
|
||||||
PicoIn.opt |= POPT_DIS_32C_BORDER;
|
|
||||||
PicoDrawSetOutFormat(PDF_NONE, 0);
|
PicoDrawSetOutFormat(PDF_NONE, 0);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (PicoIn.AHW & PAHW_32X)
|
if (PicoIn.AHW & PAHW_32X)
|
||||||
PicoDrawSetOutBuf(get_16bit_start(g_screen_ptr), g_screen_ppitch * 2);
|
PicoDrawSetOutBuf(screen_buffer(g_screen_ptr), g_screen_ppitch * 2);
|
||||||
|
else if (is_16bit_mode()) {
|
||||||
|
if (currentConfig.scaling == EOPT_SCALE_SW) {
|
||||||
|
PicoIn.opt |= POPT_EN_SOFTSCALE;
|
||||||
|
PicoIn.filter = currentConfig.filter;
|
||||||
|
} else if (currentConfig.scaling == EOPT_SCALE_HW)
|
||||||
|
// hw scaling, render without any padding
|
||||||
|
PicoIn.opt |= POPT_DIS_32C_BORDER;
|
||||||
|
} else
|
||||||
|
PicoIn.opt |= POPT_DIS_32C_BORDER;
|
||||||
|
|
||||||
Pico.m.dirtyPal = 1;
|
Pico.m.dirtyPal = 1;
|
||||||
}
|
}
|
||||||
|
@ -188,19 +249,6 @@ void plat_update_volume(int has_changed, int is_up)
|
||||||
{
|
{
|
||||||
}
|
}
|
||||||
|
|
||||||
void pemu_forced_frame(int no_scale, int do_emu)
|
|
||||||
{
|
|
||||||
unsigned short *pd = get_16bit_start(g_screen_ptr);
|
|
||||||
|
|
||||||
PicoIn.opt &= ~POPT_DIS_32C_BORDER;
|
|
||||||
PicoDrawSetCallbacks(NULL, NULL);
|
|
||||||
Pico.m.dirtyPal = 1;
|
|
||||||
|
|
||||||
emu_cmn_forced_frame(no_scale, do_emu, pd);
|
|
||||||
|
|
||||||
g_menubg_src_ptr = g_screen_ptr;
|
|
||||||
}
|
|
||||||
|
|
||||||
void pemu_sound_start(void)
|
void pemu_sound_start(void)
|
||||||
{
|
{
|
||||||
emu_sound_start();
|
emu_sound_start();
|
||||||
|
@ -210,15 +258,116 @@ void plat_debug_cat(char *str)
|
||||||
{
|
{
|
||||||
}
|
}
|
||||||
|
|
||||||
void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
void pemu_forced_frame(int no_scale, int do_emu)
|
||||||
{
|
{
|
||||||
|
u16 *pd = screen_buffer(g_screen_ptr);
|
||||||
|
int hs = currentConfig.scaling, vs = currentConfig.vscaling;
|
||||||
|
|
||||||
|
// create centered and sw scaled (if scaling enabled) 16 bit output
|
||||||
|
PicoIn.opt &= ~POPT_DIS_32C_BORDER;
|
||||||
|
Pico.m.dirtyPal = 1;
|
||||||
|
if (currentConfig.scaling) currentConfig.scaling = EOPT_SCALE_SW;
|
||||||
|
if (currentConfig.vscaling) currentConfig.vscaling = EOPT_SCALE_SW;
|
||||||
|
plat_video_set_size(320, 240);
|
||||||
|
|
||||||
|
// render a frame in 16 bit mode
|
||||||
|
render_bg = 1;
|
||||||
|
emu_cmn_forced_frame(no_scale, do_emu, pd);
|
||||||
|
render_bg = 0;
|
||||||
|
|
||||||
|
g_menubg_src_ptr = g_screen_ptr;
|
||||||
|
currentConfig.scaling = hs, currentConfig.vscaling = vs;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* vertical sw scaling, 16 bit mode */
|
||||||
|
static int vscale_state;
|
||||||
|
|
||||||
|
static int cb_vscaling_begin(unsigned int line)
|
||||||
|
{
|
||||||
|
static int prevline = 999;
|
||||||
|
|
||||||
|
// at start of new frame?
|
||||||
|
if (line < prevline) {
|
||||||
|
// set y frame offset (see emu_change_video_mode)
|
||||||
|
u16 *dest = g_screen_ptr;
|
||||||
|
Pico.est.DrawLineDest = dest + screen_y * g_screen_ppitch;
|
||||||
|
vscale_state = 0;
|
||||||
|
}
|
||||||
|
prevline = line;
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int cb_vscaling_nop(unsigned int line)
|
||||||
|
{
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int cb_vscaling_end(unsigned int line)
|
||||||
|
{
|
||||||
|
u16 *dest = Pico.est.DrawLineDest;
|
||||||
|
switch (currentConfig.filter) {
|
||||||
|
case 3: v_upscale_bl4_16_17(dest, g_screen_ppitch, 320, vscale_state);
|
||||||
|
break;
|
||||||
|
case 2: v_upscale_bl2_16_17(dest, g_screen_ppitch, 320, vscale_state);
|
||||||
|
break;
|
||||||
|
case 1: v_upscale_snn_16_17(dest, g_screen_ppitch, 320, vscale_state);
|
||||||
|
break;
|
||||||
|
default: v_upscale_nn_16_17(dest, g_screen_ppitch, 320, vscale_state);
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
Pico.est.DrawLineDest = dest;
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
void emu_video_mode_change(int start_line, int line_count, int start_col, int col_count)
|
||||||
|
{
|
||||||
|
// relative position in core fb and screen fb
|
||||||
|
out_y = start_line; out_x = start_col;
|
||||||
|
out_h = line_count; out_w = col_count;
|
||||||
|
|
||||||
|
PicoDrawSetCallbacks(NULL, NULL);
|
||||||
|
screen_x = screen_y = 0;
|
||||||
|
screen_w = 320, screen_h = 240;
|
||||||
|
|
||||||
|
switch (currentConfig.scaling) {
|
||||||
|
case EOPT_SCALE_HW:
|
||||||
|
screen_w = out_w;
|
||||||
|
break;
|
||||||
|
case EOPT_SCALE_NONE:
|
||||||
|
// center output in screen
|
||||||
|
screen_x = (screen_w - out_w)/2;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
switch (currentConfig.vscaling) {
|
||||||
|
case EOPT_SCALE_HW:
|
||||||
|
// NTSC always has 224 visible lines, anything smaller has bars
|
||||||
|
screen_h = (out_h < 224 ? 224 : out_h);
|
||||||
|
// handle vertical centering for 16 bit mode
|
||||||
|
screen_y = (screen_h - out_h) / 2;
|
||||||
|
if (is_16bit_mode())
|
||||||
|
PicoDrawSetCallbacks(cb_vscaling_begin, cb_vscaling_nop);
|
||||||
|
break;
|
||||||
|
case EOPT_SCALE_SW:
|
||||||
|
// NTSC always has 224 visible lines, anything smaller has bars
|
||||||
|
if (out_y > 7)
|
||||||
|
screen_y = out_y - 7;
|
||||||
|
// in 16 bit mode sw scaling is divided between core and platform
|
||||||
|
if (is_16bit_mode() && out_h < 240)
|
||||||
|
PicoDrawSetCallbacks(cb_vscaling_begin, cb_vscaling_end);
|
||||||
|
break;
|
||||||
|
case EOPT_SCALE_NONE:
|
||||||
|
// center output in screen
|
||||||
|
screen_y = (screen_h - out_h)/2;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
|
plat_video_set_size(screen_w, screen_h);
|
||||||
|
plat_video_set_buffer(g_screen_ptr);
|
||||||
|
|
||||||
// clear whole screen in all buffers
|
// clear whole screen in all buffers
|
||||||
if (!is_16bit_mode())
|
if (!is_16bit_mode())
|
||||||
memset32(Pico.est.Draw2FB, 0xe0e0e0e0, (320+8) * (8+240+8) / 4);
|
memset32(Pico.est.Draw2FB, 0xe0e0e0e0, (320+8) * (8+240+8) / 4);
|
||||||
plat_video_clear_buffers();
|
plat_video_clear_buffers();
|
||||||
|
|
||||||
out_y = start_line; out_x = (is_32cols ? 32 : 0);
|
|
||||||
out_h = line_count; out_w = (is_32cols ? 256:320);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void pemu_loop_prep(void)
|
void pemu_loop_prep(void)
|
||||||
|
|
|
@ -1,12 +1,14 @@
|
||||||
#include "../libpicofe/gp2x/plat_gp2x.h"
|
|
||||||
|
|
||||||
// ------------ gfx options menu ------------
|
// ------------ gfx options menu ------------
|
||||||
|
|
||||||
|
static const char *men_scaling_opts[] = { "OFF", "software", "hardware", NULL };
|
||||||
|
static const char *men_filter_opts[] = { "nearest", "smoother", "bilinear 1", "bilinear 2", NULL };
|
||||||
|
|
||||||
const char *men_scaling_opts[] = { "OFF", "ON", NULL };
|
static const char h_scale[] = "hardware scaling may not be working on some devices";
|
||||||
|
|
||||||
#define MENU_OPTIONS_GFX \
|
#define MENU_OPTIONS_GFX \
|
||||||
// mee_enum ("screen scaling", MA_OPT_SCALING, currentConfig.scaling, men_scaling_opts), \
|
mee_enum_h ("Horizontal scaling", MA_OPT_SCALING, currentConfig.scaling, men_scaling_opts, h_scale), \
|
||||||
|
mee_enum_h ("Vertical scaling", MA_OPT_VSCALING, currentConfig.vscaling, men_scaling_opts, h_scale), \
|
||||||
|
mee_enum_h ("Scaler type", MA_OPT3_FILTERING, currentConfig.filter, men_filter_opts, NULL), \
|
||||||
|
|
||||||
#define MENU_OPTIONS_ADV
|
#define MENU_OPTIONS_ADV
|
||||||
|
|
||||||
|
|
|
@ -331,17 +331,16 @@ void pnd_restore_layer_data(void)
|
||||||
plat_video_flip();
|
plat_video_flip();
|
||||||
}
|
}
|
||||||
|
|
||||||
void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
void emu_video_mode_change(int start_line, int line_count, int start_col, int col_count)
|
||||||
{
|
{
|
||||||
int fb_w = 320, fb_h = 240, fb_left = 0, fb_right = 0, fb_top = 0, fb_bottom = 0;
|
int fb_w = 320, fb_h = 240, fb_left = 0, fb_right = 0, fb_top = 0, fb_bottom = 0;
|
||||||
|
|
||||||
if (doing_bg_frame)
|
if (doing_bg_frame)
|
||||||
return;
|
return;
|
||||||
|
|
||||||
if (is_32cols) {
|
fb_w = col_count;
|
||||||
fb_w = 256;
|
fb_left = start_col;
|
||||||
fb_left = fb_right = 32;
|
fb_right = 320 - (fb_w+fb_left);;
|
||||||
}
|
|
||||||
|
|
||||||
switch (currentConfig.scaling) {
|
switch (currentConfig.scaling) {
|
||||||
case SCALE_1x1:
|
case SCALE_1x1:
|
||||||
|
@ -349,7 +348,7 @@ void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
||||||
g_layer_h = fb_h;
|
g_layer_h = fb_h;
|
||||||
break;
|
break;
|
||||||
case SCALE_2x2_3x2:
|
case SCALE_2x2_3x2:
|
||||||
g_layer_w = fb_w * (is_32cols ? 3 : 2);
|
g_layer_w = fb_w * (col_count < 320 ? 3 : 2);
|
||||||
g_layer_h = fb_h * 2;
|
g_layer_h = fb_h * 2;
|
||||||
break;
|
break;
|
||||||
case SCALE_2x2_2x2:
|
case SCALE_2x2_2x2:
|
||||||
|
@ -381,7 +380,7 @@ void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
||||||
fb_h = line_count;
|
fb_h = line_count;
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
g_osd_fps_x = is_32cols ? 232 : 264;
|
g_osd_fps_x = col_count < 320 ? 232 : 264;
|
||||||
g_osd_y = fb_top + fb_h - 8;
|
g_osd_y = fb_top + fb_h - 8;
|
||||||
|
|
||||||
pnd_setup_layer(1, g_layer_x, g_layer_y, g_layer_w, g_layer_h);
|
pnd_setup_layer(1, g_layer_x, g_layer_y, g_layer_w, g_layer_h);
|
||||||
|
|
|
@ -674,11 +674,11 @@ void plat_update_volume(int has_changed, int is_up)
|
||||||
}
|
}
|
||||||
|
|
||||||
/* prepare for MD screen mode change */
|
/* prepare for MD screen mode change */
|
||||||
void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
void emu_video_mode_change(int start_line, int line_count, int start_col, int col_count)
|
||||||
{
|
{
|
||||||
h32_mode = is_32cols;
|
h32_mode = col_count < 320;
|
||||||
out_y = start_line; out_x = (is_32cols ? 32 : 0);
|
out_y = start_line; out_x = (h32_mode ? 32 : 0);
|
||||||
out_h = line_count; out_w = (is_32cols ? 256:320);
|
out_h = line_count; out_w = (h32_mode ? 256:320);
|
||||||
|
|
||||||
vidResetMode();
|
vidResetMode();
|
||||||
if (h32_mode) // clear borders from h40 remnants
|
if (h32_mode) // clear borders from h40 remnants
|
||||||
|
|
|
@ -107,10 +107,10 @@ void plat_video_toggle_renderer(int change, int is_menu)
|
||||||
PicoDrawSetOutFormat(PDF_RGB555, 1);
|
PicoDrawSetOutFormat(PDF_RGB555, 1);
|
||||||
}
|
}
|
||||||
|
|
||||||
void emu_video_mode_change(int start_line, int line_count, int is_32cols)
|
void emu_video_mode_change(int start_line, int line_count, int start_col, int col_count)
|
||||||
{
|
{
|
||||||
EmuScreenRect.left = is_32cols ? 32 : 0;
|
EmuScreenRect.left = start_col;
|
||||||
EmuScreenRect.right = is_32cols ? 256+32 : 320;
|
EmuScreenRect.right = start_col + col_count;
|
||||||
EmuScreenRect.top = start_line;
|
EmuScreenRect.top = start_line;
|
||||||
EmuScreenRect.bottom = start_line + line_count;
|
EmuScreenRect.bottom = start_line + line_count;
|
||||||
|
|
||||||
|
|
|
@ -134,9 +134,13 @@ get_define OFS_Pico_ Pico rom ; echo "$line" >>$fn
|
||||||
get_define OFS_Pico_ Pico romsize ; echo "$line" >>$fn
|
get_define OFS_Pico_ Pico romsize ; echo "$line" >>$fn
|
||||||
get_define OFS_Pico_ Pico est ; echo "$line" >>$fn
|
get_define OFS_Pico_ Pico est ; echo "$line" >>$fn
|
||||||
|
|
||||||
|
get_define OFS_PicoIn_ PicoInterface opt ; echo "$line" >>$fn
|
||||||
|
get_define OFS_PicoIn_ PicoInterface filter ; echo "$line" >>$fn
|
||||||
|
|
||||||
get_define OFS_EST_ PicoEState DrawScanline ; echo "$line" >>$fn
|
get_define OFS_EST_ PicoEState DrawScanline ; echo "$line" >>$fn
|
||||||
get_define OFS_EST_ PicoEState rendstatus ; echo "$line" >>$fn
|
get_define OFS_EST_ PicoEState rendstatus ; echo "$line" >>$fn
|
||||||
get_define OFS_EST_ PicoEState DrawLineDest ; echo "$line" >>$fn
|
get_define OFS_EST_ PicoEState DrawLineDest ; echo "$line" >>$fn
|
||||||
|
get_define OFS_EST_ PicoEState DrawLineDestIncr ; echo "$line" >>$fn
|
||||||
get_define OFS_EST_ PicoEState HighCol ; echo "$line" >>$fn
|
get_define OFS_EST_ PicoEState HighCol ; echo "$line" >>$fn
|
||||||
get_define OFS_EST_ PicoEState HighPreSpr ; echo "$line" >>$fn
|
get_define OFS_EST_ PicoEState HighPreSpr ; echo "$line" >>$fn
|
||||||
get_define OFS_EST_ PicoEState Pico ; echo "$line" >>$fn
|
get_define OFS_EST_ PicoEState Pico ; echo "$line" >>$fn
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue