mirror of
https://github.com/RaySollium99/picodrive.git
synced 2025-09-05 15:27:46 -04:00
revamped 32X draw arm asm code
This commit is contained in:
parent
064cc6d103
commit
23eef37f25
2 changed files with 26 additions and 22 deletions
|
@ -1,373 +0,0 @@
|
|||
@*
|
||||
@* PicoDrive
|
||||
@* (C) notaz, 2010
|
||||
@*
|
||||
@* This work is licensed under the terms of MAME license.
|
||||
@* See COPYING file in the top-level directory.
|
||||
@*
|
||||
|
||||
.extern Pico32x
|
||||
.extern PicoDraw2FB
|
||||
.extern HighPal
|
||||
|
||||
.equiv P32XV_PRI, (1<< 7)
|
||||
|
||||
.bss
|
||||
.align 2
|
||||
.global Pico32xNativePal
|
||||
Pico32xNativePal:
|
||||
.word 0
|
||||
|
||||
.text
|
||||
.align 2
|
||||
|
||||
|
||||
.macro call_scan_prep cond
|
||||
.if \cond
|
||||
ldr r4, =PicoScan32xBegin
|
||||
ldr r5, =PicoScan32xEnd
|
||||
ldr r6, =DrawLineDest
|
||||
ldr r4, [r4]
|
||||
ldr r5, [r5]
|
||||
stmfd sp!, {r4,r5,r6}
|
||||
.endif
|
||||
.endm
|
||||
|
||||
.macro call_scan_fin_ge cond
|
||||
.if \cond
|
||||
addge sp, sp, #4*3
|
||||
.endif
|
||||
.endm
|
||||
|
||||
.macro call_scan_begin cond
|
||||
.if \cond
|
||||
stmfd sp!, {r1-r3}
|
||||
and r0, r2, #0xff
|
||||
add r0, r0, r4
|
||||
mov lr, pc
|
||||
ldr pc, [sp, #(3+0)*4]
|
||||
ldr r0, [sp, #(3+2)*4] @ &DrawLineDest
|
||||
ldmfd sp!, {r1-r3}
|
||||
ldr r0, [r0]
|
||||
.endif
|
||||
.endm
|
||||
|
||||
.macro call_scan_end cond
|
||||
.if \cond
|
||||
stmfd sp!, {r0-r3}
|
||||
and r0, r2, #0xff
|
||||
add r0, r0, r4
|
||||
mov lr, pc
|
||||
ldr pc, [sp, #(4+1)*4]
|
||||
ldmfd sp!, {r0-r3}
|
||||
.endif
|
||||
.endm
|
||||
|
||||
@ direct color
|
||||
@ unsigned short *dst, unsigned short *dram, int lines_sft_offs, int mdbg
|
||||
.macro make_do_loop_dc name call_scan do_md
|
||||
.global \name
|
||||
\name:
|
||||
stmfd sp!, {r4-r11,lr}
|
||||
|
||||
ldr r10,=Pico32x
|
||||
ldr r11,=PicoDraw2FB
|
||||
ldr r10,[r10, #0x40] @ Pico32x.vdp_regs[0]
|
||||
ldr r11,[r11]
|
||||
ldr r9, =HighPal @ palmd
|
||||
and r4, r2, #0xff
|
||||
mov r5, #328
|
||||
lsl r3, #26 @ mdbg << 26
|
||||
mla r11,r4,r5,r11 @ r11 = pmd = PicoDraw2FB + offs*328: md data
|
||||
tst r10,#P32XV_PRI
|
||||
moveq r10,#0
|
||||
movne r10,#0x8000 @ r10 = inv_bit
|
||||
call_scan_prep \call_scan
|
||||
|
||||
mov r4, #0 @ line
|
||||
b 1f @ loop_outer_entry
|
||||
|
||||
0: @ loop_outer:
|
||||
call_scan_end \call_scan
|
||||
add r4, r4, #1
|
||||
sub r11,r11,#1 @ adjust for prev read
|
||||
cmp r4, r2, lsr #16
|
||||
call_scan_fin_ge \call_scan
|
||||
ldmgefd sp!, {r4-r11,pc}
|
||||
|
||||
1: @ loop_outer_entry:
|
||||
call_scan_begin \call_scan
|
||||
mov r12,r4, lsl #1
|
||||
ldrh r12,[r1, r12]
|
||||
add r11,r11,#8
|
||||
mov r6, #320
|
||||
add r5, r1, r12, lsl #1 @ p32x = dram + dram[l]
|
||||
|
||||
2: @ loop_inner:
|
||||
ldrb r7, [r11], #1 @ MD pixel
|
||||
subs r6, r6, #1
|
||||
blt 0b @ loop_outer
|
||||
ldrh r8, [r5], #2 @ 32x pixel
|
||||
cmp r3, r7, lsl #26 @ MD has bg pixel?
|
||||
beq 3f @ draw32x
|
||||
eor r12,r8, r10
|
||||
ands r12,r12,#0x8000 @ !((t ^ inv) & 0x8000)
|
||||
.if \do_md
|
||||
mov r7, r7, lsl #1
|
||||
ldreqh r12,[r9, r7]
|
||||
streqh r12,[r0], #2 @ *dst++ = palmd[*pmd]
|
||||
.endif
|
||||
beq 2b @ loop_inner
|
||||
|
||||
3: @ draw32x:
|
||||
and r12,r8, #0x03e0
|
||||
mov r8, r8, lsl #11
|
||||
orr r8, r8, r8, lsr #(10+11)
|
||||
orr r8, r8, r12,lsl #1
|
||||
bic r8, r8, #0x0020 @ kill prio bit
|
||||
strh r8, [r0], #2 @ *dst++ = bgr2rgb(*p32x++)
|
||||
b 2b @ loop_inner
|
||||
.endm
|
||||
|
||||
|
||||
@ packed pixel
|
||||
@ note: this may read a few bytes over the end of PicoDraw2FB and dram,
|
||||
@ so those should have a bit more alloc'ed than really needed.
|
||||
@ unsigned short *dst, unsigned short *dram, int lines_sft_offs, int mdbg
|
||||
.macro make_do_loop_pp name call_scan do_md
|
||||
.global \name
|
||||
\name:
|
||||
stmfd sp!, {r4-r11,lr}
|
||||
|
||||
ldr r11,=PicoDraw2FB
|
||||
ldr r10,=Pico32xNativePal
|
||||
ldr r11,[r11]
|
||||
ldr r10,[r10]
|
||||
ldr r9, =HighPal @ palmd
|
||||
and r4, r2, #0xff
|
||||
mov r5, #328
|
||||
lsl r3, #26 @ mdbg << 26
|
||||
mla r11,r4,r5,r11 @ r11 = pmd = PicoDraw2FB + offs*328: md data
|
||||
call_scan_prep \call_scan
|
||||
|
||||
mov r4, #0 @ line
|
||||
b 1f @ loop_outer_entry
|
||||
|
||||
0: @ loop_outer:
|
||||
call_scan_end \call_scan
|
||||
add r4, r4, #1
|
||||
cmp r4, r2, lsr #16
|
||||
call_scan_fin_ge \call_scan
|
||||
ldmgefd sp!, {r4-r11,pc}
|
||||
|
||||
1: @ loop_outer_entry:
|
||||
call_scan_begin \call_scan
|
||||
mov r12,r4, lsl #1
|
||||
ldrh r12,[r1, r12]
|
||||
add r11,r11,#8
|
||||
mov r6, #320/2
|
||||
add r5, r1, r12, lsl #1 @ p32x = dram + dram[l]
|
||||
and r12,r2, #0x100 @ shift
|
||||
add r5, r5, r12,lsr #8
|
||||
|
||||
2: @ loop_inner:
|
||||
@ r4,r6 - counters; r5 - 32x data; r9,r10 - md,32x pal; r11 - md data
|
||||
@ r7,r8,r12,lr - temp
|
||||
tst r5, #1
|
||||
ldreqb r8, [r5], #2
|
||||
ldrb r7, [r5, #-1]
|
||||
ldrneb r8, [r5, #2]! @ r7,r8 - pixel 0,1 index
|
||||
subs r6, r6, #1
|
||||
blt 0b @ loop_outer
|
||||
cmp r7, r8
|
||||
beq 5f @ check_fill @ +8
|
||||
|
||||
3: @ no_fill:
|
||||
mov r12,r7, lsl #1
|
||||
mov lr, r8, lsl #1
|
||||
ldrh r7, [r10,r12]
|
||||
ldrh r8, [r10,lr]
|
||||
add r11,r11,#2
|
||||
|
||||
eor r12,r7, #0x20
|
||||
tst r12,#0x20
|
||||
ldrneb r12,[r11,#-2] @ MD pixel 0
|
||||
eor lr, r8, #0x20
|
||||
cmpne r3, r12, lsl #26 @ MD has bg pixel?
|
||||
.if \do_md
|
||||
mov r12,r12,lsl #1
|
||||
ldrneh r7, [r9, r12] @ t = palmd[pmd[0]]
|
||||
tst lr, #0x20
|
||||
ldrneb lr, [r11,#-1] @ MD pixel 1
|
||||
strh r7, [r0], #2
|
||||
cmpne r3, lr, lsl #26 @ MD has bg pixel?
|
||||
mov lr, lr, lsl #1
|
||||
ldrneh r8, [r9, lr] @ t = palmd[pmd[1]]
|
||||
strh r8, [r0], #2
|
||||
.else
|
||||
streqh r7, [r0]
|
||||
tst lr, #0x20
|
||||
ldrneb lr, [r11,#-1] @ MD pixel 1
|
||||
add r0, r0, #4
|
||||
cmpne r3, lr, lsl #26 @ MD has bg pixel?
|
||||
streqh r8, [r0, #-2]
|
||||
.endif
|
||||
b 2b @ loop_inner
|
||||
|
||||
5: @ check_fill
|
||||
@ count pixels, align if needed
|
||||
bic r12,r5, #1
|
||||
ldrh r12,[r12]
|
||||
orr lr, r7, r7, lsl #8
|
||||
cmp r12,lr
|
||||
bne 3b @ no_fill
|
||||
|
||||
tst r5, #1
|
||||
sub lr, r5, #2 @ starting r5 (32x render data start)
|
||||
addeq r5, r5, #2
|
||||
addne r5, r5, #1 @ add for the check above
|
||||
add r6, r6, #1 @ restore from dec
|
||||
orr r7, r7, r7, lsl #8
|
||||
6:
|
||||
sub r12,r5, lr
|
||||
ldrh r8, [r5], #2
|
||||
cmp r12,r6, lsl #1
|
||||
ldrh r12,[r5], #2
|
||||
bge 7f @ count_done
|
||||
cmp r8, r7
|
||||
cmpeq r12,r7
|
||||
beq 6b
|
||||
|
||||
7: @ count_done
|
||||
sub r5, r5, #4 @ undo readahead
|
||||
|
||||
@ fix alignment and check type
|
||||
sub r8, r5, lr
|
||||
tst r8, #1
|
||||
subne r5, r5, #1
|
||||
subne r8, r8, #1
|
||||
|
||||
and r7, r7, #0xff
|
||||
cmp r8, r6, lsl #1
|
||||
mov r7, r7, lsl #1
|
||||
movgt r8, r6, lsl #1 @ r8=count
|
||||
ldrh r7, [r10,r7]
|
||||
sub r6, r6, r8, lsr #1 @ adjust counter
|
||||
tst r7, #0x20
|
||||
beq 9f @ bg_mode
|
||||
|
||||
add r11,r11,r8
|
||||
8:
|
||||
subs r8, r8, #2
|
||||
strgeh r7, [r0], #2
|
||||
strgeh r7, [r0], #2
|
||||
bgt 8b
|
||||
b 2b @ loop_inner
|
||||
|
||||
9: @ bg_mode:
|
||||
ldrb r12,[r11],#1 @ MD pixel
|
||||
ldrb lr, [r11],#1
|
||||
cmp r3, lr, lsl #26 @ MD has bg pixel?
|
||||
.if \do_md
|
||||
mov r12,r12,lsl #1
|
||||
ldrneh r12,[r9, r12] @ t = palmd[*pmd]
|
||||
moveq r12,r7
|
||||
cmp r3, lr, lsl #26
|
||||
mov lr, lr, lsl #1
|
||||
ldrneh lr, [r9, lr]
|
||||
moveq lr, r7
|
||||
strh r12,[r0], #2
|
||||
strh lr, [r0], #2
|
||||
.else
|
||||
streqh r7, [r0]
|
||||
cmp r3, lr, lsl #26
|
||||
streqh r7, [r0, #2]
|
||||
add r0, r0, #4
|
||||
.endif
|
||||
subs r8, r8, #2
|
||||
bgt 9b @ bg_mode
|
||||
b 2b @ loop_inner
|
||||
.endm
|
||||
|
||||
|
||||
@ run length
|
||||
@ unsigned short *dst, unsigned short *dram, int lines_sft_offs, int mdbg
|
||||
.macro make_do_loop_rl name call_scan do_md
|
||||
.global \name
|
||||
\name:
|
||||
stmfd sp!, {r4-r11,lr}
|
||||
|
||||
ldr r11,=PicoDraw2FB
|
||||
ldr r10,=Pico32xNativePal
|
||||
ldr r11,[r11]
|
||||
ldr r10,[r10]
|
||||
ldr r9, =HighPal @ palmd
|
||||
and r4, r2, #0xff
|
||||
mov r5, #328
|
||||
lsl r3, #26 @ mdbg << 26
|
||||
mla r11,r4,r5,r11 @ r11 = pmd = PicoDraw2FB + offs*328: md data
|
||||
call_scan_prep \call_scan
|
||||
|
||||
mov r4, #0 @ line
|
||||
b 1f @ loop_outer_entry
|
||||
|
||||
0: @ loop_outer:
|
||||
call_scan_end \call_scan
|
||||
add r4, r4, #1
|
||||
sub r11,r11,#1 @ adjust for prev read
|
||||
cmp r4, r2, lsr #16
|
||||
call_scan_fin_ge \call_scan
|
||||
ldmgefd sp!, {r4-r11,pc}
|
||||
|
||||
1: @ loop_outer_entry:
|
||||
call_scan_begin \call_scan
|
||||
mov r12,r4, lsl #1
|
||||
ldrh r12,[r1, r12]
|
||||
add r11,r11,#8
|
||||
mov r6, #320
|
||||
add r5, r1, r12, lsl #1 @ p32x = dram + dram[l]
|
||||
|
||||
2: @ loop_inner:
|
||||
ldrh r8, [r5], #2 @ control word
|
||||
and r12,r8, #0xff
|
||||
mov r12,r12,lsl #1
|
||||
ldrh lr, [r10,r12] @ t = 32x pixel
|
||||
eor lr, lr, #0x20
|
||||
|
||||
3: @ loop_innermost:
|
||||
ldrb r7, [r11], #1 @ MD pixel
|
||||
subs r6, r6, #1
|
||||
blt 0b @ loop_outer
|
||||
cmp r3, r7, lsl #26 @ MD has bg pixel?
|
||||
mov r7, r7, lsl #1
|
||||
tstne lr, #0x20
|
||||
.if \do_md
|
||||
ldrneh r12,[r9, r7] @ t = palmd[*pmd]
|
||||
streqh lr, [r0], #2
|
||||
strneh r12,[r0], #2 @ *dst++ = t
|
||||
.else
|
||||
streqh lr, [r0]
|
||||
add r0, r0, #2
|
||||
.endif
|
||||
subs r8, r8, #0x100
|
||||
bge 3b @ loop_innermost
|
||||
b 2b @ loop_inner
|
||||
.endm
|
||||
|
||||
|
||||
make_do_loop_dc do_loop_dc, 0, 0
|
||||
make_do_loop_dc do_loop_dc_md, 0, 1
|
||||
make_do_loop_dc do_loop_dc_scan, 1, 0
|
||||
make_do_loop_dc do_loop_dc_scan_md, 1, 1
|
||||
|
||||
make_do_loop_pp do_loop_pp, 0, 0
|
||||
make_do_loop_pp do_loop_pp_md, 0, 1
|
||||
make_do_loop_pp do_loop_pp_scan, 1, 0
|
||||
make_do_loop_pp do_loop_pp_scan_md, 1, 1
|
||||
|
||||
make_do_loop_rl do_loop_rl, 0, 0
|
||||
make_do_loop_rl do_loop_rl_md, 0, 1
|
||||
make_do_loop_rl do_loop_rl_scan, 1, 0
|
||||
make_do_loop_rl do_loop_rl_scan_md, 1, 1
|
||||
|
||||
@ vim:filetype=armasm
|
Loading…
Add table
Add a link
Reference in a new issue