mirror of
https://github.com/RaySollium99/picodrive.git
synced 2025-09-06 15:48:05 -04:00
giz wip (acc 16bit faster than 8!)
git-svn-id: file:///home/notaz/opt/svn/PicoDrive@260 be3aeb3a-fb24-0410-a615-afba39da0efa
This commit is contained in:
parent
2ec14aec8f
commit
499a0be394
7 changed files with 201 additions and 50 deletions
145
Pico/Draw.s
145
Pico/Draw.s
|
@ -1647,8 +1647,14 @@ FinalizeLineRGB555:
|
|||
addeq r0, r0, #32*2
|
||||
|
||||
.fl_no32colRGB555:
|
||||
.fl_loopRGB555:
|
||||
|
||||
.if UNALIGNED_DRAWLINEDEST
|
||||
@ this is basically for Gizmondo, which has unaligned odd lines in the framebuffer
|
||||
tst r0, #2
|
||||
bne .fl_RGB555u
|
||||
.endif
|
||||
|
||||
.fl_loopRGB555:
|
||||
ldr r12, [r1], #4
|
||||
ldr r7, [r1], #4
|
||||
|
||||
|
@ -1670,12 +1676,12 @@ FinalizeLineRGB555:
|
|||
ldrh r6, [r3, r6]
|
||||
and r12,lr, r7, lsr #15
|
||||
ldrh r12,[r3, r12]
|
||||
and r7, lr, r7, lsr #23
|
||||
ldrh r7, [r3, r7]
|
||||
orr r8, r8, r6, lsl #16
|
||||
|
||||
and r6, lr, r7, lsr #23
|
||||
ldrh r6, [r3, r6] @ 1 cycle interlock here (r6)
|
||||
subs r2, r2, #1
|
||||
orr r12,r12, r6, lsl #16
|
||||
orr r12,r12, r7, lsl #16
|
||||
|
||||
stmia r0!, {r4,r5,r8,r12}
|
||||
bne .fl_loopRGB555
|
||||
|
@ -1689,6 +1695,11 @@ FinalizeLineRGB555:
|
|||
mov r9, #0x3900 @ f800 07e0 001f | e000 0780 001c | 3800 01e0 0007
|
||||
orr r9, r9, #0x00e7
|
||||
|
||||
.if UNALIGNED_DRAWLINEDEST
|
||||
tst r0, #2
|
||||
bne .fl_32scale_RGB555u
|
||||
.endif
|
||||
|
||||
.fl_loop32scale_RGB555:
|
||||
ldr r12, [r1], #4
|
||||
ldr r7, [r1], #4
|
||||
|
@ -1745,6 +1756,132 @@ FinalizeLineRGB555:
|
|||
ldmfd sp!, {r4-r8,lr}
|
||||
bx lr
|
||||
|
||||
.if UNALIGNED_DRAWLINEDEST
|
||||
@ unaligned versions of loops
|
||||
|
||||
.fl_RGB555u:
|
||||
ldr r12, [r1], #4
|
||||
ldr r7, [r1], #4
|
||||
|
||||
and r4, lr, r12, lsl #1
|
||||
ldrh r4, [r3, r4]
|
||||
and r5, lr, r12, lsr #7
|
||||
ldrh r5, [r3, r5]
|
||||
strh r4, [r0], #2
|
||||
b .fl_loopRGB555u_enter
|
||||
|
||||
.fl_loopRGB555u:
|
||||
ldr r12, [r1], #4
|
||||
ldr r7, [r1], #4
|
||||
|
||||
and r4, lr, r12, lsl #1
|
||||
ldrh r4, [r3, r4]
|
||||
and r5, lr, r12, lsr #7
|
||||
ldrh r5, [r3, r5]
|
||||
|
||||
orr r4, r8, r4, lsl #16
|
||||
str r4, [r0], #4
|
||||
|
||||
.fl_loopRGB555u_enter:
|
||||
and r6, lr, r12, lsr #15
|
||||
ldrh r6, [r3, r6]
|
||||
and r8, lr, r12, lsr #23
|
||||
ldrh r8, [r3, r8]
|
||||
orr r4, r5, r6, lsl #16
|
||||
|
||||
and r5, lr, r7, lsl #1
|
||||
ldrh r5, [r3, r5]
|
||||
and r6, lr, r7, lsr #7
|
||||
ldrh r6, [r3, r6]
|
||||
orr r5, r8, r5, lsl #16
|
||||
|
||||
and r12,lr, r7, lsr #15
|
||||
ldrh r12,[r3, r12]
|
||||
and r8, lr, r7, lsr #23
|
||||
ldrh r8, [r3, r8]
|
||||
orr r6, r6, r12,lsl #16
|
||||
|
||||
subs r2, r2, #1
|
||||
stmia r0!, {r4,r5,r6}
|
||||
bne .fl_loopRGB555u
|
||||
|
||||
strh r8, [r0], #2
|
||||
|
||||
ldmfd sp!, {r4-r8,lr}
|
||||
bx lr
|
||||
|
||||
|
||||
.fl_32scale_RGB555u:
|
||||
|
||||
@ r9 f800 07e0 001f | e000 0780 001c | 3800 01e0 0007
|
||||
.fl_loop32scale_RGB555u:
|
||||
ldr r12, [r1], #4
|
||||
ldr r7, [r1], #4
|
||||
|
||||
and r4, lr, r12,lsl #1
|
||||
ldrh r4, [r3, r4]
|
||||
and r5, lr, r12,lsr #7
|
||||
ldrh r5, [r3, r5]
|
||||
and r4, r4, r9, lsl #2
|
||||
@ orr r4, rx, r4, lsl #16
|
||||
str r4, [r0], #4 @ pix_d -1, 0
|
||||
|
||||
.fl_loop32scale_RGB555u_enter:
|
||||
and r4, r9, r4, lsr #2 @ r4=1/4 pix_s 0
|
||||
|
||||
and r5, r5, r9, lsl #2
|
||||
sub r6, r5, r5, lsr #2 @ r6 = 3/4 pix_s 1
|
||||
add r4, r6, r4, lsr #2 @ r4=(1/4 pix_s 0) + (3/4 pix_s 1)
|
||||
orr r4, r4, r5, lsl #15
|
||||
|
||||
and r6, lr, r12,lsr #15
|
||||
ldrh r6, [r3, r6]
|
||||
and r12,lr, r12,lsr #23
|
||||
ldrh r12,[r3, r12]
|
||||
and r6, r6, r9, lsl #2
|
||||
add r4, r4, r6, lsl #15 @ pix_d 1, 2
|
||||
|
||||
@@ TODO...
|
||||
|
||||
mov r5, r5, lsr #1
|
||||
sub r6, r6, r6, lsr #2 @ r6 = 3/4 pix_s 2
|
||||
orr r5, r5, r6, lsl #16
|
||||
|
||||
and r6, lr, r7, lsl #1
|
||||
ldrh r6, [r3, r6]
|
||||
and r12,r12,r9, lsl #2
|
||||
add r5, r5, r12,lsl #14 @ pix_d 2, 3
|
||||
and r6, r6, r9, lsl #2
|
||||
orr r6, r12,r6, lsl #16 @ pix_d 4, 5
|
||||
|
||||
and r12,lr, r7, lsr #7
|
||||
ldrh r12,[r3, r12]
|
||||
and r10,lr, r7, lsr #15
|
||||
ldrh r10,[r3, r10]
|
||||
and r12,r12,r9, lsl #2
|
||||
sub r8, r12,r12,lsr #2 @ r8 = 3/4 pix_s 1
|
||||
add r8, r8, r6, lsr #18
|
||||
and r7, lr, r7, lsr #23
|
||||
ldrh r7, [r3, r7]
|
||||
and r10,r10,r9, lsl #2
|
||||
orr r8, r8, r10,lsl #15
|
||||
add r8, r8, r12,lsl #15 @ pix_d 6, 7
|
||||
sub r10,r10,r10,lsr #2 @ r10= 3/4 pix_s 2
|
||||
and r7, r7, r9, lsl #2
|
||||
add r10,r10,r7, lsr #2 @ += 1/4 pix_s 3
|
||||
orr r10,r10,r7, lsl #16 @ pix_d 8, 9
|
||||
|
||||
subs r2, r2, #1
|
||||
|
||||
stmia r0!, {r4,r5,r6,r8,r10}
|
||||
bne .fl_loop32scale_RGB555u
|
||||
|
||||
ldmfd sp!, {r9,r10}
|
||||
ldmfd sp!, {r4-r8,lr}
|
||||
bx lr
|
||||
|
||||
.endif @ UNALIGNED_DRAWLINEDEST
|
||||
|
||||
|
||||
@ @@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue