mirror of
https://git.code.sf.net/p/quake/quakeforge-old
synced 2024-11-25 05:11:23 +00:00
c3f5581b0a
Unchained, Ultimate, Ultra, Up Yours, Underworld, Underground, Unified, Unity, etc. You know the drill. This takes care of the "standalone" problem with the wrong name, and the recent snafu with multiple developers working on the same files simultaneously...expect me (and probably others) to start locking dirs when updates are taking place. And yes, this update is really as large as it looks. Software only at the moment, but I will have the makefile updated to build the GL builds as well.
149 lines
2.5 KiB
ArmAsm
149 lines
2.5 KiB
ArmAsm
//
// d_copy.s
// x86 assembly-language screen copying code.
//
// Syntax: GNU as, AT&T operand order, run through the C preprocessor.
// Target: 32-bit x86, arguments passed on the stack.
//

#include "asm_i386.h"
#include "quakeasm.h"
#include "asm_draw.h"

	.data

// Scratch values for VGA_UpdatePlanarScreen.  They are recomputed on every
// call and kept in memory because the copy loops use every general-purpose
// register.
LCopyWidth:		.long	0	// 16-pixel groups per row (VGA_width >> 4)
LBlockSrcStep:	.long	0	// VGA_bufferrowbytes * 2 (one row pair of source)
LBlockDestStep:	.long	0	// VGA_rowbytes * 2 (one row pair of destination)
LSrcDelta:		.long	0	// VGA_bufferrowbytes - VGA_width
LDestDelta:		.long	0	// added to the dest pointer after each plane row

// Stack offset of the single argument of VGA_UpdatePlanarScreen:
// 4 bytes of return address plus 16 bytes of saved registers.
#define bufptr	4+16

// The planar copy handles a small group of rows for one plane, then the same
// rows for each of the other three planes, so that the source data read for
// the first plane is still in the cache for the passes for the next 3 planes.
// NOTE(review): this comment originally read "copies 16 rows per plane at a
// pop; idea is that 16*512 = 8k, and since no Mode X mode is wider than 360,
// all the data should fit in the cache", but the code below copies 2 rows per
// plane pass (row counter loaded with 2, VGA_height >> 1 iterations).

	.text

//----------------------------------------------------------------------
// VGA_UpdatePlanarScreen
//
// Copies a linear, one-byte-per-pixel source buffer into a four-plane
// destination starting at VGA_pagebase.
//
// In:    one stack argument at bufptr(%esp): pointer to the source buffer
//        (presumably declared in C as taking a single pointer -- confirm
//        against the caller)
//        globals read: VGA_pagebase, VGA_width, VGA_height,
//        VGA_rowbytes (destination stride), VGA_bufferrowbytes (source
//        stride)
// Out:   nothing
// Saves: ebp, edi, esi, ebx.  Clobbers eax, ecx, edx and the flags.
// Ports: writes index 2 to 0x3C4 once, then a plane mask (1, 2, 4, 8) to
//        0x3C5 before each plane pass.
//
// Work is done two rows at a time: for each row pair, each of the four
// planes in turn receives every fourth source pixel of both rows.
//
// Preconditions (not checked here):
//   - VGA_height >= 2; only VGA_height >> 1 row pairs are copied, so an odd
//     final row is not copied.
//   - VGA_width >= 16; pixels are moved in groups of 16, and a zero group
//     count would wrap the column counter.
//   - NOTE(review): VGA_width is presumably a multiple of 16; the row
//     deltas are computed from the full width while the column loop only
//     consumes whole 16-pixel groups.
//----------------------------------------------------------------------
.globl C(VGA_UpdatePlanarScreen)
C(VGA_UpdatePlanarScreen):
	pushl	%ebp				// preserve caller's stack frame
	pushl	%edi
	pushl	%esi				// preserve register variables
	pushl	%ebx

// byte distance from one row pair to the next, source and destination
	movl	C(VGA_bufferrowbytes),%eax
	shll	$1,%eax
	movl	%eax,LBlockSrcStep
	movl	C(VGA_rowbytes),%eax
	shll	$1,%eax
	movl	%eax,LBlockDestStep

	movl	$0x3C4,%edx
	movb	$2,%al
	outb	%al,%dx		// point the SC to the Map Mask
	incl	%edx		// edx = 0x3C5, written with the plane mask below

	movl	bufptr(%esp),%esi	// esi = source pointer
	movl	C(VGA_pagebase),%edi	// edi = destination pointer
	movl	C(VGA_height),%ebp
	shrl	$1,%ebp			// ebp = row pairs left to copy

	movl	C(VGA_width),%ecx
	movl	C(VGA_bufferrowbytes),%eax
	subl	%ecx,%eax
	movl	%eax,LSrcDelta		// source: end of row -> start of next row

// One plane row advances the destination by VGA_width / 4 bytes (4 bytes
// stored per 16 source pixels), and row pairs are VGA_rowbytes * 2 apart,
// so the gap to the next destination row is VGA_rowbytes - VGA_width / 4.
// This used to be computed as VGA_rowbytes * 4 - VGA_width, which is four
// times too large and only correct (zero) when the destination stride has
// no padding.  ebx is free here: the column loop rewrites all of it before
// it is read.
	movl	C(VGA_rowbytes),%eax
	movl	%ecx,%ebx
	shrl	$2,%ebx
	subl	%ebx,%eax
	movl	%eax,LDestDelta
	shrl	$4,%ecx
	movl	%ecx,LCopyWidth		// 16-pixel groups per row

LRowLoop:
	movb	$1,%al			// plane mask, starts at plane 0

LPlaneLoop:
	outb	%al,%dx			// select the plane to write
	movb	$2,%ah			// rows per plane pass

	pushl	%esi			// every plane starts from the same rows
	pushl	%edi
LRowSetLoop:
	movl	LCopyWidth,%ecx
LColumnLoop:
// gather source bytes 0, 4, 8 and 12 into one dword, byte 0 lowest
	movb	12(%esi),%bh
	movb	8(%esi),%bl
	shll	$16,%ebx
	movb	4(%esi),%bh
	movb	(%esi),%bl
	movl	%ebx,(%edi)
	addl	$16,%esi
	addl	$4,%edi
	decl	%ecx
	jnz		LColumnLoop

	addl	LDestDelta,%edi
	addl	LSrcDelta,%esi
	decb	%ah
	jnz		LRowSetLoop

	popl	%edi
	popl	%esi
	incl	%esi			// next plane starts one pixel further on

	shlb	$1,%al
	cmpb	$16,%al			// mask 1,2,4,8 done once it reaches 16
	jnz		LPlaneLoop

	subl	$4,%esi			// undo the four per-plane increments
	addl	LBlockSrcStep,%esi
	addl	LBlockDestStep,%edi
	decl	%ebp
	jnz		LRowLoop

	popl	%ebx				// restore register variables
	popl	%esi
	popl	%edi
	popl	%ebp				// restore the caller's stack frame

	ret


// Stack offsets of the arguments of VGA_UpdateLinearScreen: 4 bytes of
// return address plus 16 bytes of saved registers, then the arguments in
// order.
#define srcptr			4+16
#define destptr			8+16
#define width			12+16
#define height			16+16
#define srcrowbytes		20+16
#define destrowbytes	24+16

//----------------------------------------------------------------------
// VGA_UpdateLinearScreen
//
// Copies a rectangle of bytes, row by row, between two linear buffers
// that may have different strides.
//
// In (stack, in this order): source pointer, destination pointer, width
//        in bytes, height in rows, source stride, destination stride.
//        NOTE(review): presumably two pointers and four ints on the C
//        side -- confirm against the prototype.
// Out:   nothing
// Saves: ebp, edi, esi, ebx.  Clobbers eax, ecx, edx and the flags; the
//        direction flag is left clear.
//
// Each row is copied as width / 4 dwords followed by width % 4 bytes.
// A height of zero or less copies nothing.
//----------------------------------------------------------------------
.globl C(VGA_UpdateLinearScreen)
C(VGA_UpdateLinearScreen):
	pushl	%ebp				// preserve caller's stack frame
	pushl	%edi
	pushl	%esi				// preserve register variables
	pushl	%ebx

	cld					// string copies move forward
	movl	srcptr(%esp),%esi
	movl	destptr(%esp),%edi
	movl	width(%esp),%ebx
	movl	srcrowbytes(%esp),%eax
	subl	%ebx,%eax		// eax = source: end of row -> next row
	movl	destrowbytes(%esp),%edx
	subl	%ebx,%edx		// edx = dest: end of row -> next row
	shrl	$2,%ebx			// ebx = dwords per row
	movl	height(%esp),%ebp
	testl	%ebp,%ebp
	jle		LLDone			// no rows: the countdown below would wrap

LLRowLoop:
	movl	%ebx,%ecx
// The prefix is written with a space rather than as "rep/movsl": where
// the assembler treats '/' as a comment character, the old spelling
// assembles as a lone rep prefix and the copy itself is dropped.
	rep movsl (%esi),(%edi)
// Copy the 0-3 bytes left over when the width is not a multiple of 4.
// Without this they were skipped and, because eax and edx assume the whole
// width was consumed, both pointers slipped back on every row.  esp has
// not moved since entry, so the argument can be read again directly.
	movl	width(%esp),%ecx
	andl	$3,%ecx
	rep movsb (%esi),(%edi)
	addl	%eax,%esi
	addl	%edx,%edi
	decl	%ebp
	jnz		LLRowLoop

LLDone:
	popl	%ebx				// restore register variables
	popl	%esi
	popl	%edi
	popl	%ebp				// restore the caller's stack frame

	ret
