mirror of
https://git.code.sf.net/p/quake/quake2forge
synced 2025-01-06 09:51:05 +00:00
167 lines
3.3 KiB
ArmAsm
167 lines
3.3 KiB
ArmAsm
/* $Id$
|
|
*
|
|
* x86 assembly-language screen copying code
|
|
*
|
|
* Copyright (C) 1997-2001 Id Software, Inc.
|
|
* Copyright (c) 2002 The Quakeforge Project.
|
|
*
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU General Public License
|
|
* as published by the Free Software Foundation; either version 2
|
|
* of the License, or (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
*/
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
# include "config.h"
|
|
#endif
|
|
#include "qasm.h"
|
|
|
|
.data

// Scratch values filled in at the top of VGA_UpdatePlanarScreen and then
// re-read inside its copy loops.
LCopyWidth:
	.long	0			// VGA_width / 16: inner-loop iterations per row
LBlockSrcStep:
	.long	0			// 2 * VGA_bufferrowbytes
LBlockDestStep:
	.long	0			// 2 * VGA_rowbytes
LSrcDelta:
	.long	0			// VGA_bufferrowbytes - VGA_width
LDestDelta:
	.long	0			// 4 * VGA_rowbytes - VGA_width

// Offset from %esp to the argument VGA_UpdatePlanarScreen reads once it has
// pushed four registers: 4 bytes of return address + 16 bytes of saved
// registers.
#define bufptr	4+16
|
|
|
|
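// copies 2 rows per plane per pass (the row counter in %ah is loaded with 2
// and source/destination are stepped by two rows after each pass). This
// comment originally said "16 rows per plane at a pop"; the stated idea was
// that 16*512 = 8k, and since no Mode X mode is wider than 360, all the data
// should fit in the cache for the passes for the next 3 planes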
|
|
|
|
.text
|
|
|
|
//----------------------------------------------------------------------
// VGA_UpdatePlanarScreen
//
// Copies a linear source buffer into planar video memory at VGA_pagebase.
//
// In:      bufptr(%esp) (after the four pushes below) = source buffer
// Globals: VGA_width, VGA_height, VGA_rowbytes, VGA_bufferrowbytes,
//          VGA_pagebase (read only)
// Scratch: LCopyWidth, LBlockSrcStep, LBlockDestStep, LSrcDelta, LDestDelta
// Saved:   %ebp, %edi, %esi, %ebx; %eax, %ecx and %edx are overwritten
//
// Register roles inside the loops:
//   %esi = source pointer          %edi = destination pointer
//   %ebp = remaining 2-row blocks  %edx = 0x3C5 (data port after 0x3C4)
//   %al  = plane mask (1,2,4,8)    %ah  = rows left in the current block
//   %ecx = inner-loop counter      %ebx = 4 gathered source bytes
//
// Work is done in blocks of two rows; for every block each of the four
// planes is written in turn, taking every 4th source byte starting at
// source offset 0, 1, 2 and 3 respectively.
//----------------------------------------------------------------------
.globl C(VGA_UpdatePlanarScreen)
C(VGA_UpdatePlanarScreen):
	pushl	%ebp				// callee-saved registers; four pushes,
	pushl	%edi				// which is the "+16" in bufptr
	pushl	%esi
	pushl	%ebx

	// ---- per-call constants -------------------------------------
	movl	C(VGA_bufferrowbytes),%eax
	movl	C(VGA_rowbytes),%edx
	movl	C(VGA_width),%ecx

	leal	(%eax,%eax),%ebx		// source step per block: 2 source rows
	movl	%ebx,LBlockSrcStep
	leal	(%edx,%edx),%ebx		// dest step per block: 2 * VGA_rowbytes
	movl	%ebx,LBlockDestStep

	subl	%ecx,%eax			// added to %esi after each copied row
	movl	%eax,LSrcDelta
	leal	(,%edx,4),%eax			// added to %edi after each copied row
	subl	%ecx,%eax
	movl	%eax,LDestDelta

	shrl	$4,%ecx				// one inner iteration eats 16 source bytes
	movl	%ecx,LCopyWidth

	// ---- loop state ---------------------------------------------
	movl	bufptr(%esp),%esi
	movl	C(VGA_pagebase),%edi
	movl	C(VGA_height),%ebp
	shrl	$1,%ebp				// number of 2-row blocks

	movl	$0x3C4,%edx
	movb	$2,%al
	outb	%al,%dx				// point the SC to the Map Mask
	incl	%edx				// %edx = 0x3C5 for the mask writes below

LPlanarBlockLoop:
	movb	$1,%al				// start with plane mask 1

LPlanarPlaneLoop:
	outb	%al,%dx				// write the current plane mask
	movb	$2,%ah				// two rows per block

	pushl	%esi				// every plane restarts from the same
	pushl	%edi				// block origin (source shifted by 1 byte)

LPlanarRowLoop:
	movl	LCopyWidth,%ecx

LPlanarColumnLoop:
	// build one dword out of source bytes 0, 4, 8 and 12 (low to high)
	movb	12(%esi),%bh
	movb	8(%esi),%bl
	shll	$16,%ebx
	movb	4(%esi),%bh
	movb	(%esi),%bl
	movl	%ebx,(%edi)
	addl	$16,%esi
	addl	$4,%edi
	decl	%ecx
	jnz		LPlanarColumnLoop

	addl	LDestDelta,%edi
	addl	LSrcDelta,%esi
	decb	%ah
	jnz		LPlanarRowLoop

	popl	%edi				// back to the block origin
	popl	%esi
	incl	%esi				// next plane starts one source byte later

	shlb	$1,%al				// 1 -> 2 -> 4 -> 8; 16 means all planes done
	cmpb	$16,%al
	jnz		LPlanarPlaneLoop

	subl	$4,%esi				// undo the four per-plane increments
	addl	LBlockSrcStep,%esi
	addl	LBlockDestStep,%edi
	decl	%ebp
	jnz		LPlanarBlockLoop

	popl	%ebx				// restore in reverse push order
	popl	%esi
	popl	%edi
	popl	%ebp

	ret
|
|
|
|
|
|
// Stack offsets of the VGA_UpdateLinearScreen arguments once its four
// register pushes are done: return address (4) + saved registers (16),
// then one 4-byte slot per argument.
#define srcptr			4+16
#define destptr			8+16
#define width			12+16
#define height			16+16
#define srcrowbytes		20+16
#define destrowbytes	24+16

//----------------------------------------------------------------------
// VGA_UpdateLinearScreen
//
// Copies a rectangle of `height` rows of `width` bytes from srcptr to
// destptr, advancing by srcrowbytes / destrowbytes between rows.
//
// In (stack, in this order): srcptr, destptr, width, height,
//                            srcrowbytes, destrowbytes
// Saved:   %ebp, %edi, %esi, %ebx; %eax, %ecx and %edx are overwritten
// Flags:   direction flag is cleared (cld) and left clear
//
// Register roles inside the loop:
//   %esi = source pointer        %edi = destination pointer
//   %ebx = dwords per row        %ebp = rows remaining
//   %eax = srcrowbytes - width   %edx = destrowbytes - width
//
// Notes:
//  * The string copy is written "rep movsl" rather than "rep/movsl": on
//    assembler targets where '/' begins a comment, the latter silently
//    drops the movsl.
//  * A height of zero or less copies nothing instead of letting the row
//    counter wrap around.
//  * Widths that are not a multiple of 4 are copied completely: the
//    leftover 1-3 bytes are moved with rep movsb, which also keeps the
//    row pointers exact. For multiples of 4 that step copies nothing.
//----------------------------------------------------------------------
.globl C(VGA_UpdateLinearScreen)
C(VGA_UpdateLinearScreen):
	pushl	%ebp				// preserve caller's stack frame
	pushl	%edi
	pushl	%esi				// preserve register variables
	pushl	%ebx

	cld					// string ops must count upwards
	movl	srcptr(%esp),%esi
	movl	destptr(%esp),%edi
	movl	width(%esp),%ebx
	movl	srcrowbytes(%esp),%eax
	subl	%ebx,%eax			// gap after each source row
	movl	destrowbytes(%esp),%edx
	subl	%ebx,%edx			// gap after each destination row
	shrl	$2,%ebx				// bytes -> whole dwords per row
	movl	height(%esp),%ebp
	testl	%ebp,%ebp
	jle		LLDone				// nothing to copy for height <= 0

LLRowLoop:
	movl	%ebx,%ecx
	rep movsl				// whole dwords of this row
	movl	width(%esp),%ecx
	andl	$3,%ecx
	rep movsb				// remaining 0-3 bytes of this row
	addl	%eax,%esi
	addl	%edx,%edi
	decl	%ebp
	jnz		LLRowLoop

LLDone:
	popl	%ebx				// restore register variables
	popl	%esi
	popl	%edi
	popl	%ebp				// restore the caller's stack frame

	ret
|
|
|