mirror of
https://github.com/ZDoom/Raze.git
synced 2024-11-16 09:21:36 +00:00
a6e60e9723
git-svn-id: https://svn.eduke32.com/eduke32@7146 1a8010ca-5511-0410-912e-c29ae57300e0
2918 lines
57 KiB
NASM
2918 lines
57 KiB
NASM
; "Build Engine & Tools" Copyright (c) 1993-1997 Ken Silverman
|
|
; Ken Silverman's official web site: "http://www.advsys.net/ken"
|
|
; See the included license file "BUILDLIC.TXT" for license info.
|
|
;
|
|
; This file has been modified from Ken Silverman's original release
|
|
; by Jonathon Fowler (jf@jonof.id.au)
|
|
; by the EDuke32 team (development@voidpoint.com)
|
|
|
|
%ifidn __OUTPUT_FORMAT__, x64
|
|
%define ASM_x86_64
|
|
%elifidn __OUTPUT_FORMAT__, win64
|
|
%define ASM_x86_64
|
|
%elifidn __OUTPUT_FORMAT__, elf64
|
|
%define ASM_x86_64
|
|
%elifidn __OUTPUT_FORMAT__, macho64
|
|
%define ASM_x86_64
|
|
%elifidn __OUTPUT_FORMAT__, win32
|
|
%define ASM_x86
|
|
%elifidn __OUTPUT_FORMAT__, elf32
|
|
%define ASM_x86
|
|
%elifidn __OUTPUT_FORMAT__, macho32
|
|
%define ASM_x86
|
|
%elifidn __OUTPUT_FORMAT__, win
|
|
%define ASM_x86
|
|
%elifidn __OUTPUT_FORMAT__, elf
|
|
%define ASM_x86
|
|
%elifidn __OUTPUT_FORMAT__, macho
|
|
%define ASM_x86
|
|
%endif
|
|
|
|
%ifdef ASM_x86
|
|
|
|
;CPU 586
|
|
|
|
SECTION .text
|
|
|
|
%ifdef UNDERSCORES
|
|
%define asm1 _asm1
|
|
%define asm2 _asm2
|
|
%define asm3 _asm3
|
|
%define asm4 _asm4
|
|
%define reciptable _reciptable
|
|
%define fpuasm _fpuasm
|
|
%define globalx3 _globalx3
|
|
%define globaly3 _globaly3
|
|
%define ylookup _ylookup
|
|
%define vplce _vplce
|
|
%define vince _vince
|
|
%define palookupoffse _palookupoffse
|
|
%define bufplce _bufplce
|
|
%define ebpbak _ebpbak
|
|
%define espbak _espbak
|
|
%define globaltilesizy _globaltilesizy
|
|
|
|
%define sethlinesizes _sethlinesizes
|
|
%define prosethlinesizes _prosethlinesizes
|
|
%define setvlinebpl _setvlinebpl
|
|
%define setpalookupaddress _setpalookupaddress
|
|
%define prosetpalookupaddress _prosetpalookupaddress
|
|
%define setuphlineasm4 _setuphlineasm4
|
|
%define hlineasm4 _hlineasm4
|
|
%define prohlineasm4 _prohlineasm4
|
|
%define prosetuphlineasm4 _prosetupvlineasm
|
|
%define setupmvlineasm _setupmvlineasm
|
|
%define setuptvlineasm _setuptvlineasm
|
|
%define prevlineasm1 _prevlineasm1
|
|
%define vlineasm1 _vlineasm1
|
|
%define vlineasm1nonpow2 _vlineasm1nonpow2
|
|
%define mvlineasm1 _mvlineasm1
|
|
%define mvlineasm1nonpow2 _mvlineasm1nonpow2
|
|
%define fixtransluscence _fixtransluscence
|
|
%define settransnormal _settransnormal
|
|
%define settransreverse _settransreverse
|
|
%define tvlineasm1 _tvlineasm1
|
|
%define tvlineasm1nonpow2 _tvlineasm1nonpow2
|
|
%define vlineasm4 _vlineasm4
|
|
%define provlineasm4 _provlineasm4
|
|
%define setupvlineasm _setupvlineasm
|
|
%define mvlineasm4 _mvlineasm4
|
|
%define setupspritevline _setupspritevline
|
|
%define spritevline _spritevline
|
|
%define msetupspritevline _msetupspritevline
|
|
%define mspritevline _mspritevline
|
|
%define tsetupspritevline _tsetupspritevline
|
|
%define tspritevline _tspritevline
|
|
%define msethlineshift _msethlineshift
|
|
%define mhline _mhline
|
|
%define mhlineskipmodify _mhlineskipmodify
|
|
%define tsethlineshift _tsethlineshift
|
|
%define thline _thline
|
|
%define thlineskipmodify _thlineskipmodify
|
|
%define setuptvlineasm2 _setuptvlineasm2
|
|
%define tvlineasm2 _tvlineasm2
|
|
%define setupslopevlin2 _setupslopevlin2
|
|
;%define slopevlin2 _slopevlin2
|
|
%define setupslopevlin _setupslopevlin
|
|
%define slopevlin _slopevlin
|
|
%define setuprhlineasm4 _setuprhlineasm4
|
|
%define rhlineasm4 _rhlineasm4
|
|
%define setuprmhlineasm4 _setuprmhlineasm4
|
|
%define rmhlineasm4 _rmhlineasm4
|
|
%define setupqrhlineasm4 _setupqrhlineasm4
|
|
%define qrhlineasm4 _qrhlineasm4
|
|
%define setupdrawslab _setupdrawslab
|
|
%define drawslab _drawslab
|
|
;%define stretchhline _stretchhline
|
|
%define mmxoverlay _mmxoverlay
|
|
|
|
%define dep_begin _dep_begin
|
|
%define dep_end _dep_end
|
|
%endif
|
|
|
|
; Some macros to help make cdecl calling easier to manage
|
|
%macro CDECLBEGIN 1
|
|
%if %1 >= 2
|
|
push ebx
|
|
%endif
|
|
%if %1 >= 3
|
|
push ecx
|
|
%endif
|
|
%if %1 >= 4
|
|
push edx
|
|
%endif
|
|
%if %1 >= 5
|
|
push esi
|
|
%endif
|
|
%if %1 >= 6
|
|
push edi
|
|
%endif
|
|
%endmacro
|
|
|
|
%macro CDECLEND 1
|
|
%if %1 >= 6
|
|
pop edi
|
|
%endif
|
|
%if %1 >= 5
|
|
pop esi
|
|
%endif
|
|
%if %1 >= 4
|
|
pop edx
|
|
%endif
|
|
%if %1 >= 3
|
|
pop ecx
|
|
%endif
|
|
%if %1 >= 2
|
|
pop ebx
|
|
%endif
|
|
%endmacro
|
|
|
|
%macro CDECLPARAM 3
|
|
; mov %1, dword [esp + (%2*4+16)]
|
|
mov %1, dword [esp + ((%2+%3)*4+4)]
|
|
%endmacro
|
|
|
|
%macro CDECLBEGINSET 1
|
|
CDECLBEGIN %1
|
|
|
|
%assign _offsetted %1-1
|
|
|
|
%if %1 >= 1
|
|
CDECLPARAM eax,0,_offsetted
|
|
%endif
|
|
%if %1 >= 2
|
|
CDECLPARAM ebx,1,_offsetted
|
|
%endif
|
|
%if %1 >= 3
|
|
CDECLPARAM ecx,2,_offsetted
|
|
%endif
|
|
%if %1 >= 4
|
|
CDECLPARAM edx,3,_offsetted
|
|
%endif
|
|
%if %1 >= 5
|
|
CDECLPARAM esi,4,_offsetted
|
|
%endif
|
|
%if %1 >= 6
|
|
CDECLPARAM edi,5,_offsetted
|
|
%endif
|
|
%endmacro
|
|
|
|
%macro CDECLENDSET 1
|
|
CDECLEND %1
|
|
%endmacro
|
|
|
|
|
|
EXTERN asm1
|
|
EXTERN asm2
|
|
EXTERN asm3
|
|
EXTERN asm4
|
|
EXTERN reciptable
|
|
EXTERN fpuasm
|
|
EXTERN globalx3
|
|
EXTERN globaly3
|
|
EXTERN ylookup
|
|
|
|
EXTERN vplce
|
|
EXTERN vince
|
|
EXTERN palookupoffse
|
|
EXTERN bufplce
|
|
|
|
EXTERN ebpbak
|
|
EXTERN espbak
|
|
|
|
EXTERN globaltilesizy
|
|
|
|
GLOBAL sethlinesizes
|
|
GLOBAL prosethlinesizes
|
|
GLOBAL setvlinebpl
|
|
GLOBAL setpalookupaddress
|
|
GLOBAL prosetpalookupaddress
|
|
GLOBAL setuphlineasm4
|
|
GLOBAL hlineasm4
|
|
GLOBAL prohlineasm4
|
|
GLOBAL prosetupvlineasm
|
|
GLOBAL setupmvlineasm
|
|
GLOBAL setuptvlineasm
|
|
GLOBAL prevlineasm1
|
|
GLOBAL vlineasm1
|
|
GLOBAL vlineasm1nonpow2
|
|
GLOBAL mvlineasm1 ;Masked vline
|
|
GLOBAL mvlineasm1nonpow2 ;Masked vline, non-power-of-2
|
|
GLOBAL fixtransluscence
|
|
GLOBAL settransnormal
|
|
GLOBAL settransreverse
|
|
GLOBAL tvlineasm1 ;Masked & transluscent vline
|
|
GLOBAL tvlineasm1nonpow2 ;Masked & transluscent vline, non-power-of-2
|
|
GLOBAL vlineasm4
|
|
GLOBAL provlineasm4
|
|
GLOBAL setupvlineasm
|
|
GLOBAL mvlineasm4
|
|
GLOBAL setupspritevline
|
|
GLOBAL spritevline
|
|
GLOBAL msetupspritevline
|
|
GLOBAL mspritevline
|
|
GLOBAL tsetupspritevline
|
|
GLOBAL tspritevline
|
|
GLOBAL msethlineshift
|
|
GLOBAL mhline
|
|
GLOBAL mhlineskipmodify
|
|
GLOBAL tsethlineshift
|
|
GLOBAL thline
|
|
GLOBAL thlineskipmodify
|
|
GLOBAL setuptvlineasm2
|
|
GLOBAL tvlineasm2
|
|
GLOBAL setupslopevlin2
|
|
; GLOBAL slopevlin2
|
|
GLOBAL setupslopevlin
|
|
GLOBAL slopevlin
|
|
GLOBAL setuprhlineasm4
|
|
GLOBAL rhlineasm4
|
|
GLOBAL setuprmhlineasm4
|
|
GLOBAL rmhlineasm4
|
|
GLOBAL setupqrhlineasm4
|
|
GLOBAL qrhlineasm4 ;4 pixels in 9 cycles! 2.25 cycles/pixel
|
|
GLOBAL setupdrawslab
|
|
GLOBAL drawslab
|
|
; GLOBAL stretchhline
|
|
GLOBAL mmxoverlay
|
|
|
|
GLOBAL dep_begin
|
|
GLOBAL dep_end
|
|
|
|
dep_begin:
|
|
|
|
ALIGN 16
|
|
sethlinesizes:
|
|
CDECLBEGINSET 3
|
|
|
|
mov byte [machxbits1+2], al
|
|
mov byte [machxbits2+2], al
|
|
mov byte [machxbits3+2], al
|
|
neg al
|
|
mov byte [hxsiz1+2], al
|
|
mov byte [hxsiz2+2], al
|
|
mov byte [hxsiz3+2], al
|
|
mov byte [hxsiz4+2], al
|
|
mov byte [machnegxbits1+2], al
|
|
|
|
mov byte [hysiz1+3], bl
|
|
mov byte [hysiz2+3], bl
|
|
mov byte [hysiz3+3], bl
|
|
mov byte [hysiz4+3], bl
|
|
mov byte [hmach3a+2], bl
|
|
mov byte [hmach3b+2], bl
|
|
mov byte [hmach3c+2], bl
|
|
mov byte [hmach3d+2], bl
|
|
|
|
mov dword [hoffs1+2], ecx
|
|
mov dword [hoffs2+2], ecx
|
|
mov dword [hoffs3+2], ecx
|
|
mov dword [hoffs4+2], ecx
|
|
mov dword [hoffs5+2], ecx
|
|
mov dword [hoffs6+2], ecx
|
|
mov dword [hoffs7+2], ecx
|
|
mov dword [hoffs8+2], ecx
|
|
|
|
push edx ;JBF
|
|
mov edx, -1
|
|
mov cl, al
|
|
sub cl, bl
|
|
shr edx, cl
|
|
mov dword [hmach2a+1], edx
|
|
mov dword [hmach2b+1], edx
|
|
mov dword [hmach2c+1], edx
|
|
mov dword [hmach2d+1], edx
|
|
pop edx ;JBF
|
|
|
|
CDECLENDSET 3
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
prosethlinesizes:
|
|
CDECLBEGINSET 3
|
|
|
|
mov dword [prohbuf-4], ecx
|
|
neg eax
|
|
mov ecx, eax
|
|
sub eax, ebx
|
|
mov byte [prohshru-1], al ;bl = 32-al-bl
|
|
mov eax, -1
|
|
shr eax, cl
|
|
mov ecx, ebx
|
|
shl eax, cl
|
|
mov dword [prohand-4], eax ;((-1>>(-oal))<<obl)
|
|
neg ebx
|
|
mov byte [prohshrv-1], bl ;bl = 32-bl
|
|
|
|
CDECLENDSET 3
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setvlinebpl:
|
|
CDECLBEGINSET 1
|
|
mov dword [np2_fixchain1a+2], eax
|
|
mov dword [np2_fixchain1b+2], eax
|
|
|
|
mov dword [mnp2_fixchain1b+2], eax
|
|
mov dword [tnp2_fixchain1b+2], eax
|
|
|
|
mov dword [fixchain1a+2], eax
|
|
mov dword [fixchain1b+2], eax
|
|
mov dword [fixchain1m+2], eax
|
|
mov dword [fixchain1t+2], eax
|
|
mov dword [fixchain1s+2], eax
|
|
mov dword [mfixchain1s+2], eax
|
|
mov dword [tfixchain1s+2], eax
|
|
mov dword [fixchain2a+2], eax
|
|
mov dword [profixchain2a+2], eax
|
|
mov dword [fixchain2ma+2], eax
|
|
mov dword [fixchain2mb+2], eax
|
|
mov dword [fixchaint2a+1], eax
|
|
mov dword [fixchaint2b+2], eax
|
|
mov dword [fixchaint2c+2], eax
|
|
mov dword [fixchaint2d+2], eax
|
|
mov dword [fixchaint2e+2], eax
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setpalookupaddress:
|
|
CDECLBEGINSET 1
|
|
mov dword [pal1+2], eax
|
|
mov dword [pal2+2], eax
|
|
mov dword [pal3+2], eax
|
|
mov dword [pal4+2], eax
|
|
mov dword [pal5+2], eax
|
|
mov dword [pal6+2], eax
|
|
mov dword [pal7+2], eax
|
|
mov dword [pal8+2], eax
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
prosetpalookupaddress:
|
|
CDECLBEGINSET 1
|
|
mov dword [prohpala-4], eax
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setuphlineasm4:
|
|
CDECLBEGINSET 2
|
|
|
|
machxbits3: rol eax, 6 ;xbits
|
|
mov dword [hmach4a+2], eax
|
|
mov dword [hmach4b+2], eax
|
|
mov bl, al
|
|
mov dword [hmach4c+2], eax
|
|
mov dword [hmach4d+2], eax
|
|
mov dword [hmach1a+2], ebx
|
|
mov dword [hmach1b+2], ebx
|
|
mov dword [hmach1c+2], ebx
|
|
mov dword [hmach1d+2], ebx
|
|
|
|
CDECLENDSET 2
|
|
ret
|
|
|
|
;Non-256-stuffed ceiling&floor method with NO SHLD!:
|
|
;yinc&0xffffff00 lea eax, [edx+88888800h] 1 1/2
|
|
;ybits...xbits and edx, 88000088h 1 1/2
|
|
;ybits rol edx, 6 2 1/2
|
|
;xinc<<xbits add esi, 88888888h 1 1/2
|
|
;xinc>>(32-xbits) adc al, 88h 1 1/2
|
|
;bufplc mov cl, byte [edx+88888888h] 1 1/2
|
|
;paloffs&255 mov bl, byte [ecx+88888888h] 1 1/2
|
|
ALIGN 16
|
|
hlineasm4:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
|
|
lea ebp, [eax+1]
|
|
|
|
cmp ebp, 8
|
|
jle near shorthline
|
|
|
|
test edi, 1
|
|
jnz short skipthe1byte
|
|
|
|
mov eax, esi
|
|
hxsiz1: shr eax, 26
|
|
hysiz1: shld eax, edx, 6
|
|
hoffs1: mov cl, byte [eax+88888888h]
|
|
pal1: mov bl, byte [ecx+88888888h]
|
|
sub esi, dword [asm1]
|
|
sub edx, dword [asm2]
|
|
mov byte [edi], bl
|
|
dec edi
|
|
dec ebp
|
|
|
|
skipthe1byte:
|
|
test edi, 2
|
|
jnz short skipthe2byte
|
|
|
|
mov eax, esi
|
|
hxsiz2: shr eax, 26
|
|
hysiz2: shld eax, edx, 6
|
|
hoffs2: mov cl, byte [eax+88888888h]
|
|
pal2: mov bh, byte [ecx+88888888h]
|
|
sub esi, dword [asm1]
|
|
sub edx, dword [asm2]
|
|
|
|
mov eax, esi
|
|
hxsiz3: shr eax, 26
|
|
hysiz3: shld eax, edx, 6
|
|
hoffs3: mov cl, byte [eax+88888888h]
|
|
pal3: mov bl, byte [ecx+88888888h]
|
|
sub esi, dword [asm1]
|
|
sub edx, dword [asm2]
|
|
mov word [edi-1], bx
|
|
sub edi, 2
|
|
sub ebp, 2
|
|
|
|
skipthe2byte:
|
|
|
|
mov eax, esi
|
|
machxbits1: shl esi, 6 ;xbits
|
|
machnegxbits1: shr eax, 32-6 ;32-xbits
|
|
mov dl, al
|
|
|
|
inc edi
|
|
|
|
add ebx, ebx
|
|
mov eax, edx
|
|
jc beginhline64
|
|
|
|
mov eax, dword [asm1]
|
|
machxbits2: rol eax, 6 ;xbits
|
|
mov dword [hmach4a+2], eax
|
|
mov dword [hmach4b+2], eax
|
|
mov dword [hmach4c+2], eax
|
|
mov dword [hmach4d+2], eax
|
|
mov ebx, eax
|
|
mov eax, dword [asm2]
|
|
mov al, bl
|
|
mov dword [hmach1a+2], eax
|
|
mov dword [hmach1b+2], eax
|
|
mov dword [hmach1c+2], eax
|
|
mov dword [hmach1d+2], eax
|
|
|
|
mov eax, edx
|
|
jmp beginhline64
|
|
ALIGN 16
|
|
prebeginhline64:
|
|
mov dword [edi], ebx
|
|
beginhline64:
|
|
|
|
hmach3a: rol eax, 6
|
|
hmach2a: and eax, 00008888h
|
|
hmach4a: sub esi, 88888888h
|
|
hmach1a: sbb edx, 88888888h
|
|
sub edi, 4
|
|
hoffs4: mov cl, byte [eax+88888888h]
|
|
mov eax, edx
|
|
|
|
hmach3b: rol eax, 6
|
|
hmach2b: and eax, 00008888h
|
|
hmach4b: sub esi, 88888888h
|
|
hmach1b: sbb edx, 88888888h
|
|
pal4: mov bh, byte [ecx+88888888h]
|
|
hoffs5: mov cl, byte [eax+88888888h]
|
|
mov eax, edx
|
|
|
|
hmach3c: rol eax, 6
|
|
pal5: mov bl, byte [ecx+88888888h]
|
|
hmach2c: and eax, 00008888h
|
|
shl ebx, 16
|
|
hmach4c: sub esi, 88888888h
|
|
hmach1c: sbb edx, 88888888h
|
|
hoffs6: mov cl, byte [eax+88888888h]
|
|
|
|
mov eax, edx
|
|
;(
|
|
|
|
hmach3d: rol eax, 6
|
|
hmach2d: and eax, 00008888h
|
|
hmach4d: sub esi, 88888888h
|
|
hmach1d: sbb edx, 88888888h
|
|
pal6: mov bh, byte [ecx+88888888h]
|
|
hoffs7: mov cl, byte [eax+88888888h]
|
|
mov eax, edx
|
|
sub ebp, 4
|
|
nop
|
|
pal7: mov bl, byte [ecx+88888888h]
|
|
jnc near prebeginhline64
|
|
skipthe4byte:
|
|
|
|
test ebp, 2
|
|
jz skipdrawthe2
|
|
rol ebx, 16
|
|
mov word [edi+2], bx
|
|
sub edi, 2
|
|
skipdrawthe2:
|
|
test ebp, 1
|
|
jz skipdrawthe1
|
|
shr ebx, 24
|
|
mov byte [edi+3], bl
|
|
skipdrawthe1:
|
|
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
shorthline:
|
|
test ebp, ebp
|
|
jz endshorthline
|
|
begshorthline:
|
|
mov eax, esi
|
|
hxsiz4: shr eax, 26
|
|
hysiz4: shld eax, edx, 6
|
|
hoffs8: mov cl, byte [eax+88888888h]
|
|
pal8: mov bl, byte [ecx+88888888h]
|
|
sub esi, dword [asm1]
|
|
sub edx, dword [asm2]
|
|
mov byte [edi], bl
|
|
dec edi
|
|
dec ebp
|
|
jnz near begshorthline
|
|
endshorthline:
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
;eax: 00000000 00000000 00000000 temp----
|
|
;ebx: 00000000 00000000 00000000 temp----
|
|
;ecx: UUUUUUuu uuuuuuuu uuuuuuuu uuuuuuuu
|
|
;edx: VVVVVVvv vvvvvvvv vvvvvvvv vvvvvvvv
|
|
;esi: cnt----- -------- -------- --------
|
|
;edi: vid----- -------- -------- --------
|
|
;ebp: paloffs- -------- -------- --------
|
|
;esp: ???????? ???????? ???????? ????????
|
|
ALIGN 16
|
|
prohlineasm4:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
|
|
lea ebp, [ecx+88888888h]
|
|
prohpala:
|
|
mov ecx, esi
|
|
lea esi, [eax+1]
|
|
sub edi, esi
|
|
|
|
prohbeg:
|
|
mov eax, ecx
|
|
shr eax, 20
|
|
prohshru:
|
|
mov ebx, edx
|
|
shr ebx, 26
|
|
prohshrv:
|
|
and eax, 88888888h
|
|
prohand:
|
|
movzx eax, byte [eax+ebx+88888888h]
|
|
prohbuf:
|
|
mov al, [eax+ebp]
|
|
sub ecx, dword [asm1]
|
|
sub edx, dword [asm2]
|
|
mov [edi+esi], al
|
|
dec esi
|
|
jnz prohbeg
|
|
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
|
|
ALIGN 16
|
|
setupvlineasm:
|
|
CDECLBEGINSET 1
|
|
;First 2 lines for VLINEASM1, rest for VLINEASM4
|
|
mov byte [premach3a+2], al
|
|
mov byte [mach3a+2], al
|
|
|
|
push ecx
|
|
mov byte [machvsh1+2], al ;32-shy
|
|
mov byte [machvsh3+2], al ;32-shy
|
|
mov byte [machvsh5+2], al ;32-shy
|
|
mov byte [machvsh6+2], al ;32-shy
|
|
mov ah, al
|
|
sub ah, 16
|
|
mov byte [machvsh8+2], ah ;16-shy
|
|
neg al
|
|
mov byte [machvsh7+2], al ;shy
|
|
mov byte [machvsh9+2], al ;shy
|
|
mov byte [machvsh10+2], al ;shy
|
|
mov byte [machvsh11+2], al ;shy
|
|
mov byte [machvsh12+2], al ;shy
|
|
mov cl, al
|
|
mov eax, 1
|
|
shl eax, cl
|
|
dec eax
|
|
mov dword [machvsh2+2], eax ;(1<<shy)-1
|
|
mov dword [machvsh4+2], eax ;(1<<shy)-1
|
|
pop ecx
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
prosetupvlineasm:
|
|
CDECLBEGINSET 1
|
|
;First 2 lines for VLINEASM1, rest for VLINEASM4
|
|
mov byte [premach3a+2], al
|
|
mov byte [mach3a+2], al
|
|
|
|
push ecx
|
|
mov byte [promachvsh1+2], al ;32-shy
|
|
mov byte [promachvsh3+2], al ;32-shy
|
|
mov byte [promachvsh5+2], al ;32-shy
|
|
mov byte [promachvsh6+2], al ;32-shy
|
|
mov ah, al
|
|
sub ah, 16
|
|
mov byte [promachvsh8+2], ah ;16-shy
|
|
neg al
|
|
mov byte [promachvsh7+2], al ;shy
|
|
mov byte [promachvsh9+2], al ;shy
|
|
mov byte [promachvsh10+2], al ;shy
|
|
mov byte [promachvsh11+2], al ;shy
|
|
mov byte [promachvsh12+2], al ;shy
|
|
mov cl, al
|
|
mov eax, 1
|
|
shl eax, cl
|
|
dec eax
|
|
mov dword [promachvsh2+2], eax ;(1<<shy)-1
|
|
mov dword [promachvsh4+2], eax ;(1<<shy)-1
|
|
pop ecx
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setupmvlineasm:
|
|
;; NOTE: We actually receive two args (second one: saturate vplc?), but the
|
|
;; second one is currently unused here. See the others: UNUSED_DO_SATURATE.
|
|
CDECLBEGINSET 1
|
|
mov byte [maskmach3a+2], al
|
|
mov byte [machmv13+2], al
|
|
mov byte [machmv14+2], al
|
|
mov byte [machmv15+2], al
|
|
mov byte [machmv16+2], al
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setuptvlineasm:
|
|
;; UNUSED_DO_SATURATE
|
|
CDECLBEGINSET 1
|
|
mov byte [transmach3a+2], al
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
prevlineasm1:
|
|
CDECLBEGINSET 6
|
|
test ecx, ecx
|
|
jnz vlineasm1_nosetup
|
|
|
|
add eax, edx
|
|
premach3a: shr edx, 32
|
|
mov dl, byte [esi+edx]
|
|
mov cl, byte [ebx+edx]
|
|
mov byte [edi], cl
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
vlineasm1:
|
|
CDECLBEGINSET 6
|
|
vlineasm1_nosetup:
|
|
push ebp
|
|
mov ebp, ebx
|
|
inc ecx
|
|
fixchain1a: sub edi, 320
|
|
beginvline:
|
|
mov ebx, edx
|
|
; Here, the right shift value is supposed to be >= 24,
|
|
; translating into tiles with y sizes <= 256 ...
|
|
; (ebx is what is called "vplc" in the C replacement code.)
|
|
mach3a: shr ebx, 32
|
|
fixchain1b: add edi, 320
|
|
; ... so that the upper 24 bits of ebx are clear here:
|
|
mov bl, byte [esi+ebx]
|
|
add edx, eax
|
|
dec ecx
|
|
mov bl, byte [ebp+ebx]
|
|
mov byte [edi], bl
|
|
jnz short beginvline
|
|
pop ebp
|
|
mov eax, edx
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
vlineasm1nonpow2:
|
|
CDECLBEGINSET 6
|
|
; NOTE: this seems to be not debuggable with valgrind --smc-check=all,
|
|
; a crash reading the dummy address 0xbeeff0XX appears, as if only the
|
|
; low byte has been written into.
|
|
; (Valgrind bug?)
|
|
mov dword [np2_do_palookup+2], ebx
|
|
push ebp
|
|
mov ebp, edx ; ebp: vertical place
|
|
mov ebx, eax ; ebx: vertical increment
|
|
mov eax, dword [globaltilesizy]
|
|
mov dword [np2_beginvline+1], eax
|
|
inc ecx
|
|
np2_fixchain1a: sub edi, 320
|
|
np2_beginvline: ; +1: y tile size
|
|
mov eax, 0x00000123
|
|
mul ebp
|
|
np2_fixchain1b: add edi, 320
|
|
and eax, 0x000000ff
|
|
mov al, byte [esi+edx]
|
|
add ebp, ebx
|
|
dec ecx
|
|
np2_do_palookup: ; +2: addr
|
|
mov al, byte [0xbeeff00d+eax]
|
|
mov byte [edi], al
|
|
jnz short np2_beginvline
|
|
mov eax, ebp
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
mvlineasm1:
|
|
CDECLBEGINSET 6
|
|
push ebp
|
|
mov ebp, ebx
|
|
beginmvline:
|
|
mov ebx, edx
|
|
maskmach3a: shr ebx, 32
|
|
mov bl, byte [esi+ebx]
|
|
cmp bl, 255
|
|
je short skipmask1
|
|
maskmach3c: mov bl, [ebp+ebx]
|
|
mov byte [edi], bl
|
|
skipmask1:
|
|
add edx, eax
|
|
fixchain1m: add edi, 320
|
|
sub ecx, 1
|
|
jnc short beginmvline
|
|
|
|
pop ebp
|
|
mov eax, edx
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
mvlineasm1nonpow2:
|
|
CDECLBEGINSET 6
|
|
mov dword [mnp2_do_palookup+2], ebx
|
|
push ebp
|
|
mov ebp, edx ; ebp: vertical place
|
|
mov ebx, eax ; ebx: vertical increment
|
|
mov eax, dword [globaltilesizy]
|
|
mov dword [mnp2_beginvline+1], eax
|
|
mnp2_beginvline: ; +1: y tile size
|
|
mov eax, 0x00000123
|
|
mul ebp
|
|
and eax, 0x000000ff
|
|
mov al, byte [esi+edx]
|
|
cmp al, 255
|
|
je short mskipmask1
|
|
mnp2_do_palookup: ; +2: addr
|
|
mov al, byte [0xbeeff00d+eax]
|
|
mov byte [edi], al
|
|
mskipmask1:
|
|
add ebp, ebx
|
|
mnp2_fixchain1b: add edi, 320
|
|
sub ecx, 1
|
|
jnc short mnp2_beginvline
|
|
mov eax, ebp
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
fixtransluscence:
|
|
CDECLBEGINSET 1
|
|
mov dword [transmach4+2], eax
|
|
mov dword [tmach1+2], eax
|
|
mov dword [tmach2+2], eax
|
|
mov dword [tmach3+2], eax
|
|
mov dword [tmach4+2], eax
|
|
mov dword [tran2traa+2], eax
|
|
mov dword [tran2trab+2], eax
|
|
mov dword [tran2trac+2], eax
|
|
mov dword [tran2trad+2], eax
|
|
|
|
mov dword [tnmach4+2], eax
|
|
CDECLENDSET 1
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
settransnormal:
|
|
mov byte [transrev0+1], 83h
|
|
mov byte [transrev1+1], 27h
|
|
mov byte [transrev2+1], 3fh
|
|
mov byte [transrev3+1], 98h
|
|
mov byte [transrev4+1], 90h
|
|
mov byte [transrev5+1], 37h
|
|
mov byte [transrev6+1], 90h
|
|
mov word [transrev7+0], 0f38ah
|
|
mov byte [transrev8+1], 90h
|
|
mov word [transrev9+0], 0f78ah
|
|
mov byte [transrev10+1], 0a7h
|
|
mov byte [transrev11+1], 81h
|
|
mov byte [transrev12+2], 9fh
|
|
mov word [transrev13+0], 0dc88h
|
|
mov byte [transrev14+1], 81h
|
|
mov byte [transrev15+1], 9ah
|
|
mov byte [transrev16+1], 0a7h
|
|
mov byte [transrev17+1], 82h
|
|
|
|
mov byte [ntransrev0+1], 80h
|
|
mov byte [ntransrev1+1], 27h
|
|
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
settransreverse:
|
|
mov byte [transrev0+1], 0a3h
|
|
mov byte [transrev1+1], 7h
|
|
mov byte [transrev2+1], 1fh
|
|
mov byte [transrev3+1], 0b8h
|
|
mov byte [transrev4+1], 0b0h
|
|
mov byte [transrev5+1], 17h
|
|
mov byte [transrev6+1], 0b0h
|
|
mov word [transrev7+0], 0d38ah
|
|
mov byte [transrev8+1], 0b0h
|
|
mov word [transrev9+0], 0d78ah
|
|
mov byte [transrev10+1], 87h
|
|
mov byte [transrev11+1], 0a1h
|
|
mov byte [transrev12+2], 87h
|
|
mov word [transrev13+0], 0e388h
|
|
mov byte [transrev14+1], 0a1h
|
|
mov byte [transrev15+1], 0bah
|
|
mov byte [transrev16+1], 87h
|
|
mov byte [transrev17+1], 0a2h
|
|
|
|
mov byte [ntransrev0+1], 0a0h
|
|
mov byte [ntransrev1+1], 7h
|
|
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
tvlineasm1:
|
|
CDECLBEGINSET 6
|
|
push ebp
|
|
mov ebp, eax
|
|
xor eax, eax
|
|
inc ecx
|
|
mov dword [transmach3c+2], ebx
|
|
jmp short begintvline
|
|
ALIGN 16
|
|
begintvline:
|
|
mov ebx, edx
|
|
transmach3a: shr ebx, 32
|
|
mov bl, byte [esi+ebx]
|
|
cmp bl, 255
|
|
je short skiptrans1
|
|
transrev0:
|
|
transmach3c: mov al, [ebx+88888888h]
|
|
transrev1:
|
|
mov ah, byte [edi]
|
|
transmach4: mov al, byte [eax+88888888h] ;_transluc[eax]
|
|
mov byte [edi], al
|
|
skiptrans1:
|
|
add edx, ebp
|
|
fixchain1t: add edi, 320
|
|
dec ecx
|
|
jnz short begintvline
|
|
|
|
pop ebp
|
|
mov eax, edx
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
tvlineasm1nonpow2:
|
|
CDECLBEGINSET 6
|
|
mov dword [tnp2_do_palookup+2], ebx
|
|
push ebp
|
|
mov ebp, edx ; ebp: vertical place
|
|
mov ebx, eax ; ebx: vertical increment
|
|
inc ecx
|
|
mov eax, dword [globaltilesizy]
|
|
mov dword [tnp2_beginvline+1], eax
|
|
tnp2_beginvline: ; +1: y tile size
|
|
mov eax, 0x00000123
|
|
mul ebp
|
|
and eax, 0x000000ff
|
|
mov al, byte [esi+edx]
|
|
cmp al, 255
|
|
je short tskipmask1
|
|
ntransrev0:
|
|
tnp2_do_palookup: ; +2: addr
|
|
mov al, byte [0xbeeff00d+eax]
|
|
ntransrev1:
|
|
mov ah, byte [edi]
|
|
tnmach4: mov al, byte [eax+88888888h] ;_luc[eax]
|
|
mov byte [edi], al
|
|
tskipmask1:
|
|
add ebp, ebx
|
|
tnp2_fixchain1b: add edi, 320
|
|
dec ecx
|
|
jnz short tnp2_beginvline
|
|
mov eax, ebp
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
;eax: -------temp1-------
|
|
;ebx: -------temp2-------
|
|
;ecx: dat dat dat dat
|
|
;edx: ylo2 ylo4
|
|
;esi: yhi1 yhi2
|
|
;edi: ---videoplc/cnt----
|
|
;ebp: yhi3 yhi4
|
|
;esp:
|
|
ALIGN 16
|
|
vlineasm4:
|
|
CDECLBEGIN 6
|
|
CDECLPARAM ecx,0,5
|
|
CDECLPARAM edi,1,5
|
|
push ebp
|
|
|
|
mov eax, dword [ylookup]
|
|
mov eax, dword [eax+ecx*4]
|
|
add eax, edi
|
|
mov dword [machvline4end+2], eax
|
|
sub edi, eax
|
|
|
|
mov eax, dword [bufplce]
|
|
mov ebx, dword [bufplce+4]
|
|
mov ecx, dword [bufplce+8]
|
|
mov edx, dword [bufplce+12]
|
|
mov dword [machvbuf1+2], ecx
|
|
mov dword [machvbuf2+2], edx
|
|
mov dword [machvbuf3+2], eax
|
|
mov dword [machvbuf4+2], ebx
|
|
|
|
mov eax, dword [palookupoffse]
|
|
mov ebx, dword [palookupoffse+4]
|
|
mov ecx, dword [palookupoffse+8]
|
|
mov edx, dword [palookupoffse+12]
|
|
mov dword [machvpal1+2], ecx
|
|
mov dword [machvpal2+2], edx
|
|
mov dword [machvpal3+2], eax
|
|
mov dword [machvpal4+2], ebx
|
|
|
|
; +---------------+---------------+
|
|
;edx: |v3lo |v1lo |
|
|
; +---------------+-------+-------+
|
|
;esi: |v2hi v2lo | v3hi|
|
|
; +-----------------------+-------+
|
|
;ebp: |v0hi v0lo | v1hi|
|
|
; +-----------------------+-------+
|
|
|
|
mov ebp, dword [vince]
|
|
mov ebx, dword [vince+4]
|
|
mov esi, dword [vince+8]
|
|
mov eax, dword [vince+12]
|
|
and esi, 0fffffe00h
|
|
and ebp, 0fffffe00h
|
|
machvsh9: rol eax, 88h ;sh
|
|
machvsh10: rol ebx, 88h ;sh
|
|
mov edx, eax
|
|
mov ecx, ebx
|
|
shr ecx, 16
|
|
and edx, 0ffff0000h
|
|
add edx, ecx
|
|
and eax, 000001ffh
|
|
and ebx, 000001ffh
|
|
add esi, eax
|
|
add ebp, ebx
|
|
;
|
|
mov eax, edx
|
|
and eax, 0ffff0000h
|
|
mov dword [machvinc1+2], eax
|
|
mov dword [machvinc2+2], esi
|
|
mov byte [machvinc3+2], dl
|
|
mov byte [machvinc4+2], dh
|
|
mov dword [machvinc5+2], ebp
|
|
|
|
mov ebp, dword [vplce]
|
|
mov ebx, dword [vplce+4]
|
|
mov esi, dword [vplce+8]
|
|
mov eax, dword [vplce+12]
|
|
and esi, 0fffffe00h
|
|
and ebp, 0fffffe00h
|
|
machvsh11: rol eax, 88h ;sh
|
|
machvsh12: rol ebx, 88h ;sh
|
|
mov edx, eax
|
|
mov ecx, ebx
|
|
shr ecx, 16
|
|
and edx, 0ffff0000h
|
|
add edx, ecx
|
|
and eax, 000001ffh
|
|
and ebx, 000001ffh
|
|
add esi, eax
|
|
add ebp, ebx
|
|
|
|
mov ecx, esi
|
|
jmp short beginvlineasm4
|
|
ALIGN 16
|
|
nop
|
|
nop
|
|
nop
|
|
beginvlineasm4:
|
|
machvsh1: shr ecx, 88h ;32-sh
|
|
mov ebx, esi
|
|
machvsh2: and ebx, 00000088h ;(1<<sh)-1
|
|
machvinc1: add edx, 88880000h
|
|
machvinc2: adc esi, 88888088h
|
|
machvbuf1: mov cl, byte [ecx+88888888h]
|
|
machvbuf2: mov bl, byte [ebx+88888888h]
|
|
mov eax, ebp
|
|
machvsh3: shr eax, 88h ;32-sh
|
|
machvpal1: mov cl, byte [ecx+88888888h]
|
|
machvpal2: mov ch, byte [ebx+88888888h]
|
|
mov ebx, ebp
|
|
shl ecx, 16
|
|
machvsh4: and ebx, 00000088h ;(1<<sh)-1
|
|
machvinc3: add dl, 88h
|
|
machvbuf3: mov al, byte [eax+88888888h]
|
|
machvinc4: adc dh, 88h
|
|
machvbuf4: mov bl, byte [ebx+88888888h]
|
|
machvinc5: adc ebp, 88888088h
|
|
machvpal3: mov cl, byte [eax+88888888h]
|
|
machvpal4: mov ch, byte [ebx+88888888h]
|
|
machvline4end: mov dword [edi+88888888h], ecx
|
|
fixchain2a: add edi, 88888888h
|
|
mov ecx, esi
|
|
jnc short beginvlineasm4
|
|
|
|
; +---------------+---------------+
|
|
;edx: |v3lo |v1lo |
|
|
; +---------------+-------+-------+
|
|
;esi: |v2hi v2lo | v3hi|
|
|
; +-----------------------+-------+
|
|
;ebp: |v0hi v0lo | v1hi|
|
|
; +-----------------------+-------+
|
|
|
|
mov dword [vplce+8], esi
|
|
mov dword [vplce], ebp
|
|
;vplc2 = (esi<<(32-sh))+(edx>>sh)
|
|
;vplc3 = (ebp<<(32-sh))+((edx&65535)<<(16-sh))
|
|
machvsh5: shl esi, 88h ;32-sh
|
|
mov eax, edx
|
|
machvsh6: shl ebp, 88h ;32-sh
|
|
and edx, 0000ffffh
|
|
machvsh7: shr eax, 88h ;sh
|
|
add esi, eax
|
|
machvsh8: shl edx, 88h ;16-sh
|
|
add ebp, edx
|
|
mov dword [vplce+12], esi
|
|
mov dword [vplce+4], ebp
|
|
|
|
pop ebp
|
|
CDECLEND 6
|
|
ret
|
|
|
|
;eax: -------temp1-------
|
|
;ebx: -------temp2-------
|
|
;ecx: ylo4 ---------
|
|
;edx: ylo2 ---------
|
|
;esi: yhi1 yhi2
|
|
;edi: ---videoplc/cnt----
|
|
;ebp: yhi3 yhi4
|
|
;esp:
|
|
ALIGN 16
|
|
provlineasm4:
|
|
CDECLBEGIN 6
|
|
CDECLPARAM ecx,0,5
|
|
CDECLPARAM edi,1,5
|
|
push ebp
|
|
|
|
mov eax, dword [ylookup]
|
|
mov eax, dword [eax+ecx*4]
|
|
add eax, edi
|
|
mov dword [promachvline4end1+2], eax
|
|
inc eax
|
|
mov dword [promachvline4end2+2], eax
|
|
inc eax
|
|
mov dword [promachvline4end3+2], eax
|
|
inc eax
|
|
mov dword [promachvline4end4+2], eax
|
|
sub eax, 3
|
|
sub edi, eax
|
|
|
|
mov eax, dword [bufplce]
|
|
mov ebx, dword [bufplce+4]
|
|
mov ecx, dword [bufplce+8]
|
|
mov edx, dword [bufplce+12]
|
|
mov dword [promachvbuf1+3], ecx
|
|
mov dword [promachvbuf2+3], edx
|
|
mov dword [promachvbuf3+3], eax
|
|
mov dword [promachvbuf4+3], ebx
|
|
|
|
mov eax, dword [palookupoffse]
|
|
mov ebx, dword [palookupoffse+4]
|
|
mov ecx, dword [palookupoffse+8]
|
|
mov edx, dword [palookupoffse+12]
|
|
mov dword [promachvpal1+2], ecx
|
|
mov dword [promachvpal2+2], edx
|
|
mov dword [promachvpal3+2], eax
|
|
mov dword [promachvpal4+2], ebx
|
|
|
|
; +---------------+---------------+
|
|
;edx: |v3lo |v1lo |
|
|
; +---------------+-------+-------+
|
|
;esi: |v2hi v2lo | v3hi|
|
|
; +-----------------------+-------+
|
|
;ebp: |v0hi v0lo | v1hi|
|
|
; +-----------------------+-------+
|
|
|
|
mov ebp, dword [vince]
|
|
mov ebx, dword [vince+4]
|
|
mov esi, dword [vince+8]
|
|
mov eax, dword [vince+12]
|
|
and esi, 0fffffe00h
|
|
and ebp, 0fffffe00h
|
|
promachvsh9: rol eax, 88h ;sh
|
|
promachvsh10: rol ebx, 88h ;sh
|
|
mov edx, eax
|
|
mov ecx, ebx
|
|
shr ecx, 16
|
|
and edx, 0ffff0000h
|
|
add edx, ecx
|
|
and eax, 000001ffh
|
|
and ebx, 000001ffh
|
|
add esi, eax
|
|
add ebp, ebx
|
|
;
|
|
mov eax, edx
|
|
and eax, 0ffff0000h
|
|
mov dword [promachvinc1+2], eax
|
|
mov dword [promachvinc2+2], esi
|
|
shl edx, 16
|
|
mov dword [promachvinc3+2], edx
|
|
mov dword [promachvinc5+2], ebp
|
|
|
|
mov ebp, dword [vplce]
|
|
mov ebx, dword [vplce+4]
|
|
mov esi, dword [vplce+8]
|
|
mov eax, dword [vplce+12]
|
|
and esi, 0fffffe00h
|
|
and ebp, 0fffffe00h
|
|
promachvsh11: rol eax, 88h ;sh
|
|
promachvsh12: rol ebx, 88h ;sh
|
|
mov edx, eax
|
|
mov ecx, ebx
|
|
shr ecx, 16
|
|
and edx, 0ffff0000h
|
|
add edx, ecx
|
|
and eax, 000001ffh
|
|
and ebx, 000001ffh
|
|
add esi, eax
|
|
add ebp, ebx
|
|
|
|
mov eax, esi
|
|
mov ecx, edx
|
|
shl ecx, 16
|
|
jmp short probeginvlineasm4
|
|
ALIGN 16
|
|
nop
|
|
nop
|
|
nop
|
|
probeginvlineasm4:
|
|
promachvsh1: shr eax, 88h ;32-sh
|
|
mov ebx, esi
|
|
promachvsh2: and ebx, 00000088h ;(1<<sh)-1
|
|
promachvinc1: add edx, 88880000h
|
|
promachvinc2: adc esi, 88888088h
|
|
promachvbuf1: movzx eax, byte [eax+88888888h]
|
|
promachvbuf2: movzx ebx, byte [ebx+88888888h]
|
|
promachvpal1: mov al, byte [eax+88888888h]
|
|
promachvline4end3: mov byte [edi+88888888h], al
|
|
mov eax, ebp
|
|
promachvsh3: shr eax, 88h ;32-sh
|
|
promachvpal2: mov bl, byte [ebx+88888888h]
|
|
promachvline4end4: mov byte [edi+88888888h], bl
|
|
mov ebx, ebp
|
|
promachvsh4: and ebx, 00000088h ;(1<<sh)-1
|
|
promachvbuf3: movzx eax, byte [eax+88888888h]
|
|
promachvinc3: add ecx, 88888888h
|
|
promachvbuf4: movzx ebx, byte [ebx+88888888h]
|
|
promachvinc5: adc ebp, 88888088h
|
|
promachvpal3: mov al, byte [eax+88888888h]
|
|
promachvline4end1: mov byte [edi+88888888h], al
|
|
promachvpal4: mov bl, byte [ebx+88888888h]
|
|
promachvline4end2: mov byte [edi+88888888h], bl
|
|
profixchain2a: add edi, 88888888h
|
|
mov eax, esi
|
|
jnc near probeginvlineasm4
|
|
|
|
; +---------------+---------------+
|
|
;edx: |v3lo |v1lo |
|
|
; +---------------+-------+-------+
|
|
;esi: |v2hi v2lo | v3hi|
|
|
; +-----------------------+-------+
|
|
;ebp: |v0hi v0lo | v1hi|
|
|
; +-----------------------+-------+
|
|
|
|
mov dword [vplce+8], esi
|
|
mov dword [vplce], ebp
|
|
;vplc2 = (esi<<(32-sh))+(edx>>sh)
|
|
;vplc3 = (ebp<<(32-sh))+((edx&65535)<<(16-sh))
|
|
promachvsh5: shl esi, 88h ;32-sh
|
|
mov eax, edx
|
|
promachvsh6: shl ebp, 88h ;32-sh
|
|
and edx, 0000ffffh
|
|
promachvsh7: shr eax, 88h ;sh
|
|
add esi, eax
|
|
promachvsh8: shl edx, 88h ;16-sh
|
|
add ebp, edx
|
|
mov dword [vplce+12], esi
|
|
mov dword [vplce+4], ebp
|
|
|
|
pop ebp
|
|
CDECLEND 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
mvlineasm4:
|
|
CDECLBEGIN 6
|
|
CDECLPARAM ecx,0,5
|
|
CDECLPARAM edi,1,5
|
|
|
|
push ebp
|
|
|
|
mov eax, dword [bufplce]
|
|
mov ebx, dword [bufplce+4]
|
|
mov dword [machmv1+2], eax
|
|
mov dword [machmv4+2], ebx
|
|
mov eax, dword [bufplce+8]
|
|
mov ebx, dword [bufplce+12]
|
|
mov dword [machmv7+2], eax
|
|
mov dword [machmv10+2], ebx
|
|
|
|
mov eax, dword [palookupoffse]
|
|
mov ebx, dword [palookupoffse+4]
|
|
mov dword [machmv2+2], eax
|
|
mov dword [machmv5+2], ebx
|
|
mov eax, dword [palookupoffse+8]
|
|
mov ebx, dword [palookupoffse+12]
|
|
mov dword [machmv8+2], eax
|
|
mov dword [machmv11+2], ebx
|
|
|
|
mov eax, dword [vince]
|
|
mov ebx, dword [vince+4]
|
|
xor al, al
|
|
xor bl, bl
|
|
mov dword [machmv3+2], eax
|
|
mov dword [machmv6+2], ebx
|
|
mov eax, dword [vince+8]
|
|
mov ebx, dword [vince+12]
|
|
mov dword [machmv9+2], eax
|
|
mov dword [machmv12+2], ebx
|
|
|
|
mov ebx, ecx
|
|
mov ecx, dword [vplce]
|
|
mov edx, dword [vplce+4]
|
|
mov esi, dword [vplce+8]
|
|
mov ebp, dword [vplce+12]
|
|
mov cl, bl
|
|
inc cl
|
|
inc bh
|
|
mov byte [asm3], bh
|
|
fixchain2ma: sub edi, 320
|
|
|
|
jmp short beginmvlineasm4
|
|
ALIGN 16
|
|
beginmvlineasm4:
|
|
dec cl
|
|
jz near endmvlineasm4
|
|
beginmvlineasm42:
|
|
mov eax, ebp
|
|
mov ebx, esi
|
|
machmv16: shr eax, 32
|
|
machmv15: shr ebx, 32
|
|
machmv12: add ebp, 88888888h ;vince[3]
|
|
machmv9: add esi, 88888888h ;vince[2]
|
|
machmv10: mov al, byte [eax+88888888h] ;bufplce[3]
|
|
machmv7: mov bl, byte [ebx+88888888h] ;bufplce[2]
|
|
cmp al, 255
|
|
adc dl, dl
|
|
cmp bl, 255
|
|
adc dl, dl
|
|
machmv8: mov bl, byte [ebx+88888888h] ;palookupoffs[2]
|
|
machmv11: mov bh, byte [eax+88888888h] ;palookupoffs[3]
|
|
|
|
mov eax, edx
|
|
machmv14: shr eax, 32
|
|
shl ebx, 16
|
|
machmv4: mov al, byte [eax+88888888h] ;bufplce[1]
|
|
cmp al, 255
|
|
adc dl, dl
|
|
machmv6: add edx, 88888888h ;vince[1]
|
|
machmv5: mov bh, byte [eax+88888888h] ;palookupoffs[1]
|
|
|
|
mov eax, ecx
|
|
machmv13: shr eax, 32
|
|
machmv3: add ecx, 88888888h ;vince[0]
|
|
machmv1: mov al, byte [eax+88888888h] ;bufplce[0]
|
|
cmp al, 255
|
|
adc dl, dl
|
|
machmv2: mov bl, byte [eax+88888888h] ;palookupoffs[0]
|
|
|
|
shl dl, 4
|
|
xor eax, eax
|
|
fixchain2mb: add edi, 320
|
|
mov al, dl
|
|
add eax, mvcase0
|
|
jmp eax ;16 byte cases
|
|
|
|
ALIGN 16
|
|
endmvlineasm4:
|
|
dec byte [asm3]
|
|
jnz near beginmvlineasm42 ;near
|
|
|
|
mov dword [vplce], ecx
|
|
mov dword [vplce+4], edx
|
|
mov dword [vplce+8], esi
|
|
mov dword [vplce+12], ebp
|
|
pop ebp
|
|
CDECLEND 6
|
|
ret
|
|
|
|
;5,7,8,8,11,13,12,14,11,13,14,14,12,14,15,7
|
|
ALIGN 16
|
|
mvcase0:
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase1:
|
|
mov byte [edi], bl
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase2:
|
|
mov byte [edi+1], bh
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase3:
|
|
mov word [edi], bx
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase4:
|
|
shr ebx, 16
|
|
mov byte [edi+2], bl
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase5:
|
|
mov byte [edi], bl
|
|
shr ebx, 16
|
|
mov byte [edi+2], bl
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase6:
|
|
shr ebx, 8
|
|
mov word [edi+1], bx
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase7:
|
|
mov word [edi], bx
|
|
shr ebx, 16
|
|
mov byte [edi+2], bl
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase8:
|
|
shr ebx, 16
|
|
mov byte [edi+3], bh
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase9:
|
|
mov byte [edi], bl
|
|
shr ebx, 16
|
|
mov byte [edi+3], bh
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase10:
|
|
mov byte [edi+1], bh
|
|
shr ebx, 16
|
|
mov byte [edi+3], bh
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase11:
|
|
mov word [edi], bx
|
|
shr ebx, 16
|
|
mov byte [edi+3], bh
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase12:
|
|
shr ebx, 16
|
|
mov word [edi+2], bx
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase13:
|
|
mov byte [edi], bl
|
|
shr ebx, 16
|
|
mov word [edi+2], bx
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase14:
|
|
mov byte [edi+1], bh
|
|
shr ebx, 16
|
|
mov word [edi+2], bx
|
|
jmp beginmvlineasm4
|
|
ALIGN 16
|
|
mvcase15:
|
|
mov dword [edi], ebx
|
|
jmp beginmvlineasm4
|
|
|
|
|
|
ALIGN 16
|
|
setupspritevline:
|
|
CDECLBEGINSET 6
|
|
|
|
mov dword [spal+2], eax
|
|
|
|
mov eax, esi ;xinc's
|
|
shl eax, 16
|
|
mov dword [smach1+2], eax
|
|
mov dword [smach4+2], eax
|
|
mov eax, esi
|
|
sar eax, 16
|
|
add eax, ebx ;watch out with ebx - it's passed
|
|
mov dword [smach2+2], eax
|
|
add eax, edx
|
|
mov dword [smach5+2], eax
|
|
|
|
mov dword [smach3+2], ecx ;yinc's
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
spritevline:
|
|
CDECLBEGINSET 6
|
|
jmp short spritevline_start
|
|
;eax = 0, ebx = x, ecx = cnt, edx = y, esi = yplc, edi = p
|
|
prestartsvline:
|
|
smach1: add ebx, 88888888h ;xincshl16
|
|
mov al, byte [esi]
|
|
smach2: adc esi, 88888888h ;xincshr16+yalwaysinc
|
|
|
|
startsvline:
|
|
spal: mov al, [eax+88888888h] ;palookup
|
|
mov byte [edi], al
|
|
fixchain1s: add edi, 320
|
|
|
|
spritevline_start:
|
|
smach3: add edx, 88888888h ;dayinc
|
|
dec ecx
|
|
ja short prestartsvline ;jump if (no carry (add)) and (not zero (dec))!
|
|
jz short endsvline
|
|
smach4: add ebx, 88888888h ;xincshl16
|
|
mov al, byte [esi]
|
|
smach5: adc esi, 88888888h ;xincshr16+yalwaysinc+daydime
|
|
jmp short startsvline
|
|
endsvline:
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
msetupspritevline:
|
|
CDECLBEGINSET 6
|
|
|
|
mov dword [mspal+2], eax
|
|
|
|
mov eax, esi ;xinc's
|
|
shl eax, 16
|
|
mov dword [msmach1+2], eax
|
|
mov dword [msmach4+2], eax
|
|
mov eax, esi
|
|
sar eax, 16
|
|
add eax, ebx ;watch out with ebx - it's passed
|
|
mov dword [msmach2+2], eax
|
|
add eax, edx
|
|
mov dword [msmach5+2], eax
|
|
|
|
mov dword [msmach3+2], ecx ;yinc's
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
mspritevline:
|
|
CDECLBEGINSET 6
|
|
jmp short mspritevline_start
|
|
;eax = 0, ebx = x, ecx = cnt, edx = y, esi = yplc, edi = p
|
|
mprestartsvline:
|
|
msmach1: add ebx, 88888888h ;xincshl16
|
|
mov al, byte [esi]
|
|
msmach2: adc esi, 88888888h ;xincshr16+yalwaysinc
|
|
|
|
mstartsvline:
|
|
cmp al, 255
|
|
je short mskipsvline
|
|
mspal: mov al, [eax+88888888h] ;palookup
|
|
mov byte [edi], al
|
|
mskipsvline:
|
|
mfixchain1s: add edi, 320
|
|
|
|
mspritevline_start:
|
|
msmach3: add edx, 88888888h ;dayinc
|
|
dec ecx
|
|
ja short mprestartsvline ;jump if (no carry (add)) and (not zero (dec))!
|
|
jz short mendsvline
|
|
msmach4: add ebx, 88888888h ;xincshl16
|
|
mov al, byte [esi]
|
|
msmach5: adc esi, 88888888h ;xincshr16+yalwaysinc+daydime
|
|
jmp short mstartsvline
|
|
mendsvline:
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
tsetupspritevline:
|
|
CDECLBEGINSET 6
|
|
mov dword [tspal+2], eax
|
|
|
|
mov eax, esi ;xinc's
|
|
shl eax, 16
|
|
mov dword [tsmach1+2], eax
|
|
mov dword [tsmach4+2], eax
|
|
mov eax, esi
|
|
sar eax, 16
|
|
add eax, ebx ;watch out with ebx - it's passed
|
|
mov dword [tsmach2+2], eax
|
|
add eax, edx
|
|
mov dword [tsmach5+2], eax
|
|
|
|
mov dword [tsmach3+2], ecx ;yinc's
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
tspritevline:
|
|
CDECLBEGINSET 6
|
|
;eax = 0, ebx = x, ecx = cnt, edx = y, esi = yplc, edi = p
|
|
push ebp
|
|
mov ebp, ebx
|
|
xor ebx, ebx
|
|
jmp tenterspritevline
|
|
ALIGN 16
|
|
tprestartsvline:
|
|
tsmach1: add ebp, 88888888h ;xincshl16
|
|
mov al, byte [esi]
|
|
tsmach2: adc esi, 88888888h ;xincshr16+yalwaysinc
|
|
|
|
tstartsvline:
|
|
cmp al, 255
|
|
je short tskipsvline
|
|
transrev2:
|
|
mov bh, byte [edi]
|
|
transrev3:
|
|
tspal: mov bl, [eax+88888888h] ;palookup
|
|
tmach4: mov al, byte [ebx+88888888h] ;_transluc
|
|
mov byte [edi], al
|
|
tskipsvline:
|
|
tfixchain1s: add edi, 320
|
|
|
|
tenterspritevline:
|
|
tsmach3: add edx, 88888888h ;dayinc
|
|
dec ecx
|
|
ja short tprestartsvline ;jump if (no carry (add)) and (not zero (dec))!
|
|
jz short tendsvline
|
|
tsmach4: add ebp, 88888888h ;xincshl16
|
|
mov al, byte [esi]
|
|
tsmach5: adc esi, 88888888h ;xincshr16+yalwaysinc+daydime
|
|
jmp short tstartsvline
|
|
tendsvline:
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
msethlineshift:
|
|
CDECLBEGINSET 2
|
|
neg al
|
|
mov byte [msh1d+2], al
|
|
mov byte [msh2d+3], bl
|
|
mov byte [msh3d+2], al
|
|
mov byte [msh4d+3], bl
|
|
mov byte [msh5d+2], al
|
|
mov byte [msh6d+3], bl
|
|
CDECLENDSET 2
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
mhline:
|
|
CDECLBEGINSET 6
|
|
;asm1 = bxinc
|
|
;asm2 = byinc
|
|
;asm3 = shadeoffs
|
|
;eax = picoffs
|
|
;ebx = bx
|
|
;ecx = cnt
|
|
;edx = ?
|
|
;esi = by
|
|
;edi = p
|
|
|
|
mov dword [mmach1d+2], eax
|
|
mov dword [mmach5d+2], eax
|
|
mov dword [mmach9d+2], eax
|
|
mov eax, dword [asm3]
|
|
mov dword [mmach2d+2], eax
|
|
mov dword [mmach2da+2], eax
|
|
mov dword [mmach2db+2], eax
|
|
mov dword [mmach6d+2], eax
|
|
mov dword [mmach10d+2], eax
|
|
mov eax, dword [asm1]
|
|
mov dword [mmach3d+2], eax
|
|
mov dword [mmach7d+2], eax
|
|
mov eax, dword [asm2]
|
|
mov dword [mmach4d+2], eax
|
|
mov dword [mmach8d+2], eax
|
|
jmp short mhlineskipmodify_nosetup
|
|
|
|
|
|
ALIGN 16
|
|
mhlineskipmodify:
|
|
CDECLBEGINSET 6
|
|
mhlineskipmodify_nosetup:
|
|
|
|
push ebp
|
|
|
|
xor eax, eax
|
|
mov ebp, ebx
|
|
|
|
test ecx, 00010000h
|
|
jnz short mbeghline
|
|
|
|
msh1d: shr ebx, 26
|
|
msh2d: shld ebx, esi, 6
|
|
add ebp, dword [asm1]
|
|
mmach9d: mov al, byte [ebx+88888888h] ;picoffs
|
|
add esi, dword [asm2]
|
|
cmp al, 255
|
|
je mskip5
|
|
|
|
mmach10d: mov cl, byte [eax+88888888h] ;shadeoffs
|
|
mov byte [edi], cl
|
|
mskip5:
|
|
inc edi
|
|
sub ecx, 65536
|
|
jc near mendhline
|
|
jmp short mbeghline
|
|
|
|
ALIGN 16
|
|
mpreprebeghline: ;1st only
|
|
mov al, cl
|
|
mmach2d: mov al, byte [eax+88888888h] ;shadeoffs
|
|
mov byte [edi], al
|
|
|
|
mprebeghline:
|
|
add edi, 2
|
|
sub ecx, 131072
|
|
jc near mendhline
|
|
mbeghline:
|
|
mmach3d: lea ebx, [ebp+88888888h] ;bxinc
|
|
msh3d: shr ebp, 26
|
|
msh4d: shld ebp, esi, 6
|
|
mmach4d: add esi, 88888888h ;byinc
|
|
mmach1d: mov cl, byte [ebp+88888888h] ;picoffs
|
|
mmach7d: lea ebp, [ebx+88888888h] ;bxinc
|
|
|
|
msh5d: shr ebx, 26
|
|
msh6d: shld ebx, esi, 6
|
|
mmach8d: add esi, 88888888h ;byinc
|
|
mmach5d: mov ch, byte [ebx+88888888h] ;picoffs
|
|
|
|
cmp cl, 255
|
|
je short mskip1
|
|
cmp ch, 255
|
|
je short mpreprebeghline
|
|
|
|
mov al, cl ;BOTH
|
|
mmach2da: mov bl, byte [eax+88888888h] ;shadeoffs
|
|
mov al, ch
|
|
mmach2db: mov bh, byte [eax+88888888h] ;shadeoffs
|
|
mov word [edi], bx
|
|
add edi, 2
|
|
sub ecx, 131072
|
|
jnc short mbeghline
|
|
jmp mendhline
|
|
mskip1: ;2nd only
|
|
cmp ch, 255
|
|
je short mprebeghline
|
|
|
|
mov al, ch
|
|
mmach6d: mov al, byte [eax+88888888h] ;shadeoffs
|
|
mov byte [edi+1], al
|
|
add edi, 2
|
|
sub ecx, 131072
|
|
jnc short mbeghline
|
|
mendhline:
|
|
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
tsethlineshift:
|
|
CDECLBEGINSET 2
|
|
neg al
|
|
mov byte [tsh1d+2], al
|
|
mov byte [tsh2d+3], bl
|
|
mov byte [tsh3d+2], al
|
|
mov byte [tsh4d+3], bl
|
|
mov byte [tsh5d+2], al
|
|
mov byte [tsh6d+3], bl
|
|
CDECLENDSET 2
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
thline:
|
|
CDECLBEGINSET 6
|
|
;asm1 = bxinc
|
|
;asm2 = byinc
|
|
;asm3 = shadeoffs
|
|
;eax = picoffs
|
|
;ebx = bx
|
|
;ecx = cnt
|
|
;edx = ?
|
|
;esi = by
|
|
;edi = p
|
|
|
|
mov dword [tmach1d+2], eax
|
|
mov dword [tmach5d+2], eax
|
|
mov dword [tmach9d+2], eax
|
|
mov eax, dword [asm3]
|
|
mov dword [tmach2d+2], eax
|
|
mov dword [tmach6d+2], eax
|
|
mov dword [tmach10d+2], eax
|
|
mov eax, dword [asm1]
|
|
mov dword [tmach3d+2], eax
|
|
mov dword [tmach7d+2], eax
|
|
mov eax, dword [asm2]
|
|
mov dword [tmach4d+2], eax
|
|
mov dword [tmach8d+2], eax
|
|
jmp thlineskipmodify_nosetup
|
|
|
|
|
|
ALIGN 16
|
|
thlineskipmodify:
|
|
CDECLBEGINSET 6
|
|
thlineskipmodify_nosetup:
|
|
|
|
push ebp
|
|
|
|
xor eax, eax
|
|
xor edx, edx
|
|
mov ebp, ebx
|
|
|
|
test ecx, 00010000h
|
|
jnz short tbeghline
|
|
|
|
tsh1d: shr ebx, 26
|
|
tsh2d: shld ebx, esi, 6
|
|
add ebp, dword [asm1]
|
|
tmach9d: mov al, byte [ebx+88888888h] ;picoffs
|
|
add esi, dword [asm2]
|
|
cmp al, 255
|
|
je tskip5
|
|
|
|
transrev4:
|
|
tmach10d: mov dl, byte [eax+88888888h] ;shadeoffs
|
|
transrev5:
|
|
mov dh, byte [edi]
|
|
tmach1: mov al, byte [edx+88888888h] ;_transluc
|
|
mov byte [edi], al
|
|
tskip5:
|
|
inc edi
|
|
sub ecx, 65536
|
|
jc near tendhline
|
|
jmp short tbeghline
|
|
|
|
ALIGN 16
|
|
tprebeghline:
|
|
add edi, 2
|
|
sub ecx, 131072
|
|
jc short tendhline
|
|
tbeghline:
|
|
tmach3d: lea ebx, [ebp+88888888h] ;bxinc
|
|
tsh3d: shr ebp, 26
|
|
tsh4d: shld ebp, esi, 6
|
|
tmach4d: add esi, 88888888h ;byinc
|
|
tmach1d: mov cl, byte [ebp+88888888h] ;picoffs
|
|
tmach7d: lea ebp, [ebx+88888888h] ;bxinc
|
|
|
|
tsh5d: shr ebx, 26
|
|
tsh6d: shld ebx, esi, 6
|
|
tmach8d: add esi, 88888888h ;byinc
|
|
tmach5d: mov ch, byte [ebx+88888888h] ;picoffs
|
|
|
|
cmp cx, 0ffffh
|
|
je short tprebeghline
|
|
|
|
mov bx, word [edi]
|
|
|
|
cmp cl, 255
|
|
je short tskip1
|
|
mov al, cl
|
|
transrev6:
|
|
tmach2d: mov dl, byte [eax+88888888h] ;shadeoffs
|
|
transrev7:
|
|
mov dh, bl
|
|
tmach2: mov al, byte [edx+88888888h] ;_transluc
|
|
mov byte [edi], al
|
|
|
|
cmp ch, 255
|
|
je short tskip2
|
|
tskip1:
|
|
mov al, ch
|
|
transrev8:
|
|
tmach6d: mov dl, byte [eax+88888888h] ;shadeoffs
|
|
transrev9:
|
|
mov dh, bh
|
|
tmach3: mov al, byte [edx+88888888h] ;_transluc
|
|
mov byte [edi+1], al
|
|
tskip2:
|
|
|
|
add edi, 2
|
|
sub ecx, 131072
|
|
jnc tbeghline
|
|
tendhline:
|
|
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
;eax=shiftval, ebx=palookup1, ecx=palookup2
|
|
ALIGN 16
|
|
setuptvlineasm2:
|
|
CDECLBEGINSET 3
|
|
mov byte [tran2shra+2], al
|
|
mov byte [tran2shrb+2], al
|
|
mov dword [tran2pala+2], ebx
|
|
mov dword [tran2palb+2], ecx
|
|
mov dword [tran2palc+2], ebx
|
|
mov dword [tran2pald+2], ecx
|
|
CDECLENDSET 3
|
|
ret
|
|
|
|
;Pass: eax=vplc2, ebx=vinc1, ecx=bufplc1, edx=bufplc2, esi=vplc1, edi=p
|
|
; asm1=vinc2, asm2=pend
|
|
;Return: asm1=vplc1, asm2=vplc2
|
|
ALIGN 16
|
|
tvlineasm2:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
|
|
mov ebp, eax
|
|
|
|
mov dword [tran2inca+2], ebx
|
|
mov eax, dword [asm1]
|
|
mov dword [tran2incb+2], eax
|
|
|
|
mov dword [tran2bufa+2], ecx ;bufplc1
|
|
mov dword [tran2bufb+2], edx ;bufplc2
|
|
|
|
mov eax, dword [asm2]
|
|
sub edi, eax
|
|
mov dword [tran2edia+3], eax
|
|
mov dword [tran2edic+2], eax
|
|
inc eax
|
|
mov dword [tran2edie+2], eax
|
|
fixchaint2a: sub eax, 320
|
|
mov dword [tran2edif+2], eax
|
|
dec eax
|
|
mov dword [tran2edib+3], eax
|
|
mov dword [tran2edid+2], eax
|
|
|
|
xor ecx, ecx
|
|
xor edx, edx
|
|
jmp short begintvline2
|
|
|
|
;eax 0000000000 temp temp
|
|
;ebx 0000000000 odat2 odat1
|
|
;ecx 0000000000000000 ndat1
|
|
;edx 0000000000000000 ndat2
|
|
;esi vplc1
|
|
;edi videoplc--------------
|
|
;ebp vplc2
|
|
|
|
ALIGN 16
|
|
;LEFT ONLY
|
|
skipdraw2:
|
|
transrev10:
|
|
tran2edic: mov ah, byte [edi+88888888h] ;getpixel
|
|
transrev11:
|
|
tran2palc: mov al, byte [ecx+88888888h] ;palookup1
|
|
fixchaint2d: add edi, 320
|
|
tran2trac: mov bl, byte [eax+88888888h] ;_transluc
|
|
tran2edid: mov byte [edi+88888888h-320], bl ;drawpixel
|
|
jnc short begintvline2
|
|
jmp endtvline2
|
|
|
|
skipdraw1:
|
|
cmp dl, 255
|
|
jne short skipdraw3
|
|
fixchaint2b: add edi, 320
|
|
jc short endtvline2
|
|
|
|
begintvline2:
|
|
mov eax, esi
|
|
tran2shra: shr eax, 88h ;globalshift
|
|
mov ebx, ebp
|
|
tran2shrb: shr ebx, 88h ;globalshift
|
|
tran2inca: add esi, 88888888h ;vinc1
|
|
tran2incb: add ebp, 88888888h ;vinc2
|
|
tran2bufa: mov cl, byte [eax+88888888h] ;bufplc1
|
|
cmp cl, 255
|
|
tran2bufb: mov dl, byte [ebx+88888888h] ;bufplc2
|
|
je short skipdraw1
|
|
cmp dl, 255
|
|
je short skipdraw2
|
|
|
|
;mov ax The transluscent reverse of both!
|
|
;mov bl, ah
|
|
;mov ah
|
|
;mov bh
|
|
|
|
;BOTH
|
|
transrev12:
|
|
tran2edia: mov bx, word [edi+88888888h] ;getpixels
|
|
transrev13:
|
|
mov ah, bl
|
|
transrev14:
|
|
tran2pala: mov al, byte [ecx+88888888h] ;palookup1
|
|
transrev15:
|
|
tran2palb: mov bl, byte [edx+88888888h] ;palookup2
|
|
fixchaint2c: add edi, 320
|
|
tran2traa: mov al, byte [eax+88888888h] ;_transluc
|
|
tran2trab: mov ah, byte [ebx+88888888h] ;_transluc
|
|
tran2edib: mov word [edi+88888888h-320], ax ;drawpixels
|
|
jnc short begintvline2
|
|
jmp short endtvline2
|
|
|
|
;RIGHT ONLY
|
|
skipdraw3:
|
|
transrev16:
|
|
tran2edie: mov ah, byte [edi+88888889h] ;getpixel
|
|
transrev17:
|
|
tran2pald: mov al, byte [edx+88888888h] ;palookup2
|
|
fixchaint2e: add edi, 320
|
|
tran2trad: mov bl, byte [eax+88888888h] ;_transluc
|
|
tran2edif: mov byte [edi+88888889h-320], bl ;drawpixel
|
|
jnc short begintvline2
|
|
|
|
endtvline2:
|
|
mov dword [asm1], esi
|
|
mov dword [asm2], ebp
|
|
|
|
pop ebp
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
BITSOFPRECISION equ 3
|
|
BITSOFPRECISIONPOW equ 8
|
|
|
|
%if 0 ; SLOPEVLIN2 is unused as of 2012-02-26
|
|
|
|
;Double-texture mapping with palette lookup
|
|
;eax: ylo1------------|----dat|----dat
|
|
;ebx: ylo2--------------------|----cnt
|
|
;ecx: 000000000000000000000000|---temp
|
|
;edx: xhi1-xlo1---------------|---yhi1
|
|
;esi: xhi2-xlo2---------------|---yhi2
|
|
;edi: ------------------------videopos
|
|
;ebp: ----------------------------temp
|
|
|
|
ALIGN 16
|
|
setupslopevlin2:
|
|
CDECLBEGINSET 6
|
|
|
|
mov dword [slop3+2], edx ;ptr
|
|
mov dword [slop7+2], edx ;ptr
|
|
mov dword [slop4+2], esi ;tptr
|
|
mov dword [slop8+2], esi ;tptr
|
|
mov byte [slop2+2], ah ;ybits
|
|
mov byte [slop6+2], ah ;ybits
|
|
mov dword [slop9+2], edi ;pinc
|
|
|
|
mov edx, 1
|
|
mov cl, al
|
|
add cl, ah
|
|
shl edx, cl
|
|
dec edx
|
|
mov cl, ah
|
|
ror edx, cl
|
|
|
|
mov dword [slop1+2], edx ;ybits...xbits
|
|
mov dword [slop5+2], edx ;ybits...xbits
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
ALIGN 16
|
|
slopevlin2:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
xor ecx, ecx
|
|
|
|
slopevlin2begin:
|
|
mov ebp, edx
|
|
slop1: and ebp, 88000088h ;ybits...xbits
|
|
slop2: rol ebp, 6 ;ybits
|
|
add eax, dword [asm1] ;xinc1<<xbits
|
|
adc edx, dword [asm2] ;(yinc1&0xffffff00)+(xinc1>>(32-xbits))
|
|
slop3: mov cl, byte [ebp+88888888h] ;bufplc
|
|
|
|
mov ebp, esi
|
|
slop4: mov al, byte [ecx+88888888h] ;paloffs
|
|
slop5: and ebp, 88000088h ;ybits...xbits
|
|
slop6: rol ebp, 6 ;ybits
|
|
add ebx, dword [asm3] ;xinc2<<xbits
|
|
slop7: mov cl, byte [ebp+88888888h] ;bufplc
|
|
adc esi, dword [asm4] ;(yinc2&0xffffff00)+(xinc2>>(32-xbits))
|
|
slop8: mov ah, byte [ecx+88888888h] ;paloffs
|
|
|
|
dec bl
|
|
mov word [edi], ax
|
|
slop9: lea edi, [edi+88888888h] ;pinc
|
|
jnz short slopevlin2begin
|
|
|
|
pop ebp
|
|
mov eax, edi
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
%endif ; SLOPEVLIN2 %if 0
|
|
|
|
ALIGN 16
|
|
setupslopevlin:
|
|
CDECLBEGINSET 3
|
|
|
|
mov dword [slopmach3+3], ebx ;ptr
|
|
mov dword [slopmach5+2], ecx ;pinc
|
|
neg ecx
|
|
mov dword [slopmach6+2], ecx ;-pinc
|
|
|
|
mov edx, 1
|
|
mov cl, al
|
|
shl edx, cl
|
|
dec edx
|
|
mov cl, ah
|
|
shl edx, cl
|
|
mov dword [slopmach7+2], edx
|
|
|
|
neg ah
|
|
mov byte [slopmach2+2], ah
|
|
|
|
sub ah, al
|
|
mov byte [slopmach1+2], ah
|
|
|
|
fild dword [asm1]
|
|
fstp dword [asm2]
|
|
|
|
CDECLENDSET 3
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
slopevlin:
|
|
CDECLBEGINSET 6
|
|
|
|
mov dword [ebpbak], ebp
|
|
mov dword [espbak], esp
|
|
|
|
sub ecx, esp
|
|
mov dword [slopmach4+3], ecx
|
|
|
|
fild dword [asm3]
|
|
slopmach6: lea ebp, [eax+88888888h]
|
|
fadd dword [asm2]
|
|
|
|
mov dword [asm1], ebx
|
|
shl ebx, 3
|
|
|
|
mov eax, dword [globalx3]
|
|
mov ecx, dword [globaly3]
|
|
imul eax, ebx
|
|
imul ecx, ebx
|
|
add esi, eax
|
|
add edi, ecx
|
|
|
|
mov ebx, edx
|
|
jmp short bigslopeloop
|
|
ALIGN 16
|
|
bigslopeloop:
|
|
fst dword [fpuasm]
|
|
|
|
mov eax, dword [fpuasm]
|
|
add eax, eax
|
|
sbb edx, edx
|
|
mov ecx, eax
|
|
shr ecx, 24
|
|
and eax, 00ffe000h
|
|
shr eax, 11
|
|
sub cl, 2
|
|
mov eax, dword [reciptable+eax]
|
|
shr eax, cl
|
|
xor eax, edx
|
|
mov edx, dword [asm1]
|
|
mov ecx, dword [globalx3]
|
|
mov dword [asm1], eax
|
|
sub eax, edx
|
|
mov edx, dword [globaly3]
|
|
imul ecx, eax
|
|
imul eax, edx
|
|
|
|
fadd dword [asm2]
|
|
|
|
cmp ebx, BITSOFPRECISIONPOW
|
|
mov dword [asm4], ebx
|
|
mov cl, bl
|
|
jl short slopeskipmin
|
|
mov cl, BITSOFPRECISIONPOW
|
|
slopeskipmin:
|
|
|
|
;eax: yinc.............
|
|
;ebx: 0 0 0 ?
|
|
;ecx: xinc......... cnt
|
|
;edx: ?
|
|
;esi: xplc.............
|
|
;edi: yplc.............
|
|
;ebp: videopos
|
|
|
|
mov ebx, esi
|
|
mov edx, edi
|
|
|
|
beginnerslopeloop:
|
|
slopmach1: shr ebx, 20
|
|
add esi, ecx
|
|
slopmach2: shr edx, 26
|
|
slopmach7: and ebx, 88888888h
|
|
add edi, eax
|
|
slopmach5: add ebp, 88888888h ;pinc
|
|
slopmach3: mov dl, byte [ebx+edx+88888888h] ;ptr
|
|
slopmach4: mov ebx, dword [esp+88888888h]
|
|
sub esp, 4
|
|
dec cl
|
|
mov al, byte [ebx+edx] ;tptr
|
|
mov ebx, esi
|
|
mov [ebp], al
|
|
mov edx, edi
|
|
jnz short beginnerslopeloop
|
|
|
|
mov ebx, dword [asm4]
|
|
sub ebx, BITSOFPRECISIONPOW
|
|
jg near bigslopeloop
|
|
|
|
ffree st0
|
|
|
|
mov esp, dword [espbak]
|
|
mov ebp, dword [ebpbak]
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setuprhlineasm4:
|
|
CDECLBEGINSET 6
|
|
|
|
mov dword [rmach1a+2], eax
|
|
mov dword [rmach1b+2], eax
|
|
mov dword [rmach1c+2], eax
|
|
mov dword [rmach1d+2], eax
|
|
mov dword [rmach1e+2], eax
|
|
|
|
mov dword [rmach2a+2], ebx
|
|
mov dword [rmach2b+2], ebx
|
|
mov dword [rmach2c+2], ebx
|
|
mov dword [rmach2d+2], ebx
|
|
mov dword [rmach2e+2], ebx
|
|
|
|
mov dword [rmach3a+2], ecx
|
|
mov dword [rmach3b+2], ecx
|
|
mov dword [rmach3c+2], ecx
|
|
mov dword [rmach3d+2], ecx
|
|
mov dword [rmach3e+2], ecx
|
|
|
|
mov dword [rmach4a+2], edx
|
|
mov dword [rmach4b+2], edx
|
|
mov dword [rmach4c+2], edx
|
|
mov dword [rmach4d+2], edx
|
|
mov dword [rmach4e+2], edx
|
|
|
|
mov dword [rmach5a+2], esi
|
|
mov dword [rmach5b+2], esi
|
|
mov dword [rmach5c+2], esi
|
|
mov dword [rmach5d+2], esi
|
|
mov dword [rmach5e+2], esi
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
;Non power of 2, non masking, with palookup method #1 (6 clock cycles)
|
|
;eax: dat dat dat dat
|
|
;ebx: bufplc
|
|
;ecx: 0 dat
|
|
;edx: xlo
|
|
;esi: ylo
|
|
;edi: videopos/cnt
|
|
;ebp: tempvar
|
|
;esp:
|
|
ALIGN 16
|
|
rhlineasm4:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
|
|
cmp eax, 0
|
|
jle near endrhline
|
|
|
|
lea ebp, [edi-4]
|
|
sub ebp, eax
|
|
mov dword [rmach6a+2], ebp
|
|
add ebp, 3
|
|
mov dword [rmach6b+2], ebp
|
|
mov edi, eax
|
|
test edi, 3
|
|
jz short begrhline
|
|
jmp short startrhline1
|
|
|
|
ALIGN 16
|
|
startrhline1:
|
|
mov cl, byte [ebx] ;bufplc
|
|
rmach1e: sub edx, 88888888h ;xlo
|
|
sbb ebp, ebp
|
|
rmach2e: sub esi, 88888888h ;ylo
|
|
rmach3e: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
rmach4e: mov al, byte [ecx+88888888h] ;palookup
|
|
rmach5e: and ebp, 88888888h ;tilesizy
|
|
rmach6b: mov byte [edi+88888888h], al ;vidcntoffs
|
|
sub ebx, ebp
|
|
dec edi
|
|
test edi, 3
|
|
jnz short startrhline1
|
|
test edi, edi
|
|
jz near endrhline
|
|
|
|
begrhline:
|
|
mov cl, byte [ebx] ;bufplc
|
|
rmach1a: sub edx, 88888888h ;xlo
|
|
sbb ebp, ebp
|
|
rmach2a: sub esi, 88888888h ;ylo
|
|
rmach3a: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
rmach5a: and ebp, 88888888h ;tilesizy
|
|
sub ebx, ebp
|
|
|
|
rmach1b: sub edx, 88888888h ;xlo
|
|
sbb ebp, ebp
|
|
rmach4a: mov ah, byte [ecx+88888888h] ;palookup
|
|
mov cl, byte [ebx] ;bufplc
|
|
rmach2b: sub esi, 88888888h ;ylo
|
|
rmach3b: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
rmach5b: and ebp, 88888888h ;tilesizy
|
|
rmach4b: mov al, byte [ecx+88888888h] ;palookup
|
|
sub ebx, ebp
|
|
|
|
shl eax, 16
|
|
|
|
mov cl, byte [ebx] ;bufplc
|
|
rmach1c: sub edx, 88888888h ;xlo
|
|
sbb ebp, ebp
|
|
rmach2c: sub esi, 88888888h ;ylo
|
|
rmach3c: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
rmach5c: and ebp, 88888888h ;tilesizy
|
|
sub ebx, ebp
|
|
|
|
rmach1d: sub edx, 88888888h ;xlo
|
|
sbb ebp, ebp
|
|
rmach4c: mov ah, byte [ecx+88888888h] ;palookup
|
|
mov cl, byte [ebx] ;bufplc
|
|
rmach2d: sub esi, 88888888h ;ylo
|
|
rmach3d: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
rmach5d: and ebp, 88888888h ;tilesizy
|
|
rmach4d: mov al, byte [ecx+88888888h] ;palookup
|
|
sub ebx, ebp
|
|
|
|
rmach6a: mov dword [edi+88888888h], eax ;vidcntoffs
|
|
sub edi, 4
|
|
jnz near begrhline
|
|
endrhline:
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setuprmhlineasm4:
|
|
CDECLBEGINSET 6
|
|
mov dword [rmmach1+2], eax
|
|
mov dword [rmmach2+2], ebx
|
|
mov dword [rmmach3+2], ecx
|
|
mov dword [rmmach4+2], edx
|
|
mov dword [rmmach5+2], esi
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
rmhlineasm4:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
|
|
cmp eax, 0
|
|
jle short endrmhline
|
|
|
|
lea ebp, [edi-1]
|
|
sub ebp, eax
|
|
mov dword [rmmach6+2], ebp
|
|
mov edi, eax
|
|
jmp short begrmhline
|
|
|
|
ALIGN 16
|
|
begrmhline:
|
|
mov cl, byte [ebx] ;bufplc
|
|
rmmach1: sub edx, 88888888h ;xlo
|
|
sbb ebp, ebp
|
|
rmmach2: sub esi, 88888888h ;ylo
|
|
rmmach3: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
rmmach5: and ebp, 88888888h ;tilesizy
|
|
cmp cl, 255
|
|
je short rmskip
|
|
rmmach4: mov al, byte [ecx+88888888h] ;palookup
|
|
rmmach6: mov byte [edi+88888888h], al ;vidcntoffs
|
|
rmskip:
|
|
sub ebx, ebp
|
|
dec edi
|
|
jnz short begrmhline
|
|
endrmhline:
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
setupqrhlineasm4:
|
|
CDECLBEGINSET 6
|
|
|
|
mov dword [qrmach2e+2], ebx
|
|
mov dword [qrmach3e+2], ecx
|
|
xor edi, edi
|
|
sub edi, ecx
|
|
mov dword [qrmach7a+2], edi
|
|
mov dword [qrmach7b+2], edi
|
|
|
|
add ebx, ebx
|
|
adc ecx, ecx
|
|
mov dword [qrmach2a+2], ebx
|
|
mov dword [qrmach2b+2], ebx
|
|
mov dword [qrmach3a+2], ecx
|
|
mov dword [qrmach3b+2], ecx
|
|
|
|
mov dword [qrmach4a+2], edx
|
|
mov dword [qrmach4b+2], edx
|
|
mov dword [qrmach4c+2], edx
|
|
mov dword [qrmach4d+2], edx
|
|
mov dword [qrmach4e+2], edx
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
;Non power of 2, non masking, with palookup method (FASTER BUT NO SBB'S)
|
|
;eax: dat dat dat dat
|
|
;ebx: bufplc
|
|
;ecx: 0 dat
|
|
;edx: 0 dat
|
|
;esi: ylo
|
|
;edi: videopos/cnt
|
|
;ebp: ?
|
|
;esp:
|
|
ALIGN 16
|
|
qrhlineasm4:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
|
|
cmp eax, 0
|
|
jle near endqrhline
|
|
|
|
mov ebp, eax
|
|
test ebp, 3
|
|
jz short skipqrhline1
|
|
jmp short startqrhline1
|
|
|
|
ALIGN 16
|
|
startqrhline1:
|
|
mov cl, byte [ebx] ;bufplc
|
|
dec edi
|
|
qrmach2e: sub esi, 88888888h ;ylo
|
|
dec ebp
|
|
qrmach3e: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
qrmach4e: mov al, byte [ecx+88888888h] ;palookup
|
|
mov byte [edi], al ;vidcntoffs
|
|
test ebp, 3
|
|
jnz short startqrhline1
|
|
test ebp, ebp
|
|
jz short endqrhline
|
|
|
|
skipqrhline1:
|
|
mov cl, byte [ebx] ;bufplc
|
|
jmp short begqrhline
|
|
ALIGN 16
|
|
begqrhline:
|
|
qrmach7a: mov dl, byte [ebx+88888888h] ;bufplc
|
|
qrmach2a: sub esi, 88888888h ;ylo
|
|
qrmach3a: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
qrmach4a: mov ah, byte [ecx+88888888h] ;palookup
|
|
qrmach4b: mov al, byte [edx+88888888h] ;palookup
|
|
sub edi, 4
|
|
shl eax, 16
|
|
mov cl, byte [ebx] ;bufplc
|
|
qrmach7b: mov dl, byte [ebx+88888888h] ;bufplc
|
|
qrmach2b: sub esi, 88888888h ;ylo
|
|
qrmach3b: sbb ebx, 88888888h ;xhi*tilesizy + yhi+ycarry
|
|
qrmach4c: mov ah, byte [ecx+88888888h] ;palookup
|
|
qrmach4d: mov al, byte [edx+88888888h] ;palookup
|
|
mov cl, byte [ebx] ;bufplc
|
|
mov dword [edi], eax
|
|
sub ebp, 4
|
|
jnz short begqrhline
|
|
|
|
endqrhline:
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
setupdrawslab:
|
|
CDECLBEGINSET 2
|
|
|
|
mov dword [voxbpl1+2], eax
|
|
mov dword [voxbpl2+2], eax
|
|
mov dword [voxbpl3+2], eax
|
|
mov dword [voxbpl4+2], eax
|
|
mov dword [voxbpl5+2], eax
|
|
mov dword [voxbpl6+2], eax
|
|
mov dword [voxbpl7+2], eax
|
|
mov dword [voxbpl8+2], eax
|
|
|
|
mov dword [voxpal1+2], ebx
|
|
mov dword [voxpal2+2], ebx
|
|
mov dword [voxpal3+2], ebx
|
|
mov dword [voxpal4+2], ebx
|
|
mov dword [voxpal5+2], ebx
|
|
mov dword [voxpal6+2], ebx
|
|
mov dword [voxpal7+2], ebx
|
|
mov dword [voxpal8+2], ebx
|
|
|
|
CDECLENDSET 2
|
|
ret
|
|
|
|
|
|
ALIGN 16
|
|
drawslab:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
cmp eax, 2
|
|
je near voxbegdraw2
|
|
ja near voxskip2
|
|
xor eax, eax
|
|
voxbegdraw1:
|
|
mov ebp, ebx
|
|
shr ebp, 16
|
|
add ebx, edx
|
|
dec ecx
|
|
mov al, byte [esi+ebp]
|
|
voxpal1: mov al, byte [eax+88888888h]
|
|
mov byte [edi], al
|
|
voxbpl1: lea edi, [edi+88888888h]
|
|
jnz near voxbegdraw1
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
voxbegdraw2:
|
|
mov ebp, ebx
|
|
shr ebp, 16
|
|
add ebx, edx
|
|
xor eax, eax
|
|
dec ecx
|
|
mov al, byte [esi+ebp]
|
|
voxpal2: mov al, byte [eax+88888888h]
|
|
mov ah, al
|
|
mov word [edi], ax
|
|
voxbpl2: lea edi, [edi+88888888h]
|
|
jnz near voxbegdraw2
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
voxskip2:
|
|
cmp eax, 4
|
|
jne near voxskip4
|
|
xor eax, eax
|
|
voxbegdraw4:
|
|
mov ebp, ebx
|
|
add ebx, edx
|
|
shr ebp, 16
|
|
xor eax, eax
|
|
mov al, byte [esi+ebp]
|
|
voxpal3: mov al, byte [eax+88888888h]
|
|
mov ah, al
|
|
shl eax, 8
|
|
mov al, ah
|
|
shl eax, 8
|
|
mov al, ah
|
|
mov dword [edi], eax
|
|
voxbpl3: add edi, 88888888h
|
|
dec ecx
|
|
jnz near voxbegdraw4
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
voxskip4:
|
|
add eax, edi
|
|
|
|
test edi, 1
|
|
jz near voxskipslab1
|
|
cmp edi, eax
|
|
je near voxskipslab1
|
|
|
|
push eax
|
|
push ebx
|
|
push ecx
|
|
push edi
|
|
voxbegslab1:
|
|
mov ebp, ebx
|
|
add ebx, edx
|
|
shr ebp, 16
|
|
xor eax, eax
|
|
mov al, byte [esi+ebp]
|
|
voxpal4: mov al, byte [eax+88888888h]
|
|
mov byte [edi], al
|
|
voxbpl4: add edi, 88888888h
|
|
dec ecx
|
|
jnz near voxbegslab1
|
|
pop edi
|
|
pop ecx
|
|
pop ebx
|
|
pop eax
|
|
inc edi
|
|
|
|
voxskipslab1:
|
|
push eax
|
|
test edi, 2
|
|
jz near voxskipslab2
|
|
dec eax
|
|
cmp edi, eax
|
|
jge near voxskipslab2
|
|
|
|
push ebx
|
|
push ecx
|
|
push edi
|
|
voxbegslab2:
|
|
mov ebp, ebx
|
|
add ebx, edx
|
|
shr ebp, 16
|
|
xor eax, eax
|
|
mov al, byte [esi+ebp]
|
|
voxpal5: mov al, byte [eax+88888888h]
|
|
mov ah, al
|
|
mov word [edi], ax
|
|
voxbpl5: add edi, 88888888h
|
|
dec ecx
|
|
jnz near voxbegslab2
|
|
pop edi
|
|
pop ecx
|
|
pop ebx
|
|
add edi, 2
|
|
|
|
voxskipslab2:
|
|
mov eax, dword [esp]
|
|
|
|
sub eax, 3
|
|
cmp edi, eax
|
|
jge near voxskipslab3
|
|
|
|
voxprebegslab3:
|
|
push ebx
|
|
push ecx
|
|
push edi
|
|
voxbegslab3:
|
|
mov ebp, ebx
|
|
add ebx, edx
|
|
shr ebp, 16
|
|
xor eax, eax
|
|
mov al, byte [esi+ebp]
|
|
voxpal6: mov al, byte [eax+88888888h]
|
|
mov ah, al
|
|
shl eax, 8
|
|
mov al, ah
|
|
shl eax, 8
|
|
mov al, ah
|
|
mov dword [edi], eax
|
|
voxbpl6: add edi, 88888888h
|
|
dec ecx
|
|
jnz near voxbegslab3
|
|
pop edi
|
|
pop ecx
|
|
pop ebx
|
|
add edi, 4
|
|
|
|
mov eax, dword [esp]
|
|
|
|
sub eax, 3
|
|
cmp edi, eax
|
|
jl near voxprebegslab3
|
|
|
|
voxskipslab3:
|
|
mov eax, dword [esp]
|
|
|
|
dec eax
|
|
cmp edi, eax
|
|
jge near voxskipslab4
|
|
|
|
push ebx
|
|
push ecx
|
|
push edi
|
|
voxbegslab4:
|
|
mov ebp, ebx
|
|
add ebx, edx
|
|
shr ebp, 16
|
|
xor eax, eax
|
|
mov al, byte [esi+ebp]
|
|
voxpal7: mov al, byte [eax+88888888h]
|
|
mov ah, al
|
|
mov word [edi], ax
|
|
voxbpl7: add edi, 88888888h
|
|
dec ecx
|
|
jnz near voxbegslab4
|
|
pop edi
|
|
pop ecx
|
|
pop ebx
|
|
add edi, 2
|
|
|
|
voxskipslab4:
|
|
pop eax
|
|
|
|
cmp edi, eax
|
|
je near voxskipslab5
|
|
|
|
voxbegslab5:
|
|
mov ebp, ebx
|
|
add ebx, edx
|
|
shr ebp, 16
|
|
xor eax, eax
|
|
mov al, byte [esi+ebp]
|
|
voxpal8: mov al, byte [eax+88888888h]
|
|
mov byte [edi], al
|
|
voxbpl8: add edi, 88888888h
|
|
dec ecx
|
|
jnz near voxbegslab5
|
|
|
|
voxskipslab5:
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
|
|
|
|
%if 0 ; STRETCHHLINE is unused as of 2012-02-26
|
|
;modify: loinc
|
|
;eax: | dat | dat | dat | dat |
|
|
;ebx: | loplc1 |
|
|
;ecx: | loplc2 | cnthi | cntlo |
|
|
;edx: |--------|--------|--------| hiplc1 |
|
|
;esi: |--------|--------|--------| hiplc2 |
|
|
;edi: |--------|--------|--------| vidplc |
|
|
;ebp: |--------|--------|--------| hiinc |
|
|
|
|
stretchhline:
|
|
CDECLBEGINSET 6
|
|
|
|
push ebp
|
|
|
|
mov eax, ebx
|
|
shl ebx, 16
|
|
sar eax, 16
|
|
and ecx, 0000ffffh
|
|
or ecx, ebx
|
|
|
|
add esi, eax
|
|
mov eax, edx
|
|
mov edx, esi
|
|
|
|
mov ebp, eax
|
|
shl eax, 16
|
|
sar ebp, 16
|
|
|
|
add ecx, eax
|
|
adc esi, ebp
|
|
|
|
add eax, eax
|
|
adc ebp, ebp
|
|
mov dword [loinc1+2], eax
|
|
mov dword [loinc2+2], eax
|
|
mov dword [loinc3+2], eax
|
|
mov dword [loinc4+2], eax
|
|
|
|
inc ch
|
|
|
|
jmp begloop
|
|
|
|
begloop:
|
|
mov al, [edx]
|
|
loinc1: sub ebx, 88888888h
|
|
sbb edx, ebp
|
|
mov ah, [esi]
|
|
loinc2: sub ecx, 88888888h
|
|
sbb esi, ebp
|
|
sub edi, 4
|
|
shl eax, 16
|
|
loinc3: sub ebx, 88888888h
|
|
mov al, [edx]
|
|
sbb edx, ebp
|
|
mov ah, [esi]
|
|
loinc4: sub ecx, 88888888h
|
|
sbb esi, ebp
|
|
mov [edi], eax
|
|
dec cl
|
|
jnz begloop
|
|
dec ch
|
|
jnz begloop
|
|
|
|
pop ebp
|
|
|
|
CDECLENDSET 6
|
|
ret
|
|
%endif ; %if 0 of STRETCHHLINE
|
|
|
|
|
|
mmxoverlay:
|
|
push ebx ;JBF
|
|
push ecx ;JBF
|
|
push edx ;JBF
|
|
|
|
pushfd ;Check if CPUID is available
|
|
pop eax
|
|
mov ebx, eax
|
|
xor eax, 00200000h
|
|
push eax
|
|
popfd
|
|
pushfd
|
|
pop eax
|
|
cmp eax, ebx
|
|
je pentium
|
|
xor eax, eax
|
|
dw 0a20fh
|
|
test eax, eax
|
|
jz pentium
|
|
mov eax, 1
|
|
dw 0a20fh
|
|
and eax, 00000f00h
|
|
test edx, 00800000h ;Check if MMX is available
|
|
jz nommx
|
|
cmp eax, 00000600h ;Check if P6 Family or not
|
|
jae pentiumii
|
|
jmp pentiummmx
|
|
nommx:
|
|
cmp eax, 00000600h ;Check if P6 Family or not
|
|
jae pentiumpro
|
|
pentium:
|
|
|
|
pop edx ;JBF
|
|
pop ecx ;JBF
|
|
pop ebx ;JBF
|
|
ret
|
|
|
|
;+--------------------------------------------------------------+
|
|
;| PENTIUM II Overlays |
|
|
;+--------------------------------------------------------------+
|
|
pentiumii:
|
|
;Hline overlay (MMX doens't help)
|
|
mov byte [sethlinesizes], 0xe9
|
|
mov dword [sethlinesizes+1], (prosethlinesizes-sethlinesizes-5)
|
|
mov byte [setpalookupaddress], 0xe9
|
|
mov dword [setpalookupaddress+1], (prosetpalookupaddress-setpalookupaddress-5)
|
|
mov byte [setuphlineasm4], 0xc3 ;ret (no code required)
|
|
mov byte [hlineasm4], 0xe9
|
|
mov dword [hlineasm4+1], (prohlineasm4-hlineasm4-5)
|
|
|
|
;Vline overlay
|
|
mov byte [setupvlineasm], 0xe9
|
|
mov dword [setupvlineasm+1], (prosetupvlineasm-setupvlineasm-5)
|
|
mov byte [vlineasm4], 0xe9
|
|
mov dword [vlineasm4+1], (provlineasm4-vlineasm4-5)
|
|
|
|
pop edx ;JBF
|
|
pop ecx ;JBF
|
|
pop ebx ;JBF
|
|
ret
|
|
|
|
;+--------------------------------------------------------------+
|
|
;| PENTIUM MMX Overlays |
|
|
;+--------------------------------------------------------------+
|
|
pentiummmx:
|
|
pop edx ;JBF
|
|
pop ecx ;JBF
|
|
pop ebx ;JBF
|
|
ret
|
|
|
|
;+--------------------------------------------------------------+
|
|
;| PENTIUM PRO Overlays |
|
|
;+--------------------------------------------------------------+
|
|
pentiumpro:
|
|
;Hline overlay (MMX doens't help)
|
|
mov byte [sethlinesizes], 0xe9
|
|
mov dword [sethlinesizes+1], (prosethlinesizes-sethlinesizes-5)
|
|
mov byte [setpalookupaddress], 0xe9
|
|
mov dword [setpalookupaddress+1], (prosetpalookupaddress-setpalookupaddress-5)
|
|
mov byte [setuphlineasm4], 0xc3 ;ret (no code required)
|
|
mov byte [hlineasm4], 0xe9
|
|
mov dword [hlineasm4+1], (prohlineasm4-hlineasm4-5)
|
|
|
|
;Vline overlay
|
|
mov byte [setupvlineasm], 0xe9
|
|
mov dword [setupvlineasm+1], (prosetupvlineasm-setupvlineasm-5)
|
|
mov byte [vlineasm4], 0xe9
|
|
mov dword [vlineasm4+1], (provlineasm4-vlineasm4-5)
|
|
|
|
pop edx ;JBF
|
|
pop ecx ;JBF
|
|
pop ebx ;JBF
|
|
ret
|
|
|
|
dep_end:
|
|
|
|
%endif
|