optimize code

git-svn-id: svn://kolibrios.org@6847 a494cfbc-eb01-0410-851d-a64ba20cac60
This commit is contained in:
IgorA 2017-01-27 16:58:51 +00:00
parent 3cbf21dcbe
commit 9a9304d04f
5 changed files with 147 additions and 176 deletions

View File

@ -55,10 +55,10 @@ deflate_copyright db ' deflate 1.2.8 Copyright 1995-2013 Jean-loup Gailly and Ma
; Function prototypes. ; Function prototypes.
;enum block_state ;enum block_state
need_more equ 1 ;block not completed, need more input or more output need_more equ 0 ;block not completed, need more input or more output
block_done equ 2 ;block flush performed block_done equ 1 ;block flush performed
finish_started equ 3 ;finish started, need only more output at next deflate finish_started equ 2 ;finish started, need only more output at next deflate
finish_done equ 4 ;finish done, accept no more input or output finish_done equ 3 ;finish done, accept no more input or output
; =========================================================================== ; ===========================================================================
; Local data ; Local data
@ -154,24 +154,25 @@ macro INSERT_STRING s, str, match_head
movzx eax,byte[eax] movzx eax,byte[eax]
UPDATE_HASH s, [s+deflate_state.ins_h], eax UPDATE_HASH s, [s+deflate_state.ins_h], eax
mov eax,[s+deflate_state.ins_h] mov eax,[s+deflate_state.ins_h]
shl eax,2 shl eax,1
add eax,[s+deflate_state.head] add eax,[s+deflate_state.head]
mov eax,[eax] movzx eax,word[eax]
mov match_head,eax mov match_head,eax
if FASTEST eq 0
push ebx push ebx
if FASTEST eq 0
mov ebx,[s+deflate_state.w_mask] mov ebx,[s+deflate_state.w_mask]
and ebx,str and ebx,str
shl ebx,2 shl ebx,1
add ebx,[s+deflate_state.prev] add ebx,[s+deflate_state.prev]
mov [ebx],eax mov [ebx],ax
pop ebx
end if end if
mov eax,[s+deflate_state.ins_h] mov eax,[s+deflate_state.ins_h]
shl eax,2 shl eax,1
add eax,[s+deflate_state.head] add eax,[s+deflate_state.head]
push str mov ebx,str
pop dword[eax] mov [eax],bx
pop ebx
} }
; =========================================================================== ; ===========================================================================
@ -182,12 +183,12 @@ macro CLEAR_HASH s
{ {
;mov eax,[s+deflate_state.hash_size] ;mov eax,[s+deflate_state.hash_size]
;dec eax ;dec eax
;shl eax,2 ;shl eax,1
;add eax,[s+deflate_state.head] ;add eax,[s+deflate_state.head]
;mov dword[eax],NIL ;mov word[eax],NIL
mov eax,[s+deflate_state.hash_size] mov eax,[s+deflate_state.hash_size]
;dec eax ;dec eax
shl eax,2 ;sizeof(*s.head) shl eax,1 ;sizeof(*s.head)
stdcall zmemzero, [s+deflate_state.head], eax stdcall zmemzero, [s+deflate_state.head], eax
} }
@ -372,9 +373,9 @@ end if
ZALLOC ebx, [edi+deflate_state.w_size], 2 ;2*sizeof(Byte) ZALLOC ebx, [edi+deflate_state.w_size], 2 ;2*sizeof(Byte)
mov [edi+deflate_state.window],eax mov [edi+deflate_state.window],eax
ZALLOC ebx, [edi+deflate_state.w_size], 4 ;sizeof(Pos) ZALLOC ebx, [edi+deflate_state.w_size], 2 ;sizeof(Pos)
mov [edi+deflate_state.prev],eax mov [edi+deflate_state.prev],eax
ZALLOC ebx, [edi+deflate_state.hash_size], 4 ;sizeof(Pos) ZALLOC ebx, [edi+deflate_state.hash_size], 2 ;sizeof(Pos)
mov [edi+deflate_state.head],eax mov [edi+deflate_state.head],eax
mov dword[edi+deflate_state.high_water],0 ;nothing written to s->window yet mov dword[edi+deflate_state.high_water],0 ;nothing written to s->window yet
@ -522,19 +523,19 @@ endl
UPDATE_HASH edi, [edi+deflate_state.ins_h], eax UPDATE_HASH edi, [edi+deflate_state.ins_h], eax
if FASTEST eq 0 if FASTEST eq 0
mov edx,[edi+deflate_state.ins_h] mov edx,[edi+deflate_state.ins_h]
shl edx,2 shl edx,1
add edx,[edi+deflate_state.head] add edx,[edi+deflate_state.head]
mov edx,[edx] ;edx = s.head[s.ins_h] movzx edx,word[edx] ;edx = s.head[s.ins_h]
mov eax,esi mov eax,esi
and eax,[edi+deflate_state.w_mask] and eax,[edi+deflate_state.w_mask]
shl eax,2 shl eax,1
add eax,[edi+deflate_state.prev] add eax,[edi+deflate_state.prev]
mov [eax],edx mov [eax],dx
end if end if
mov edx,[edi+deflate_state.ins_h] mov edx,[edi+deflate_state.ins_h]
shl edx,2 shl edx,1
add edx,[edi+deflate_state.head] add edx,[edi+deflate_state.head]
mov [edx],esi ;s.head[s.ins_h] = str mov [edx],si ;s.head[s.ins_h] = str
inc esi inc esi
dec ecx dec ecx
jnz .cycle1 ;while (--..) jnz .cycle1 ;while (--..)
@ -940,14 +941,12 @@ endp
; to avoid allocating a large strm->next_out buffer and copying into it. ; to avoid allocating a large strm->next_out buffer and copying into it.
; (See also read_buf()). ; (See also read_buf()).
;void (strm) ;void (z_streamp strm)
; z_streamp strm align 16
align 4
proc flush_pending uses eax ebx ecx edx, strm:dword proc flush_pending uses eax ebx ecx edx, strm:dword
;ecx - len ;ecx - len
;edx - deflate_state *s ;edx - deflate_state *s
;ebx - strm ;ebx - strm
zlib_debug 'flush_pending'
mov ebx,[strm] mov ebx,[strm]
mov edx,[ebx+z_stream.state] mov edx,[ebx+z_stream.state]
@ -958,8 +957,8 @@ proc flush_pending uses eax ebx ecx edx, strm:dword
jle @f ;if (..>..) jle @f ;if (..>..)
mov ecx,eax mov ecx,eax
@@: @@:
cmp ecx,0 test ecx,ecx
je @f jz @f
stdcall zmemcpy, [ebx+z_stream.next_out], [edx+deflate_state.pending_out], ecx stdcall zmemcpy, [ebx+z_stream.next_out], [edx+deflate_state.pending_out], ecx
add [ebx+z_stream.next_out],ecx add [ebx+z_stream.next_out],ecx
@ -979,14 +978,13 @@ endp
;int (strm, flush) ;int (strm, flush)
; z_streamp strm ; z_streamp strm
; int flush ; int flush
align 4 align 16
proc deflate uses ebx ecx edx edi esi, strm:dword, flush:dword proc deflate uses ebx ecx edx edi esi, strm:dword, flush:dword
locals locals
old_flush dd ? ;int ;value of flush param for previous deflate call old_flush dd ? ;int ;value of flush param for previous deflate call
val dd ? val dd ?
endl endl
mov ebx,[strm] mov ebx,[strm]
zlib_debug 'deflate strm = %d',ebx
cmp ebx,Z_NULL cmp ebx,Z_NULL
je @f je @f
mov edi,[ebx+z_stream.state] ;s = strm.state mov edi,[ebx+z_stream.state] ;s = strm.state
@ -1180,6 +1178,7 @@ if GZIP eq 1
;esi = beg ;start of bytes to update crc ;esi = beg ;start of bytes to update crc
movzx ecx,word[edx+gz_header.extra_len] movzx ecx,word[edx+gz_header.extra_len]
align 4
.cycle0: ;while (..<..) .cycle0: ;while (..<..)
cmp dword[edi+deflate_state.gzindex],ecx cmp dword[edi+deflate_state.gzindex],ecx
jge .cycle0end jge .cycle0end
@ -1288,7 +1287,7 @@ if GZIP eq 1
mov dword[edi+deflate_state.status],COMMENT_STATE mov dword[edi+deflate_state.status],COMMENT_STATE
jmp .end6 jmp .end6
.end22: ;else .end22: ;else
mov dword[edi+deflate_state.status],COMMENT_STATE; mov dword[edi+deflate_state.status],COMMENT_STATE
.end6: .end6:
cmp dword[edi+deflate_state.status],COMMENT_STATE cmp dword[edi+deflate_state.status],COMMENT_STATE
jne .end7 ;if (..==..) jne .end7 ;if (..==..)
@ -1361,14 +1360,13 @@ if GZIP eq 1
mov ecx,[edi+deflate_state.pending] mov ecx,[edi+deflate_state.pending]
add ecx,2 add ecx,2
cmp ecx,[edi+deflate_state.pending_buf_size] cmp ecx,[edi+deflate_state.pending_buf_size]
jg @f ;if (..<=..) jg .end8 ;if (..<=..)
mov ecx,[ebx+z_stream.adler] mov ecx,[ebx+z_stream.adler]
put_byte edi, cl put_byte edi, cl
put_byte edi, ch put_byte edi, ch
xor eax,eax ;stdcall calc_crc32, 0, Z_NULL, 0 xor eax,eax ;stdcall calc_crc32, 0, Z_NULL, 0
mov [ebx+z_stream.adler],eax mov [ebx+z_stream.adler],eax
mov dword[edi+deflate_state.status],BUSY_STATE mov dword[edi+deflate_state.status],BUSY_STATE
@@:
jmp .end8 jmp .end8
.end9: ;else .end9: ;else
mov dword[edi+deflate_state.status],BUSY_STATE mov dword[edi+deflate_state.status],BUSY_STATE
@ -1390,11 +1388,10 @@ end if
mov dword[edi+deflate_state.last_flush],-1 mov dword[edi+deflate_state.last_flush],-1
mov eax,Z_OK mov eax,Z_OK
jmp .end_f jmp .end_f
@@:
; Make sure there is something to do and avoid duplicate consecutive ; Make sure there is something to do and avoid duplicate consecutive
; flushes. For repeated and useless calls with Z_FINISH, we keep ; flushes. For repeated and useless calls with Z_FINISH, we keep
; returning Z_STREAM_END instead of Z_BUF_ERROR. ; returning Z_STREAM_END instead of Z_BUF_ERROR.
jmp @f align 4
.end13: .end13:
cmp dword[ebx+z_stream.avail_in],0 cmp dword[ebx+z_stream.avail_in],0
jne @f jne @f
@ -1554,7 +1551,6 @@ endp
align 4 align 4
proc deflateEnd uses ebx ecx edx, strm:dword proc deflateEnd uses ebx ecx edx, strm:dword
mov ebx,[strm] mov ebx,[strm]
zlib_debug 'deflateEnd'
cmp ebx,Z_NULL cmp ebx,Z_NULL
je @f je @f
mov edx,[ebx+z_stream.state] mov edx,[ebx+z_stream.state]
@ -1644,9 +1640,9 @@ proc deflateCopy uses ebx edx edi esi, dest:dword, source:dword
ZALLOC edx, [edi+deflate_state.w_size], 2 ;2*sizeof.db ZALLOC edx, [edi+deflate_state.w_size], 2 ;2*sizeof.db
mov dword[edi+deflate_state.window],eax mov dword[edi+deflate_state.window],eax
ZALLOC edx, [edi+deflate_state.w_size], 4 ;sizeof.dd ZALLOC edx, [edi+deflate_state.w_size], 2 ;sizeof.dw
mov dword[edi+deflate_state.prev],eax mov dword[edi+deflate_state.prev],eax
ZALLOC edx, [edi+deflate_state.hash_size], 4 ;sizeof.dd ZALLOC edx, [edi+deflate_state.hash_size], 2 ;sizeof.dw
mov dword[edi+deflate_state.head],eax mov dword[edi+deflate_state.head],eax
ZALLOC edx, [edi+deflate_state.lit_bufsize], 4 ;sizeof.dw+2 ZALLOC edx, [edi+deflate_state.lit_bufsize], 4 ;sizeof.dw+2
mov ebx,eax mov ebx,eax
@ -1671,10 +1667,10 @@ proc deflateCopy uses ebx edx edi esi, dest:dword, source:dword
shl eax,1 ;*= 2*sizeof.db shl eax,1 ;*= 2*sizeof.db
stdcall zmemcpy, [edi+deflate_state.window], [esi+deflate_state.window], eax stdcall zmemcpy, [edi+deflate_state.window], [esi+deflate_state.window], eax
mov eax,[edi+deflate_state.w_size] mov eax,[edi+deflate_state.w_size]
shl eax,2 ;*= sizeof.dd shl eax,1 ;*= sizeof.dw
stdcall zmemcpy, [edi+deflate_state.prev], [esi+deflate_state.prev], eax stdcall zmemcpy, [edi+deflate_state.prev], [esi+deflate_state.prev], eax
mov eax,[edi+deflate_state.hash_size] mov eax,[edi+deflate_state.hash_size]
shl eax,2 ;*= sizeof.dd shl eax,1 ;*= sizeof.dw
stdcall zmemcpy, [edi+deflate_state.head], [esi+deflate_state.head], eax stdcall zmemcpy, [edi+deflate_state.head], [esi+deflate_state.head], eax
stdcall zmemcpy, [edi+deflate_state.pending_buf], [esi+deflate_state.pending_buf], [edi+deflate_state.pending_buf_size] stdcall zmemcpy, [edi+deflate_state.pending_buf], [esi+deflate_state.pending_buf], [edi+deflate_state.pending_buf_size]
@ -1715,7 +1711,7 @@ endp
; z_streamp strm ; z_streamp strm
; Bytef *buf ; Bytef *buf
; unsigned size ; unsigned size
align 4 align 16
proc read_buf uses ebx ecx, strm:dword, buf:dword, size:dword proc read_buf uses ebx ecx, strm:dword, buf:dword, size:dword
mov ebx,[strm] mov ebx,[strm]
mov eax,[ebx+z_stream.avail_in] mov eax,[ebx+z_stream.avail_in]
@ -1740,7 +1736,9 @@ proc read_buf uses ebx ecx, strm:dword, buf:dword, size:dword
stdcall adler32, [ebx+z_stream.adler], [buf], eax stdcall adler32, [ebx+z_stream.adler], [buf], eax
mov [ebx+z_stream.adler],eax mov [ebx+z_stream.adler],eax
pop eax pop eax
if GZIP eq 1
jmp .end0 jmp .end0
end if
@@: @@:
if GZIP eq 1 if GZIP eq 1
cmp dword[ecx+deflate_state.wrap],2 cmp dword[ecx+deflate_state.wrap],2
@ -1749,8 +1747,8 @@ if GZIP eq 1
stdcall calc_crc32, [ebx+z_stream.adler], [buf], eax stdcall calc_crc32, [ebx+z_stream.adler], [buf], eax
mov [ebx+z_stream.adler],eax mov [ebx+z_stream.adler],eax
pop eax pop eax
end if
.end0: .end0:
end if
add [ebx+z_stream.next_in],eax add [ebx+z_stream.next_in],eax
add [ebx+z_stream.total_in],eax add [ebx+z_stream.total_in],eax
@ -1761,9 +1759,8 @@ endp
; =========================================================================== ; ===========================================================================
; Initialize the "longest match" routines for a new zlib stream ; Initialize the "longest match" routines for a new zlib stream
;void (s) ;void (deflate_state *s)
; deflate_state *s align 16
align 4
proc lm_init uses eax ebx edi, s:dword proc lm_init uses eax ebx edi, s:dword
mov edi,[s] mov edi,[s]
mov eax,[edi+deflate_state.w_size] mov eax,[edi+deflate_state.w_size]
@ -1805,7 +1802,7 @@ endp
;uInt (s, cur_match) ;uInt (s, cur_match)
; deflate_state *s ; deflate_state *s
; IPos cur_match ;current match ; IPos cur_match ;current match
align 4 align 16
proc longest_match uses ebx ecx edx edi esi, s:dword, cur_match:dword proc longest_match uses ebx ecx edx edi esi, s:dword, cur_match:dword
if FASTEST eq 0 if FASTEST eq 0
; =========================================================================== ; ===========================================================================
@ -1984,9 +1981,9 @@ align 4
.cycle0cont: .cycle0cont:
mov eax,[cur_match] mov eax,[cur_match]
and eax,[wmask] and eax,[wmask]
shl eax,2 shl eax,1
add eax,[prev] add eax,[prev]
mov eax,[eax] ;eax = prev[cur_match & wmask] movzx eax,word[eax] ;eax = prev[cur_match & wmask]
mov [cur_match],eax mov [cur_match],eax
cmp eax,[limit] cmp eax,[limit]
jle .cycle0end jle .cycle0end
@ -2094,11 +2091,9 @@ align 4
@@: @@:
end if ;FASTEST end if ;FASTEST
.end_f: .end_f:
;zlib_debug ' longest_match.ret = %d',eax
ret ret
endp endp
; =========================================================================== ; ===========================================================================
; Check that the match at match_start is indeed a match. ; Check that the match at match_start is indeed a match.
@ -2127,7 +2122,6 @@ end if ;DEBUG
ret ret
endp endp
; =========================================================================== ; ===========================================================================
; Fill the window when the lookahead becomes insufficient. ; Fill the window when the lookahead becomes insufficient.
; Updates strstart and lookahead. ; Updates strstart and lookahead.
@ -2138,9 +2132,8 @@ endp
; performed for at least two bytes (required for the zip translate_eol ; performed for at least two bytes (required for the zip translate_eol
; option -- not supported here). ; option -- not supported here).
;void (s) ;void (deflate_state *s)
; deflate_state *s align 16
align 4
proc fill_window, s:dword proc fill_window, s:dword
pushad pushad
;esi = p, str, curr ;esi = p, str, curr
@ -2148,7 +2141,6 @@ pushad
;Объем свободного пространства в конце окна. ;Объем свободного пространства в конце окна.
;ecx = wsize ;uInt ;ecx = wsize ;uInt
;edx = s.strm ;edx = s.strm
zlib_debug 'fill_window'
mov edi,[s] mov edi,[s]
cmp dword[edi+deflate_state.lookahead],MIN_LOOKAHEAD cmp dword[edi+deflate_state.lookahead],MIN_LOOKAHEAD
jl @f jl @f
@ -2158,7 +2150,6 @@ pushad
mov ecx,[edi+deflate_state.w_size] mov ecx,[edi+deflate_state.w_size]
mov edx,[edi+deflate_state.strm] mov edx,[edi+deflate_state.strm]
.cycle0: ;do .cycle0: ;do
zlib_debug 'do'
mov ebx,[edi+deflate_state.window_size] mov ebx,[edi+deflate_state.window_size]
sub ebx,[edi+deflate_state.lookahead] sub ebx,[edi+deflate_state.lookahead]
sub ebx,[edi+deflate_state.strstart] sub ebx,[edi+deflate_state.strstart]
@ -2177,7 +2168,6 @@ pushad
sub [edi+deflate_state.match_start],ecx sub [edi+deflate_state.match_start],ecx
sub [edi+deflate_state.strstart],ecx ;we now have strstart >= MAX_DIST sub [edi+deflate_state.strstart],ecx ;we now have strstart >= MAX_DIST
sub [edi+deflate_state.block_start],ecx sub [edi+deflate_state.block_start],ecx
; Slide the hash table (could be avoided with 32 bit values ; Slide the hash table (could be avoided with 32 bit values
; at the expense of memory usage). We slide even when level == 0 ; at the expense of memory usage). We slide even when level == 0
; to keep the hash table consistent if we switch back to level > 0 ; to keep the hash table consistent if we switch back to level > 0
@ -2190,32 +2180,31 @@ pushad
mov ebx,ecx mov ebx,ecx
mov ecx,[edi+deflate_state.hash_size] mov ecx,[edi+deflate_state.hash_size]
mov esi,ecx mov esi,ecx
shl esi,2 shl esi,1
add esi,[edi+deflate_state.head] add esi,[edi+deflate_state.head]
.cycle1: ;do .cycle1: ;do
sub esi,4 sub esi,2
mov eax,[esi] movzx eax,word[esi]
mov dword[esi],NIL mov word[esi],NIL
cmp eax,ebx cmp eax,ebx
jl @f jl @f
sub eax,ebx sub eax,ebx
mov dword[esi],eax mov [esi],ax
@@: @@:
loop .cycle1 ;while (..) loop .cycle1 ;while (..)
if FASTEST eq 0 if FASTEST eq 0
mov ecx,ebx mov ecx,ebx
mov esi,ecx mov esi,ecx
shl esi,2 shl esi,1
add esi,[edi+deflate_state.prev] add esi,[edi+deflate_state.prev]
.cycle2: ;do .cycle2: ;do
sub esi,4 sub esi,2
mov eax,[esi] movzx eax,word[esi]
mov dword[esi],NIL mov word[esi],NIL
cmp eax,ebx cmp eax,ebx
jl @f jl @f
sub eax,ebx sub eax,ebx
mov dword[esi],eax mov [esi],ax
@@: @@:
; If n is not on any hash chain, prev[n] is garbage but ; If n is not on any hash chain, prev[n] is garbage but
; its value will never be used. ; its value will never be used.
@ -2276,21 +2265,21 @@ end if
UPDATE_HASH edi, [edi+deflate_state.ins_h], eax UPDATE_HASH edi, [edi+deflate_state.ins_h], eax
if FASTEST eq 0 if FASTEST eq 0
mov eax,[edi+deflate_state.ins_h] mov eax,[edi+deflate_state.ins_h]
shl eax,2 shl eax,1
add eax,[edi+deflate_state.head] add eax,[edi+deflate_state.head]
push ebx push ebx
mov ebx,[edi+deflate_state.w_mask] mov ebx,[edi+deflate_state.w_mask]
and ebx,esi and ebx,esi
shl ebx,2 shl ebx,1
add ebx,[edi+deflate_state.prev] add ebx,[edi+deflate_state.prev]
mov eax,[eax] mov ax,[eax]
mov [ebx],eax mov [ebx],ax
pop ebx pop ebx
end if end if
mov eax,[edi+deflate_state.ins_h] mov eax,[edi+deflate_state.ins_h]
shl eax,2 shl eax,1
add eax,[edi+deflate_state.head] add eax,[edi+deflate_state.head]
mov [eax],esi mov [eax],si
inc esi inc esi
dec dword[edi+deflate_state.insert] dec dword[edi+deflate_state.insert]
mov eax,[edi+deflate_state.lookahead] mov eax,[edi+deflate_state.lookahead]
@ -2385,7 +2374,7 @@ local .end0
sub eax,[s+deflate_state.block_start] sub eax,[s+deflate_state.block_start]
push eax push eax
xor eax,eax xor eax,eax
cmp dword[s+deflate_state.block_start],0 cmp [s+deflate_state.block_start],eax
jl .end0 jl .end0
mov eax,[s+deflate_state.block_start] mov eax,[s+deflate_state.block_start]
add eax,[s+deflate_state.window] add eax,[s+deflate_state.window]
@ -2431,7 +2420,6 @@ proc deflate_stored uses ebx ecx edi, s:dword, flush:dword
; Stored blocks are limited to 0xffff bytes, pending_buf is limited ; Stored blocks are limited to 0xffff bytes, pending_buf is limited
; to pending_buf_size, and each stored block has a 5 byte header: ; to pending_buf_size, and each stored block has a 5 byte header:
mov edi,[s] mov edi,[s]
zlib_debug 'deflate_stored'
mov ecx,0xffff mov ecx,0xffff
mov eax,[edi+deflate_state.pending_buf_size] mov eax,[edi+deflate_state.pending_buf_size]
@ -2443,7 +2431,7 @@ proc deflate_stored uses ebx ecx edi, s:dword, flush:dword
; Copy as much as possible from input to output: ; Copy as much as possible from input to output:
align 4 align 4
.cycle0: ;for (;;) { .cycle0: ;for (;;)
; Fill the window as much as possible: ; Fill the window as much as possible:
cmp dword[edi+deflate_state.lookahead],1 cmp dword[edi+deflate_state.lookahead],1
jg .end0 ;if (..<=..) jg .end0 ;if (..<=..)
@ -2531,7 +2519,6 @@ locals
endl endl
;ecx = hash_head ;IPos ;head of the hash chain ;ecx = hash_head ;IPos ;head of the hash chain
mov edi,[s] mov edi,[s]
zlib_debug 'deflate_fast'
.cycle0: ;for (..) .cycle0: ;for (..)
; Make sure that we always have enough lookahead, except ; Make sure that we always have enough lookahead, except
@ -2686,7 +2673,6 @@ locals
endl endl
;ecx = hash_head ;IPos ;head of the hash chain ;ecx = hash_head ;IPos ;head of the hash chain
mov edi,[s] mov edi,[s]
zlib_debug 'deflate_slow'
; Process the input block. ; Process the input block.
.cycle0: ;for (;;) .cycle0: ;for (;;)
@ -2903,7 +2889,6 @@ locals
bflush dd ? ;int ;set if current block must be flushed bflush dd ? ;int ;set if current block must be flushed
endl endl
mov edx,[s] mov edx,[s]
zlib_debug 'deflate_rle'
align 4 align 4
.cycle0: ;for (;;) .cycle0: ;for (;;)
; Make sure that we always have enough lookahead, except ; Make sure that we always have enough lookahead, except
@ -3026,7 +3011,6 @@ locals
bflush dd ? ;int ;set if current block must be flushed bflush dd ? ;int ;set if current block must be flushed
endl endl
mov edi,[s] mov edi,[s]
zlib_debug 'deflate_huff'
align 4 align 4
.cycle0: ;for (;;) .cycle0: ;for (;;)
; Make sure that we have a literal to write. ; Make sure that we have a literal to write.

View File

@ -146,7 +146,9 @@ struct deflate_state ;internal_state
; levels >= 4. ; levels >= 4.
level dw ? ;int ;compression level (1..9) level dw ? ;int ;compression level (1..9)
rb 2 ;for align
strategy dw ? ;int ;favor or force Huffman coding strategy dw ? ;int ;favor or force Huffman coding
rb 2 ;for align
good_match dd ? ;uInt good_match dd ? ;uInt
; Use a faster search when the previous match is longer than this ; Use a faster search when the previous match is longer than this
@ -166,7 +168,7 @@ struct deflate_state ;internal_state
bl_count rw MAX_BITS+1 ;uint_16[] bl_count rw MAX_BITS+1 ;uint_16[]
; number of codes at each bit length for an optimal tree ; number of codes at each bit length for an optimal tree
heap rw 2*L_CODES+1 ;int[] ;heap used to build the Huffman trees heap rd 2*L_CODES+1 ;int[] ;heap used to build the Huffman trees
heap_len dd ? ;int ;number of elements in the heap heap_len dd ? ;int ;number of elements in the heap
heap_max dd ? ;int ;element of largest frequency heap_max dd ? ;int ;element of largest frequency
; The sons of heap[n] are heap[2*n] and heap[2*n+1]. heap[0] is not used. ; The sons of heap[n] are heap[2*n] and heap[2*n+1]. heap[0] is not used.
@ -209,11 +211,12 @@ struct deflate_state ;internal_state
insert dd ? ;uInt ;bytes at end of window left to insert insert dd ? ;uInt ;bytes at end of window left to insert
if DEBUG eq 1 if DEBUG eq 1
compressed_len dd ? ;ulg ;total bit length of compressed file mod 2^32 ;compressed_len dd ? ;ulg ;total bit length of compressed file mod 2^32
bits_sent dd ? ;ulg ;bit length of compressed data sent mod 2^32 ;bits_sent dd ? ;ulg ;bit length of compressed data sent mod 2^32
end if end if
bi_buf dw ? ;uint_16 bi_buf dw ? ;uint_16
rb 2 ;for align
; Output buffer. bits are inserted starting at the bottom (least ; Output buffer. bits are inserted starting at the bottom (least
; significant bits). ; significant bits).
@ -238,18 +241,17 @@ deflate_state.max_insert_length equ deflate_state.max_lazy_match
macro put_byte s, c macro put_byte s, c
{ {
movzx eax,word[s+deflate_state.pending] mov eax,[s+deflate_state.pending]
add eax,[s+deflate_state.pending_buf] add eax,[s+deflate_state.pending_buf]
mov byte[eax],c mov byte[eax],c
inc word[s+deflate_state.pending] inc dword[s+deflate_state.pending]
} }
macro put_dword s, d macro put_dword s, d
{ {
zlib_debug '(%d)',d mov eax,[s+deflate_state.pending]
movzx eax,word[s+deflate_state.pending]
add eax,[s+deflate_state.pending_buf] add eax,[s+deflate_state.pending_buf]
mov dword[eax],d mov dword[eax],d
add word[s+deflate_state.pending],4 add dword[s+deflate_state.pending],4
} }
MIN_LOOKAHEAD equ (MAX_MATCH+MIN_MATCH+1) MIN_LOOKAHEAD equ (MAX_MATCH+MIN_MATCH+1)
@ -305,8 +307,7 @@ end if
inc dword[s+deflate_state.last_lit] inc dword[s+deflate_state.last_lit]
and eax,0xff and eax,0xff
imul eax,sizeof.ct_data imul eax,sizeof.ct_data
add eax,s inc word[s+eax+deflate_state.dyn_ltree+Freq]
inc word[eax+deflate_state.dyn_ltree+Freq]
xor eax,eax xor eax,eax
mov ecx,[s+deflate_state.lit_bufsize] mov ecx,[s+deflate_state.lit_bufsize]
dec ecx dec ecx

View File

@ -172,7 +172,6 @@ macro put_short s, w
align 4 align 4
proc send_bits uses eax ecx edi, s:dword, value:dword, length:dword proc send_bits uses eax ecx edi, s:dword, value:dword, length:dword
; Tracevv((stderr," l %2d v %4x ", length, value)); ; Tracevv((stderr," l %2d v %4x ", length, value));
zlib_debug 'send_bits value = %d',[value]
;if DEBUG eq 1 ;if DEBUG eq 1
mov eax,[length] mov eax,[length]
cmp eax,0 cmp eax,0
@ -183,7 +182,7 @@ proc send_bits uses eax ecx edi, s:dword, value:dword, length:dword
zlib_assert 'invalid length' ;Assert(..>0 && ..<=15) zlib_assert 'invalid length' ;Assert(..>0 && ..<=15)
.end1: .end1:
mov edi,[s] mov edi,[s]
add [edi+deflate_state.bits_sent],eax ;;add [edi+deflate_state.bits_sent],eax
; If not enough room in bi_buf, use (valid) bits from bi_buf and ; If not enough room in bi_buf, use (valid) bits from bi_buf and
; (16 - bi_valid) bits from value, leaving (width - (16-bi_valid)) ; (16 - bi_valid) bits from value, leaving (width - (16-bi_valid))
@ -385,12 +384,10 @@ endp
; =========================================================================== ; ===========================================================================
; Initialize the tree data structures for a new zlib stream. ; Initialize the tree data structures for a new zlib stream.
;void (s) ;void (deflate_state* s)
; deflate_state* s
align 4 align 4
proc _tr_init uses eax edi, s:dword proc _tr_init uses eax edi, s:dword
mov edi,[s] mov edi,[s]
zlib_debug '_tr_init'
call tr_static_init call tr_static_init
mov eax,edi mov eax,edi
@ -421,8 +418,7 @@ endp
; =========================================================================== ; ===========================================================================
; Initialize a new block. ; Initialize a new block.
;void (s) ;void (deflate_state* s)
; deflate_state* s
align 4 align 4
proc init_block uses eax ecx edi, s:dword proc init_block uses eax ecx edi, s:dword
mov edi,[s] mov edi,[s]
@ -469,12 +465,12 @@ SMALLEST equ 1
macro pqremove s, tree, top macro pqremove s, tree, top
{ {
mov eax,s mov eax,s
add eax,deflate_state.heap+2*SMALLEST add eax,deflate_state.heap+4*SMALLEST
movzx top,word[eax] movzx top,word[eax]
push ebx push ebx
mov ebx,[s+deflate_state.heap_len] mov ebx,[s+deflate_state.heap_len]
mov bx,[s+deflate_state.heap+2*ebx] mov ebx,[s+deflate_state.heap+4*ebx]
mov word[eax],bx mov [eax],ebx
dec dword[s+deflate_state.heap_len] dec dword[s+deflate_state.heap_len]
pop ebx pop ebx
stdcall pqdownheap, s, tree, SMALLEST stdcall pqdownheap, s, tree, SMALLEST
@ -488,20 +484,20 @@ macro smaller tree, n, m, depth, m_end
{ {
;if (..<.. || (..==.. && depth[n] <= depth[m])) ;if (..<.. || (..==.. && depth[n] <= depth[m]))
local .end0 local .end0
movzx eax,n mov eax,n
imul eax,sizeof.ct_data imul eax,sizeof.ct_data
add eax,tree add eax,tree
mov ax,word[eax+Freq] mov ax,word[eax+Freq]
movzx ebx,m mov ebx,m
imul ebx,sizeof.ct_data imul ebx,sizeof.ct_data
add ebx,tree add ebx,tree
mov bx,word[ebx+Freq] mov bx,word[ebx+Freq]
cmp ax,bx cmp ax,bx
jl .end0 jl .end0
jne m_end jne m_end
movzx eax,n mov eax,n
mov al,byte[eax+depth] mov al,byte[eax+depth]
movzx ebx,m mov ebx,m
cmp al,byte[ebx+depth] cmp al,byte[ebx+depth]
jg m_end jg m_end
.end0: .end0:
@ -523,8 +519,7 @@ pushad
;ecx - v dw ;ecx - v dw
mov edi,[s] mov edi,[s]
mov esi,[k] mov esi,[k]
zlib_debug 'pqdownheap k = %d',esi mov ecx,[edi+deflate_state.heap+4*esi]
mov cx,[edi+deflate_state.heap+2*esi]
shl esi,1 shl esi,1
;esi = j ;left son of k ;esi = j ;left son of k
.cycle0: ;while (..<=..) .cycle0: ;while (..<=..)
@ -534,21 +529,21 @@ pushad
;;cmp esi,[edi+deflate_state.heap_len] ;;cmp esi,[edi+deflate_state.heap_len]
jge .end1 ;if (..<.. && jge .end1 ;if (..<.. &&
mov edx,esi mov edx,esi
shl edx,1 shl edx,2
add edx,edi add edx,edi
add edx,deflate_state.heap add edx,deflate_state.heap
smaller [tree], word[edx+2], word[edx], edi+deflate_state.depth, .end1 smaller [tree], dword[edx+4], dword[edx], edi+deflate_state.depth, .end1
inc esi inc esi
.end1: .end1:
; Exit if v is smaller than both sons ; Exit if v is smaller than both sons
mov dx,[edi+deflate_state.heap+2*esi] mov edx,[edi+deflate_state.heap+4*esi]
smaller [tree], cx, dx, edi+deflate_state.depth, .end2 smaller [tree], ecx, edx, edi+deflate_state.depth, .end2
jmp .cycle0end ;break jmp .cycle0end ;break
.end2: .end2:
; Exchange v with the smallest son ; Exchange v with the smallest son
;;mov dx,[edi+deflate_state.heap+2*esi] ;;mov dx,[edi+deflate_state.heap+2*esi]
mov eax,[k] mov eax,[k]
mov [edi+deflate_state.heap+2*eax],dx mov [edi+deflate_state.heap+4*eax],edx
mov [k],esi mov [k],esi
; And continue down the tree, setting j to the left son of k ; And continue down the tree, setting j to the left son of k
shl esi,1 shl esi,1
@ -556,7 +551,7 @@ pushad
align 4 align 4
.cycle0end: .cycle0end:
mov eax,[k] mov eax,[k]
mov [edi+deflate_state.heap+2*eax],cx mov [edi+deflate_state.heap+4*eax],ecx
popad popad
ret ret
endp endp
@ -591,7 +586,6 @@ locals
overflow dd 0 ;int ;number of elements with bit length too large overflow dd 0 ;int ;number of elements with bit length too large
endl endl
pushad pushad
zlib_debug 'gen_bitlen'
mov edi,[s] mov edi,[s]
mov edx,[desc] mov edx,[desc]
mov eax,[edx+tree_desc.dyn_tree] mov eax,[edx+tree_desc.dyn_tree]
@ -622,7 +616,7 @@ align 4
; overflow in the case of the bit length tree). ; overflow in the case of the bit length tree).
mov eax,[edi+deflate_state.heap_max] mov eax,[edi+deflate_state.heap_max]
movzx eax,word[edi+deflate_state.heap+2*eax] mov eax,[edi+deflate_state.heap+4*eax]
imul eax,sizeof.ct_data imul eax,sizeof.ct_data
add eax,[tree] add eax,[tree]
mov word[eax+Len],0 ;root of the heap mov word[eax+Len],0 ;root of the heap
@ -634,7 +628,7 @@ align 4
cmp dword[h],HEAP_SIZE cmp dword[h],HEAP_SIZE
jge .cycle1end ;for (..;..<..;..) jge .cycle1end ;for (..;..<..;..)
mov eax,[h] mov eax,[h]
movzx ecx,word[edi+deflate_state.heap+2*eax] mov ecx,[edi+deflate_state.heap+4*eax]
;ecx = n ;ecx = n
mov eax,sizeof.ct_data mov eax,sizeof.ct_data
imul eax,ecx imul eax,ecx
@ -752,7 +746,7 @@ align 4
je .cycle4end je .cycle4end
dec dword[h] dec dword[h]
mov eax,[h] mov eax,[h]
movzx eax,word[edi+deflate_state.heap+2*eax] mov eax,[edi+deflate_state.heap+4*eax]
mov [m],eax ;m = s.heap[--h] mov [m],eax ;m = s.heap[--h]
cmp eax,[max_code] cmp eax,[max_code]
jg .cycle4 ;if (..>..) continue jg .cycle4 ;if (..>..) continue
@ -804,7 +798,6 @@ locals
endl endl
; The distribution counts are first used to generate the code values ; The distribution counts are first used to generate the code values
; without bit reversal. ; without bit reversal.
zlib_debug 'gen_codes'
mov ebx,ebp mov ebx,ebp
sub ebx,2*(MAX_BITS+1) sub ebx,2*(MAX_BITS+1)
@ -912,7 +905,7 @@ endl
inc dword[edi+deflate_state.heap_len] inc dword[edi+deflate_state.heap_len]
mov eax,[edi+deflate_state.heap_len] mov eax,[edi+deflate_state.heap_len]
mov [max_code],ecx mov [max_code],ecx
mov [edi+deflate_state.heap+2*eax],cx mov dword[edi+deflate_state.heap+4*eax],ecx
mov byte[edi+deflate_state.depth+ecx],0 mov byte[edi+deflate_state.depth+ecx],0
jmp .end0 jmp .end0
align 4 align 4
@ -941,7 +934,7 @@ align 4
mov eax,[max_code] mov eax,[max_code]
@@: @@:
mov ecx,[edi+deflate_state.heap_len] mov ecx,[edi+deflate_state.heap_len]
mov [edi+deflate_state.heap+2*ecx],ax mov [edi+deflate_state.heap+4*ecx],eax
mov [node],eax mov [node],eax
imul eax,sizeof.ct_data imul eax,sizeof.ct_data
add eax,[tree] add eax,[tree]
@ -989,10 +982,10 @@ align 4
mov eax,[edi+deflate_state.heap_max] mov eax,[edi+deflate_state.heap_max]
dec eax dec eax
mov [edi+deflate_state.heap+2*eax],cx ;keep the nodes sorted by frequency mov [edi+deflate_state.heap+4*eax],ecx ;keep the nodes sorted by frequency
dec eax dec eax
mov [edi+deflate_state.heap_max],eax mov [edi+deflate_state.heap_max],eax
mov [edi+deflate_state.heap+2*eax],dx mov [edi+deflate_state.heap+4*eax],edx
; Create a new node father of n and m ; Create a new node father of n and m
;;mov edx,[m] ;;mov edx,[m]
@ -1040,16 +1033,16 @@ align 4
;end if ;end if
; and insert the new node in the heap ; and insert the new node in the heap
mov ecx,[node] mov ecx,[node]
mov [edi+deflate_state.heap+2*SMALLEST],cx mov [edi+deflate_state.heap+4*SMALLEST],ecx
inc dword[node] inc dword[node]
stdcall pqdownheap, edi, [tree], SMALLEST stdcall pqdownheap, edi, [tree], SMALLEST
cmp dword[edi+deflate_state.heap_len],2 cmp dword[edi+deflate_state.heap_len],2
jge .cycle3 ;while (..>=..) jge .cycle3 ;while (..>=..)
mov cx,[edi+deflate_state.heap+2*SMALLEST] mov ecx,[edi+deflate_state.heap+4*SMALLEST]
dec dword[edi+deflate_state.heap_max] dec dword[edi+deflate_state.heap_max]
mov eax,[edi+deflate_state.heap_max] mov eax,[edi+deflate_state.heap_max]
mov [edi+deflate_state.heap+2*eax],cx mov [edi+deflate_state.heap+4*eax],ecx
; At this point, the fields freq and dad are set. We can now ; At this point, the fields freq and dad are set. We can now
; generate the bit lengths. ; generate the bit lengths.
@ -1083,7 +1076,6 @@ locals
min_count dd 4 ;int ;min repeat count min_count dd 4 ;int ;min repeat count
endl endl
mov edi,[s] mov edi,[s]
zlib_debug 'scan_tree'
mov eax,[tree] mov eax,[tree]
movzx eax,word[eax+Len] movzx eax,word[eax+Len]
mov [nextlen],eax mov [nextlen],eax
@ -1204,7 +1196,6 @@ locals
min_count dd 4 ;int ;min repeat count min_count dd 4 ;int ;min repeat count
endl endl
mov edi,[s] mov edi,[s]
zlib_debug 'send_tree'
; *** tree[max_code+1].Len = -1 ;guard already set ; *** tree[max_code+1].Len = -1 ;guard already set
mov eax,[tree] mov eax,[tree]
movzx eax,word[eax+Len] movzx eax,word[eax+Len]
@ -1214,7 +1205,6 @@ endl
jnz .cycle0 ;if (..==0) jnz .cycle0 ;if (..==0)
mov dword[max_count],138 mov dword[max_count],138
mov dword[min_count],3 mov dword[min_count],3
align 4 align 4
.cycle0: ;for (..;..<=..;..) .cycle0: ;for (..;..<=..;..)
cmp ecx,[max_code] cmp ecx,[max_code]
@ -1322,8 +1312,7 @@ endp
; Construct the Huffman tree for the bit lengths and return the index in ; Construct the Huffman tree for the bit lengths and return the index in
; bl_order of the last bit length code to send. ; bl_order of the last bit length code to send.
;int (s) ;int (deflate_state* s)
; deflate_state* s
align 4 align 4
proc build_bl_tree uses edi, s:dword proc build_bl_tree uses edi, s:dword
locals locals
@ -1385,7 +1374,6 @@ endp
align 4 align 4
proc send_all_trees uses eax ebx ecx edi, s:dword, lcodes:dword, dcodes:dword, blcodes:dword proc send_all_trees uses eax ebx ecx edi, s:dword, lcodes:dword, dcodes:dword, blcodes:dword
;ecx = index in bl_order ;ecx = index in bl_order
zlib_debug 'send_all_trees'
cmp dword[lcodes],257 cmp dword[lcodes],257
jl @f jl @f
cmp dword[dcodes],1 cmp dword[dcodes],1
@ -1479,20 +1467,20 @@ endp
; =========================================================================== ; ===========================================================================
; Flush the bits in the bit buffer to pending output (leaves at most 7 bits) ; Flush the bits in the bit buffer to pending output (leaves at most 7 bits)
;void (s) ;void (deflate_state* s)
; deflate_state* s ;align 4
align 4 ;proc _tr_flush_bits, s:dword
proc _tr_flush_bits, s:dword ; stdcall bi_flush, [s]
stdcall bi_flush, [s] ; ret
ret ;endp
endp
_tr_flush_bits equ bi_flush
; =========================================================================== ; ===========================================================================
; Send one empty static block to give enough lookahead for inflate. ; Send one empty static block to give enough lookahead for inflate.
; This takes 10 bits, of which 7 may remain in the bit buffer. ; This takes 10 bits, of which 7 may remain in the bit buffer.
;void (s) ;void (deflate_state* s)
; deflate_state* s
align 4 align 4
proc _tr_align uses edi, s:dword proc _tr_align uses edi, s:dword
mov edi,[s] mov edi,[s]
@ -1523,7 +1511,6 @@ locals
endl endl
; Build the Huffman trees unless a stored block is forced ; Build the Huffman trees unless a stored block is forced
mov edi,[s] mov edi,[s]
zlib_debug '_tr_flush_block'
cmp word[edi+deflate_state.level],0 cmp word[edi+deflate_state.level],0
jle .end0 ;if (..>0) jle .end0 ;if (..>0)
@ -1728,10 +1715,9 @@ if TRUNCATE_BLOCK eq 1
; Try to guess if it is profitable to stop the current block here ; Try to guess if it is profitable to stop the current block here
mov eax,[edi+deflate_state.last_lit] mov eax,[edi+deflate_state.last_lit]
and eax,0x1fff and eax,0x1fff
cmp eax,0 jnz .end1
jne .end1
cmp word[edi+deflate_state.level],2 cmp word[edi+deflate_state.level],2
jle .end1 ;if (..==.. && ..>..) jle .end1 ;if (..==0 && ..>..)
; Compute an upper bound for the compressed length ; Compute an upper bound for the compressed length
; ulg out_length = (ulg)s->last_lit*8L; ; ulg out_length = (ulg)s->last_lit*8L;
; ulg in_length = (ulg)((long)s->strstart - s->block_start); ; ulg in_length = (ulg)((long)s->strstart - s->block_start);
@ -1775,7 +1761,6 @@ locals
lc dd ? ;int ;match length or unmatched char (if dist == 0) lc dd ? ;int ;match length or unmatched char (if dist == 0)
lx dd 0 ;unsigned ;running index in l_buf lx dd 0 ;unsigned ;running index in l_buf
u_code dd ? ;unsigned ;the code to send u_code dd ? ;unsigned ;the code to send
extra dd ? ;int ;number of extra bits to send
endl endl
mov edi,[s] mov edi,[s]
cmp dword[edi+deflate_state.last_lit],0 cmp dword[edi+deflate_state.last_lit],0
@ -1805,18 +1790,14 @@ endl
add eax,LITERALS+1 add eax,LITERALS+1
send_code edi, eax, [ltree] ;send the length code send_code edi, eax, [ltree] ;send the length code
mov eax,[u_code] mov eax,[u_code]
shl eax,2 mov eax,[4*eax+extra_lbits]
add eax,extra_lbits test eax,eax
mov eax,[eax] jz @f ;if (..!=0)
mov [extra],eax push eax ;extra
cmp eax,0
je @f ;if (..!=0)
mov eax,[u_code] mov eax,[u_code]
shl eax,2 mov eax,[4*eax+base_length]
add eax,base_length
mov eax,[eax]
sub [lc],eax sub [lc],eax
stdcall send_bits, edi, [lc], [extra] ;send the extra length bits stdcall send_bits, edi, [lc] ;, ... ;send the extra length bits
@@: @@:
dec dword[dist] ;dist is now the match distance - 1 dec dword[dist] ;dist is now the match distance - 1
d_code [dist] d_code [dist]
@ -1827,18 +1808,14 @@ endl
@@: @@:
send_code edi, [u_code], [dtree] ;send the distance code send_code edi, [u_code], [dtree] ;send the distance code
mov eax,[u_code] mov eax,[u_code]
shl eax,2 mov eax,[4*eax+extra_dbits]
add eax,extra_dbits test eax,eax
mov eax,[eax] jz .end1 ;if (..!=0)
mov [extra],eax push eax ;extra
cmp eax,0
je .end1 ;if (..!=0)
mov eax,[u_code] mov eax,[u_code]
shl eax,2 mov eax,[4*eax+base_dist]
add eax,base_dist
mov eax,[eax]
sub [dist],eax sub [dist],eax
stdcall send_bits, edi, [dist], [extra] ;send the extra distance bits stdcall send_bits, edi, [dist] ;, ... ;send the extra distance bits
.end1: ;literal or match pair ? .end1: ;literal or match pair ?
; Check that the overlay between pending_buf and d_buf+l_buf is ok: ; Check that the overlay between pending_buf and d_buf+l_buf is ok:
@ -1954,7 +1931,6 @@ endp
; int len ;its bit length ; int len ;its bit length
align 4 align 4
proc bi_reverse uses ebx, p1code:dword, len:dword proc bi_reverse uses ebx, p1code:dword, len:dword
zlib_debug 'bi_reverse'
xor eax,eax xor eax,eax
@@: ;do @@: ;do
mov ebx,[p1code] mov ebx,[p1code]
@ -1998,8 +1974,7 @@ endp
; =========================================================================== ; ===========================================================================
; Flush the bit buffer and align the output on a byte boundary ; Flush the bit buffer and align the output on a byte boundary
;void (s) ;void (deflate_state* s)
; deflate_state* s
align 4 align 4
proc bi_windup uses eax ecx edi, s:dword proc bi_windup uses eax ecx edi, s:dword
mov edi,[s] mov edi,[s]

View File

@ -26,6 +26,7 @@ macro zlib_assert fmt,p1
{ {
local .end_t local .end_t
local .m_fmt local .m_fmt
pushf
jmp .end_t jmp .end_t
.m_fmt db fmt,13,10,0 .m_fmt db fmt,13,10,0
align 4 align 4
@ -35,6 +36,7 @@ if p1 eq
else else
stdcall str_format_dbg, buf_param,.m_fmt,p1 stdcall str_format_dbg, buf_param,.m_fmt,p1
end if end if
popf
} }
include 'zlib.inc' include 'zlib.inc'

View File

@ -137,14 +137,23 @@ endp
align 4 align 4
proc zmemcpy uses ecx edi esi, dest:dword, source:dword, len:dword proc zmemcpy uses ecx edi esi, dest:dword, source:dword, len:dword
mov ecx,[len] mov ecx,[len]
cmp ecx,0 test ecx,ecx
jle @f jz .end0
mov edi,[dest] mov edi,[dest]
mov esi,[source] mov esi,[source]
rep movsb bt ecx,0 ;кратно 2 ?
jmp .end0 jnc @f
@@: rep movsb
zlib_debug 'zmemcpy size = %d',ecx jmp .end0
@@:
bt ecx,1 ;кратно 4 ?
jnc @f
shr ecx,1
rep movsw
jmp .end0
@@:
shr ecx,2
rep movsd
.end0: .end0:
ret ret
endp endp