forked from KolibriOS/kolibrios
optimize code
git-svn-id: svn://kolibrios.org@6847 a494cfbc-eb01-0410-851d-a64ba20cac60
This commit is contained in:
parent
3cbf21dcbe
commit
9a9304d04f
@ -55,10 +55,10 @@ deflate_copyright db ' deflate 1.2.8 Copyright 1995-2013 Jean-loup Gailly and Ma
|
||||
; Function prototypes.
|
||||
|
||||
;enum block_state
|
||||
need_more equ 1 ;block not completed, need more input or more output
|
||||
block_done equ 2 ;block flush performed
|
||||
finish_started equ 3 ;finish started, need only more output at next deflate
|
||||
finish_done equ 4 ;finish done, accept no more input or output
|
||||
need_more equ 0 ;block not completed, need more input or more output
|
||||
block_done equ 1 ;block flush performed
|
||||
finish_started equ 2 ;finish started, need only more output at next deflate
|
||||
finish_done equ 3 ;finish done, accept no more input or output
|
||||
|
||||
; ===========================================================================
|
||||
; Local data
|
||||
@ -154,24 +154,25 @@ macro INSERT_STRING s, str, match_head
|
||||
movzx eax,byte[eax]
|
||||
UPDATE_HASH s, [s+deflate_state.ins_h], eax
|
||||
mov eax,[s+deflate_state.ins_h]
|
||||
shl eax,2
|
||||
shl eax,1
|
||||
add eax,[s+deflate_state.head]
|
||||
mov eax,[eax]
|
||||
movzx eax,word[eax]
|
||||
mov match_head,eax
|
||||
if FASTEST eq 0
|
||||
push ebx
|
||||
if FASTEST eq 0
|
||||
mov ebx,[s+deflate_state.w_mask]
|
||||
and ebx,str
|
||||
shl ebx,2
|
||||
shl ebx,1
|
||||
add ebx,[s+deflate_state.prev]
|
||||
mov [ebx],eax
|
||||
pop ebx
|
||||
mov [ebx],ax
|
||||
|
||||
end if
|
||||
mov eax,[s+deflate_state.ins_h]
|
||||
shl eax,2
|
||||
shl eax,1
|
||||
add eax,[s+deflate_state.head]
|
||||
push str
|
||||
pop dword[eax]
|
||||
mov ebx,str
|
||||
mov [eax],bx
|
||||
pop ebx
|
||||
}
|
||||
|
||||
; ===========================================================================
|
||||
@ -182,12 +183,12 @@ macro CLEAR_HASH s
|
||||
{
|
||||
;mov eax,[s+deflate_state.hash_size]
|
||||
;dec eax
|
||||
;shl eax,2
|
||||
;shl eax,1
|
||||
;add eax,[s+deflate_state.head]
|
||||
;mov dword[eax],NIL
|
||||
;mov word[eax],NIL
|
||||
mov eax,[s+deflate_state.hash_size]
|
||||
;dec eax
|
||||
shl eax,2 ;sizeof(*s.head)
|
||||
shl eax,1 ;sizeof(*s.head)
|
||||
stdcall zmemzero, [s+deflate_state.head], eax
|
||||
}
|
||||
|
||||
@ -372,9 +373,9 @@ end if
|
||||
|
||||
ZALLOC ebx, [edi+deflate_state.w_size], 2 ;2*sizeof(Byte)
|
||||
mov [edi+deflate_state.window],eax
|
||||
ZALLOC ebx, [edi+deflate_state.w_size], 4 ;sizeof(Pos)
|
||||
ZALLOC ebx, [edi+deflate_state.w_size], 2 ;sizeof(Pos)
|
||||
mov [edi+deflate_state.prev],eax
|
||||
ZALLOC ebx, [edi+deflate_state.hash_size], 4 ;sizeof(Pos)
|
||||
ZALLOC ebx, [edi+deflate_state.hash_size], 2 ;sizeof(Pos)
|
||||
mov [edi+deflate_state.head],eax
|
||||
|
||||
mov dword[edi+deflate_state.high_water],0 ;nothing written to s->window yet
|
||||
@ -522,19 +523,19 @@ endl
|
||||
UPDATE_HASH edi, [edi+deflate_state.ins_h], eax
|
||||
if FASTEST eq 0
|
||||
mov edx,[edi+deflate_state.ins_h]
|
||||
shl edx,2
|
||||
shl edx,1
|
||||
add edx,[edi+deflate_state.head]
|
||||
mov edx,[edx] ;edx = s.head[s.ins_h]
|
||||
movzx edx,word[edx] ;edx = s.head[s.ins_h]
|
||||
mov eax,esi
|
||||
and eax,[edi+deflate_state.w_mask]
|
||||
shl eax,2
|
||||
shl eax,1
|
||||
add eax,[edi+deflate_state.prev]
|
||||
mov [eax],edx
|
||||
mov [eax],dx
|
||||
end if
|
||||
mov edx,[edi+deflate_state.ins_h]
|
||||
shl edx,2
|
||||
shl edx,1
|
||||
add edx,[edi+deflate_state.head]
|
||||
mov [edx],esi ;s.head[s.ins_h] = str
|
||||
mov [edx],si ;s.head[s.ins_h] = str
|
||||
inc esi
|
||||
dec ecx
|
||||
jnz .cycle1 ;while (--..)
|
||||
@ -940,14 +941,12 @@ endp
|
||||
; to avoid allocating a large strm->next_out buffer and copying into it.
|
||||
; (See also read_buf()).
|
||||
|
||||
;void (strm)
|
||||
; z_streamp strm
|
||||
align 4
|
||||
;void (z_streamp strm)
|
||||
align 16
|
||||
proc flush_pending uses eax ebx ecx edx, strm:dword
|
||||
;ecx - len
|
||||
;edx - deflate_state *s
|
||||
;ebx - strm
|
||||
zlib_debug 'flush_pending'
|
||||
mov ebx,[strm]
|
||||
mov edx,[ebx+z_stream.state]
|
||||
|
||||
@ -958,8 +957,8 @@ proc flush_pending uses eax ebx ecx edx, strm:dword
|
||||
jle @f ;if (..>..)
|
||||
mov ecx,eax
|
||||
@@:
|
||||
cmp ecx,0
|
||||
je @f
|
||||
test ecx,ecx
|
||||
jz @f
|
||||
|
||||
stdcall zmemcpy, [ebx+z_stream.next_out], [edx+deflate_state.pending_out], ecx
|
||||
add [ebx+z_stream.next_out],ecx
|
||||
@ -979,14 +978,13 @@ endp
|
||||
;int (strm, flush)
|
||||
; z_streamp strm
|
||||
; int flush
|
||||
align 4
|
||||
align 16
|
||||
proc deflate uses ebx ecx edx edi esi, strm:dword, flush:dword
|
||||
locals
|
||||
old_flush dd ? ;int ;value of flush param for previous deflate call
|
||||
val dd ?
|
||||
endl
|
||||
mov ebx,[strm]
|
||||
zlib_debug 'deflate strm = %d',ebx
|
||||
cmp ebx,Z_NULL
|
||||
je @f
|
||||
mov edi,[ebx+z_stream.state] ;s = strm.state
|
||||
@ -1180,6 +1178,7 @@ if GZIP eq 1
|
||||
;esi = beg ;start of bytes to update crc
|
||||
|
||||
movzx ecx,word[edx+gz_header.extra_len]
|
||||
align 4
|
||||
.cycle0: ;while (..<..)
|
||||
cmp dword[edi+deflate_state.gzindex],ecx
|
||||
jge .cycle0end
|
||||
@ -1288,7 +1287,7 @@ if GZIP eq 1
|
||||
mov dword[edi+deflate_state.status],COMMENT_STATE
|
||||
jmp .end6
|
||||
.end22: ;else
|
||||
mov dword[edi+deflate_state.status],COMMENT_STATE;
|
||||
mov dword[edi+deflate_state.status],COMMENT_STATE
|
||||
.end6:
|
||||
cmp dword[edi+deflate_state.status],COMMENT_STATE
|
||||
jne .end7 ;if (..==..)
|
||||
@ -1361,14 +1360,13 @@ if GZIP eq 1
|
||||
mov ecx,[edi+deflate_state.pending]
|
||||
add ecx,2
|
||||
cmp ecx,[edi+deflate_state.pending_buf_size]
|
||||
jg @f ;if (..<=..)
|
||||
jg .end8 ;if (..<=..)
|
||||
mov ecx,[ebx+z_stream.adler]
|
||||
put_byte edi, cl
|
||||
put_byte edi, ch
|
||||
xor eax,eax ;stdcall calc_crc32, 0, Z_NULL, 0
|
||||
mov [ebx+z_stream.adler],eax
|
||||
mov dword[edi+deflate_state.status],BUSY_STATE
|
||||
@@:
|
||||
jmp .end8
|
||||
.end9: ;else
|
||||
mov dword[edi+deflate_state.status],BUSY_STATE
|
||||
@ -1390,11 +1388,10 @@ end if
|
||||
mov dword[edi+deflate_state.last_flush],-1
|
||||
mov eax,Z_OK
|
||||
jmp .end_f
|
||||
@@:
|
||||
; Make sure there is something to do and avoid duplicate consecutive
|
||||
; flushes. For repeated and useless calls with Z_FINISH, we keep
|
||||
; returning Z_STREAM_END instead of Z_BUF_ERROR.
|
||||
jmp @f
|
||||
align 4
|
||||
.end13:
|
||||
cmp dword[ebx+z_stream.avail_in],0
|
||||
jne @f
|
||||
@ -1554,7 +1551,6 @@ endp
|
||||
align 4
|
||||
proc deflateEnd uses ebx ecx edx, strm:dword
|
||||
mov ebx,[strm]
|
||||
zlib_debug 'deflateEnd'
|
||||
cmp ebx,Z_NULL
|
||||
je @f
|
||||
mov edx,[ebx+z_stream.state]
|
||||
@ -1644,9 +1640,9 @@ proc deflateCopy uses ebx edx edi esi, dest:dword, source:dword
|
||||
|
||||
ZALLOC edx, [edi+deflate_state.w_size], 2 ;2*sizeof.db
|
||||
mov dword[edi+deflate_state.window],eax
|
||||
ZALLOC edx, [edi+deflate_state.w_size], 4 ;sizeof.dd
|
||||
ZALLOC edx, [edi+deflate_state.w_size], 2 ;sizeof.dw
|
||||
mov dword[edi+deflate_state.prev],eax
|
||||
ZALLOC edx, [edi+deflate_state.hash_size], 4 ;sizeof.dd
|
||||
ZALLOC edx, [edi+deflate_state.hash_size], 2 ;sizeof.dw
|
||||
mov dword[edi+deflate_state.head],eax
|
||||
ZALLOC edx, [edi+deflate_state.lit_bufsize], 4 ;sizeof.dw+2
|
||||
mov ebx,eax
|
||||
@ -1671,10 +1667,10 @@ proc deflateCopy uses ebx edx edi esi, dest:dword, source:dword
|
||||
shl eax,1 ;*= 2*sizeof.db
|
||||
stdcall zmemcpy, [edi+deflate_state.window], [esi+deflate_state.window], eax
|
||||
mov eax,[edi+deflate_state.w_size]
|
||||
shl eax,2 ;*= sizeof.dd
|
||||
shl eax,1 ;*= sizeof.dw
|
||||
stdcall zmemcpy, [edi+deflate_state.prev], [esi+deflate_state.prev], eax
|
||||
mov eax,[edi+deflate_state.hash_size]
|
||||
shl eax,2 ;*= sizeof.dd
|
||||
shl eax,1 ;*= sizeof.dw
|
||||
stdcall zmemcpy, [edi+deflate_state.head], [esi+deflate_state.head], eax
|
||||
stdcall zmemcpy, [edi+deflate_state.pending_buf], [esi+deflate_state.pending_buf], [edi+deflate_state.pending_buf_size]
|
||||
|
||||
@ -1715,7 +1711,7 @@ endp
|
||||
; z_streamp strm
|
||||
; Bytef *buf
|
||||
; unsigned size
|
||||
align 4
|
||||
align 16
|
||||
proc read_buf uses ebx ecx, strm:dword, buf:dword, size:dword
|
||||
mov ebx,[strm]
|
||||
mov eax,[ebx+z_stream.avail_in]
|
||||
@ -1740,7 +1736,9 @@ proc read_buf uses ebx ecx, strm:dword, buf:dword, size:dword
|
||||
stdcall adler32, [ebx+z_stream.adler], [buf], eax
|
||||
mov [ebx+z_stream.adler],eax
|
||||
pop eax
|
||||
if GZIP eq 1
|
||||
jmp .end0
|
||||
end if
|
||||
@@:
|
||||
if GZIP eq 1
|
||||
cmp dword[ecx+deflate_state.wrap],2
|
||||
@ -1749,8 +1747,8 @@ if GZIP eq 1
|
||||
stdcall calc_crc32, [ebx+z_stream.adler], [buf], eax
|
||||
mov [ebx+z_stream.adler],eax
|
||||
pop eax
|
||||
end if
|
||||
.end0:
|
||||
end if
|
||||
add [ebx+z_stream.next_in],eax
|
||||
add [ebx+z_stream.total_in],eax
|
||||
|
||||
@ -1761,9 +1759,8 @@ endp
|
||||
; ===========================================================================
|
||||
; Initialize the "longest match" routines for a new zlib stream
|
||||
|
||||
;void (s)
|
||||
; deflate_state *s
|
||||
align 4
|
||||
;void (deflate_state *s)
|
||||
align 16
|
||||
proc lm_init uses eax ebx edi, s:dword
|
||||
mov edi,[s]
|
||||
mov eax,[edi+deflate_state.w_size]
|
||||
@ -1805,7 +1802,7 @@ endp
|
||||
;uInt (s, cur_match)
|
||||
; deflate_state *s
|
||||
; IPos cur_match ;current match
|
||||
align 4
|
||||
align 16
|
||||
proc longest_match uses ebx ecx edx edi esi, s:dword, cur_match:dword
|
||||
if FASTEST eq 0
|
||||
; ===========================================================================
|
||||
@ -1984,9 +1981,9 @@ align 4
|
||||
.cycle0cont:
|
||||
mov eax,[cur_match]
|
||||
and eax,[wmask]
|
||||
shl eax,2
|
||||
shl eax,1
|
||||
add eax,[prev]
|
||||
mov eax,[eax] ;eax = prev[cur_match & wmask]
|
||||
movzx eax,word[eax] ;eax = prev[cur_match & wmask]
|
||||
mov [cur_match],eax
|
||||
cmp eax,[limit]
|
||||
jle .cycle0end
|
||||
@ -2094,11 +2091,9 @@ align 4
|
||||
@@:
|
||||
end if ;FASTEST
|
||||
.end_f:
|
||||
;zlib_debug ' longest_match.ret = %d',eax
|
||||
ret
|
||||
endp
|
||||
|
||||
|
||||
; ===========================================================================
|
||||
; Check that the match at match_start is indeed a match.
|
||||
|
||||
@ -2127,7 +2122,6 @@ end if ;DEBUG
|
||||
ret
|
||||
endp
|
||||
|
||||
|
||||
; ===========================================================================
|
||||
; Fill the window when the lookahead becomes insufficient.
|
||||
; Updates strstart and lookahead.
|
||||
@ -2138,9 +2132,8 @@ endp
|
||||
; performed for at least two bytes (required for the zip translate_eol
|
||||
; option -- not supported here).
|
||||
|
||||
;void (s)
|
||||
; deflate_state *s
|
||||
align 4
|
||||
;void (deflate_state *s)
|
||||
align 16
|
||||
proc fill_window, s:dword
|
||||
pushad
|
||||
;esi = p, str, curr
|
||||
@ -2148,7 +2141,6 @@ pushad
|
||||
;Amount of free space at the end of the window.
|
||||
;ecx = wsize ;uInt
|
||||
;edx = s.strm
|
||||
zlib_debug 'fill_window'
|
||||
mov edi,[s]
|
||||
cmp dword[edi+deflate_state.lookahead],MIN_LOOKAHEAD
|
||||
jl @f
|
||||
@ -2158,7 +2150,6 @@ pushad
|
||||
mov ecx,[edi+deflate_state.w_size]
|
||||
mov edx,[edi+deflate_state.strm]
|
||||
.cycle0: ;do
|
||||
zlib_debug 'do'
|
||||
mov ebx,[edi+deflate_state.window_size]
|
||||
sub ebx,[edi+deflate_state.lookahead]
|
||||
sub ebx,[edi+deflate_state.strstart]
|
||||
@ -2177,7 +2168,6 @@ pushad
|
||||
sub [edi+deflate_state.match_start],ecx
|
||||
sub [edi+deflate_state.strstart],ecx ;we now have strstart >= MAX_DIST
|
||||
sub [edi+deflate_state.block_start],ecx
|
||||
|
||||
; Slide the hash table (could be avoided with 32 bit values
|
||||
; at the expense of memory usage). We slide even when level == 0
|
||||
; to keep the hash table consistent if we switch back to level > 0
|
||||
@ -2190,32 +2180,31 @@ pushad
|
||||
mov ebx,ecx
|
||||
mov ecx,[edi+deflate_state.hash_size]
|
||||
mov esi,ecx
|
||||
shl esi,2
|
||||
shl esi,1
|
||||
add esi,[edi+deflate_state.head]
|
||||
.cycle1: ;do
|
||||
sub esi,4
|
||||
mov eax,[esi]
|
||||
mov dword[esi],NIL
|
||||
sub esi,2
|
||||
movzx eax,word[esi]
|
||||
mov word[esi],NIL
|
||||
cmp eax,ebx
|
||||
jl @f
|
||||
sub eax,ebx
|
||||
mov dword[esi],eax
|
||||
mov [esi],ax
|
||||
@@:
|
||||
loop .cycle1 ;while (..)
|
||||
|
||||
if FASTEST eq 0
|
||||
mov ecx,ebx
|
||||
mov esi,ecx
|
||||
shl esi,2
|
||||
shl esi,1
|
||||
add esi,[edi+deflate_state.prev]
|
||||
.cycle2: ;do
|
||||
sub esi,4
|
||||
mov eax,[esi]
|
||||
mov dword[esi],NIL
|
||||
sub esi,2
|
||||
movzx eax,word[esi]
|
||||
mov word[esi],NIL
|
||||
cmp eax,ebx
|
||||
jl @f
|
||||
sub eax,ebx
|
||||
mov dword[esi],eax
|
||||
mov [esi],ax
|
||||
@@:
|
||||
; If n is not on any hash chain, prev[n] is garbage but
|
||||
; its value will never be used.
|
||||
@ -2276,21 +2265,21 @@ end if
|
||||
UPDATE_HASH edi, [edi+deflate_state.ins_h], eax
|
||||
if FASTEST eq 0
|
||||
mov eax,[edi+deflate_state.ins_h]
|
||||
shl eax,2
|
||||
shl eax,1
|
||||
add eax,[edi+deflate_state.head]
|
||||
push ebx
|
||||
mov ebx,[edi+deflate_state.w_mask]
|
||||
and ebx,esi
|
||||
shl ebx,2
|
||||
shl ebx,1
|
||||
add ebx,[edi+deflate_state.prev]
|
||||
mov eax,[eax]
|
||||
mov [ebx],eax
|
||||
mov ax,[eax]
|
||||
mov [ebx],ax
|
||||
pop ebx
|
||||
end if
|
||||
mov eax,[edi+deflate_state.ins_h]
|
||||
shl eax,2
|
||||
shl eax,1
|
||||
add eax,[edi+deflate_state.head]
|
||||
mov [eax],esi
|
||||
mov [eax],si
|
||||
inc esi
|
||||
dec dword[edi+deflate_state.insert]
|
||||
mov eax,[edi+deflate_state.lookahead]
|
||||
@ -2385,7 +2374,7 @@ local .end0
|
||||
sub eax,[s+deflate_state.block_start]
|
||||
push eax
|
||||
xor eax,eax
|
||||
cmp dword[s+deflate_state.block_start],0
|
||||
cmp [s+deflate_state.block_start],eax
|
||||
jl .end0
|
||||
mov eax,[s+deflate_state.block_start]
|
||||
add eax,[s+deflate_state.window]
|
||||
@ -2431,7 +2420,6 @@ proc deflate_stored uses ebx ecx edi, s:dword, flush:dword
|
||||
; Stored blocks are limited to 0xffff bytes, pending_buf is limited
|
||||
; to pending_buf_size, and each stored block has a 5 byte header:
|
||||
mov edi,[s]
|
||||
zlib_debug 'deflate_stored'
|
||||
|
||||
mov ecx,0xffff
|
||||
mov eax,[edi+deflate_state.pending_buf_size]
|
||||
@ -2443,7 +2431,7 @@ proc deflate_stored uses ebx ecx edi, s:dword, flush:dword
|
||||
|
||||
; Copy as much as possible from input to output:
|
||||
align 4
|
||||
.cycle0: ;for (;;) {
|
||||
.cycle0: ;for (;;)
|
||||
; Fill the window as much as possible:
|
||||
cmp dword[edi+deflate_state.lookahead],1
|
||||
jg .end0 ;if (..<=..)
|
||||
@ -2531,7 +2519,6 @@ locals
|
||||
endl
|
||||
;ecx = hash_head ;IPos ;head of the hash chain
|
||||
mov edi,[s]
|
||||
zlib_debug 'deflate_fast'
|
||||
|
||||
.cycle0: ;for (..)
|
||||
; Make sure that we always have enough lookahead, except
|
||||
@ -2686,7 +2673,6 @@ locals
|
||||
endl
|
||||
;ecx = hash_head ;IPos ;head of the hash chain
|
||||
mov edi,[s]
|
||||
zlib_debug 'deflate_slow'
|
||||
|
||||
; Process the input block.
|
||||
.cycle0: ;for (;;)
|
||||
@ -2903,7 +2889,6 @@ locals
|
||||
bflush dd ? ;int ;set if current block must be flushed
|
||||
endl
|
||||
mov edx,[s]
|
||||
zlib_debug 'deflate_rle'
|
||||
align 4
|
||||
.cycle0: ;for (;;)
|
||||
; Make sure that we always have enough lookahead, except
|
||||
@ -3026,7 +3011,6 @@ locals
|
||||
bflush dd ? ;int ;set if current block must be flushed
|
||||
endl
|
||||
mov edi,[s]
|
||||
zlib_debug 'deflate_huff'
|
||||
align 4
|
||||
.cycle0: ;for (;;)
|
||||
; Make sure that we have a literal to write.
|
||||
|
@ -146,7 +146,9 @@ struct deflate_state ;internal_state
|
||||
; levels >= 4.
|
||||
|
||||
level dw ? ;int ;compression level (1..9)
|
||||
rb 2 ;for align
|
||||
strategy dw ? ;int ;favor or force Huffman coding
|
||||
rb 2 ;for align
|
||||
|
||||
good_match dd ? ;uInt
|
||||
; Use a faster search when the previous match is longer than this
|
||||
@ -166,7 +168,7 @@ struct deflate_state ;internal_state
|
||||
bl_count rw MAX_BITS+1 ;uint_16[]
|
||||
; number of codes at each bit length for an optimal tree
|
||||
|
||||
heap rw 2*L_CODES+1 ;int[] ;heap used to build the Huffman trees
|
||||
heap rd 2*L_CODES+1 ;int[] ;heap used to build the Huffman trees
|
||||
heap_len dd ? ;int ;number of elements in the heap
|
||||
heap_max dd ? ;int ;element of largest frequency
|
||||
; The sons of heap[n] are heap[2*n] and heap[2*n+1]. heap[0] is not used.
|
||||
@ -209,11 +211,12 @@ struct deflate_state ;internal_state
|
||||
insert dd ? ;uInt ;bytes at end of window left to insert
|
||||
|
||||
if DEBUG eq 1
|
||||
compressed_len dd ? ;ulg ;total bit length of compressed file mod 2^32
|
||||
bits_sent dd ? ;ulg ;bit length of compressed data sent mod 2^32
|
||||
;compressed_len dd ? ;ulg ;total bit length of compressed file mod 2^32
|
||||
;bits_sent dd ? ;ulg ;bit length of compressed data sent mod 2^32
|
||||
end if
|
||||
|
||||
bi_buf dw ? ;uint_16
|
||||
rb 2 ;for align
|
||||
; Output buffer. bits are inserted starting at the bottom (least
|
||||
; significant bits).
|
||||
|
||||
@ -238,18 +241,17 @@ deflate_state.max_insert_length equ deflate_state.max_lazy_match
|
||||
|
||||
macro put_byte s, c
|
||||
{
|
||||
movzx eax,word[s+deflate_state.pending]
|
||||
mov eax,[s+deflate_state.pending]
|
||||
add eax,[s+deflate_state.pending_buf]
|
||||
mov byte[eax],c
|
||||
inc word[s+deflate_state.pending]
|
||||
inc dword[s+deflate_state.pending]
|
||||
}
|
||||
macro put_dword s, d
|
||||
{
|
||||
zlib_debug '(%d)',d
|
||||
movzx eax,word[s+deflate_state.pending]
|
||||
mov eax,[s+deflate_state.pending]
|
||||
add eax,[s+deflate_state.pending_buf]
|
||||
mov dword[eax],d
|
||||
add word[s+deflate_state.pending],4
|
||||
add dword[s+deflate_state.pending],4
|
||||
}
|
||||
|
||||
MIN_LOOKAHEAD equ (MAX_MATCH+MIN_MATCH+1)
|
||||
@ -305,8 +307,7 @@ end if
|
||||
inc dword[s+deflate_state.last_lit]
|
||||
and eax,0xff
|
||||
imul eax,sizeof.ct_data
|
||||
add eax,s
|
||||
inc word[eax+deflate_state.dyn_ltree+Freq]
|
||||
inc word[s+eax+deflate_state.dyn_ltree+Freq]
|
||||
xor eax,eax
|
||||
mov ecx,[s+deflate_state.lit_bufsize]
|
||||
dec ecx
|
||||
|
@ -172,7 +172,6 @@ macro put_short s, w
|
||||
align 4
|
||||
proc send_bits uses eax ecx edi, s:dword, value:dword, length:dword
|
||||
; Tracevv((stderr," l %2d v %4x ", length, value));
|
||||
zlib_debug 'send_bits value = %d',[value]
|
||||
;if DEBUG eq 1
|
||||
mov eax,[length]
|
||||
cmp eax,0
|
||||
@ -183,7 +182,7 @@ proc send_bits uses eax ecx edi, s:dword, value:dword, length:dword
|
||||
zlib_assert 'invalid length' ;Assert(..>0 && ..<=15)
|
||||
.end1:
|
||||
mov edi,[s]
|
||||
add [edi+deflate_state.bits_sent],eax
|
||||
;;add [edi+deflate_state.bits_sent],eax
|
||||
|
||||
; If not enough room in bi_buf, use (valid) bits from bi_buf and
|
||||
; (16 - bi_valid) bits from value, leaving (width - (16-bi_valid))
|
||||
@ -385,12 +384,10 @@ endp
|
||||
; ===========================================================================
|
||||
; Initialize the tree data structures for a new zlib stream.
|
||||
|
||||
;void (s)
|
||||
; deflate_state* s
|
||||
;void (deflate_state* s)
|
||||
align 4
|
||||
proc _tr_init uses eax edi, s:dword
|
||||
mov edi,[s]
|
||||
zlib_debug '_tr_init'
|
||||
call tr_static_init
|
||||
|
||||
mov eax,edi
|
||||
@ -421,8 +418,7 @@ endp
|
||||
; ===========================================================================
|
||||
; Initialize a new block.
|
||||
|
||||
;void (s)
|
||||
; deflate_state* s
|
||||
;void (deflate_state* s)
|
||||
align 4
|
||||
proc init_block uses eax ecx edi, s:dword
|
||||
mov edi,[s]
|
||||
@ -469,12 +465,12 @@ SMALLEST equ 1
|
||||
macro pqremove s, tree, top
|
||||
{
|
||||
mov eax,s
|
||||
add eax,deflate_state.heap+2*SMALLEST
|
||||
add eax,deflate_state.heap+4*SMALLEST
|
||||
movzx top,word[eax]
|
||||
push ebx
|
||||
mov ebx,[s+deflate_state.heap_len]
|
||||
mov bx,[s+deflate_state.heap+2*ebx]
|
||||
mov word[eax],bx
|
||||
mov ebx,[s+deflate_state.heap+4*ebx]
|
||||
mov [eax],ebx
|
||||
dec dword[s+deflate_state.heap_len]
|
||||
pop ebx
|
||||
stdcall pqdownheap, s, tree, SMALLEST
|
||||
@ -488,20 +484,20 @@ macro smaller tree, n, m, depth, m_end
|
||||
{
|
||||
;if (..<.. || (..==.. && depth[n] <= depth[m]))
|
||||
local .end0
|
||||
movzx eax,n
|
||||
mov eax,n
|
||||
imul eax,sizeof.ct_data
|
||||
add eax,tree
|
||||
mov ax,word[eax+Freq]
|
||||
movzx ebx,m
|
||||
mov ebx,m
|
||||
imul ebx,sizeof.ct_data
|
||||
add ebx,tree
|
||||
mov bx,word[ebx+Freq]
|
||||
cmp ax,bx
|
||||
jl .end0
|
||||
jne m_end
|
||||
movzx eax,n
|
||||
mov eax,n
|
||||
mov al,byte[eax+depth]
|
||||
movzx ebx,m
|
||||
mov ebx,m
|
||||
cmp al,byte[ebx+depth]
|
||||
jg m_end
|
||||
.end0:
|
||||
@ -523,8 +519,7 @@ pushad
|
||||
;ecx - v dw
|
||||
mov edi,[s]
|
||||
mov esi,[k]
|
||||
zlib_debug 'pqdownheap k = %d',esi
|
||||
mov cx,[edi+deflate_state.heap+2*esi]
|
||||
mov ecx,[edi+deflate_state.heap+4*esi]
|
||||
shl esi,1
|
||||
;esi = j ;left son of k
|
||||
.cycle0: ;while (..<=..)
|
||||
@ -534,21 +529,21 @@ pushad
|
||||
;;cmp esi,[edi+deflate_state.heap_len]
|
||||
jge .end1 ;if (..<.. &&
|
||||
mov edx,esi
|
||||
shl edx,1
|
||||
shl edx,2
|
||||
add edx,edi
|
||||
add edx,deflate_state.heap
|
||||
smaller [tree], word[edx+2], word[edx], edi+deflate_state.depth, .end1
|
||||
smaller [tree], dword[edx+4], dword[edx], edi+deflate_state.depth, .end1
|
||||
inc esi
|
||||
.end1:
|
||||
; Exit if v is smaller than both sons
|
||||
mov dx,[edi+deflate_state.heap+2*esi]
|
||||
smaller [tree], cx, dx, edi+deflate_state.depth, .end2
|
||||
mov edx,[edi+deflate_state.heap+4*esi]
|
||||
smaller [tree], ecx, edx, edi+deflate_state.depth, .end2
|
||||
jmp .cycle0end ;break
|
||||
.end2:
|
||||
; Exchange v with the smallest son
|
||||
;;mov dx,[edi+deflate_state.heap+2*esi]
|
||||
mov eax,[k]
|
||||
mov [edi+deflate_state.heap+2*eax],dx
|
||||
mov [edi+deflate_state.heap+4*eax],edx
|
||||
mov [k],esi
|
||||
; And continue down the tree, setting j to the left son of k
|
||||
shl esi,1
|
||||
@ -556,7 +551,7 @@ pushad
|
||||
align 4
|
||||
.cycle0end:
|
||||
mov eax,[k]
|
||||
mov [edi+deflate_state.heap+2*eax],cx
|
||||
mov [edi+deflate_state.heap+4*eax],ecx
|
||||
popad
|
||||
ret
|
||||
endp
|
||||
@ -591,7 +586,6 @@ locals
|
||||
overflow dd 0 ;int ;number of elements with bit length too large
|
||||
endl
|
||||
pushad
|
||||
zlib_debug 'gen_bitlen'
|
||||
mov edi,[s]
|
||||
mov edx,[desc]
|
||||
mov eax,[edx+tree_desc.dyn_tree]
|
||||
@ -622,7 +616,7 @@ align 4
|
||||
; overflow in the case of the bit length tree).
|
||||
|
||||
mov eax,[edi+deflate_state.heap_max]
|
||||
movzx eax,word[edi+deflate_state.heap+2*eax]
|
||||
mov eax,[edi+deflate_state.heap+4*eax]
|
||||
imul eax,sizeof.ct_data
|
||||
add eax,[tree]
|
||||
mov word[eax+Len],0 ;root of the heap
|
||||
@ -634,7 +628,7 @@ align 4
|
||||
cmp dword[h],HEAP_SIZE
|
||||
jge .cycle1end ;for (..;..<..;..)
|
||||
mov eax,[h]
|
||||
movzx ecx,word[edi+deflate_state.heap+2*eax]
|
||||
mov ecx,[edi+deflate_state.heap+4*eax]
|
||||
;ecx = n
|
||||
mov eax,sizeof.ct_data
|
||||
imul eax,ecx
|
||||
@ -752,7 +746,7 @@ align 4
|
||||
je .cycle4end
|
||||
dec dword[h]
|
||||
mov eax,[h]
|
||||
movzx eax,word[edi+deflate_state.heap+2*eax]
|
||||
mov eax,[edi+deflate_state.heap+4*eax]
|
||||
mov [m],eax ;m = s.heap[--h]
|
||||
cmp eax,[max_code]
|
||||
jg .cycle4 ;if (..>..) continue
|
||||
@ -804,7 +798,6 @@ locals
|
||||
endl
|
||||
; The distribution counts are first used to generate the code values
|
||||
; without bit reversal.
|
||||
zlib_debug 'gen_codes'
|
||||
mov ebx,ebp
|
||||
sub ebx,2*(MAX_BITS+1)
|
||||
|
||||
@ -912,7 +905,7 @@ endl
|
||||
inc dword[edi+deflate_state.heap_len]
|
||||
mov eax,[edi+deflate_state.heap_len]
|
||||
mov [max_code],ecx
|
||||
mov [edi+deflate_state.heap+2*eax],cx
|
||||
mov dword[edi+deflate_state.heap+4*eax],ecx
|
||||
mov byte[edi+deflate_state.depth+ecx],0
|
||||
jmp .end0
|
||||
align 4
|
||||
@ -941,7 +934,7 @@ align 4
|
||||
mov eax,[max_code]
|
||||
@@:
|
||||
mov ecx,[edi+deflate_state.heap_len]
|
||||
mov [edi+deflate_state.heap+2*ecx],ax
|
||||
mov [edi+deflate_state.heap+4*ecx],eax
|
||||
mov [node],eax
|
||||
imul eax,sizeof.ct_data
|
||||
add eax,[tree]
|
||||
@ -989,10 +982,10 @@ align 4
|
||||
|
||||
mov eax,[edi+deflate_state.heap_max]
|
||||
dec eax
|
||||
mov [edi+deflate_state.heap+2*eax],cx ;keep the nodes sorted by frequency
|
||||
mov [edi+deflate_state.heap+4*eax],ecx ;keep the nodes sorted by frequency
|
||||
dec eax
|
||||
mov [edi+deflate_state.heap_max],eax
|
||||
mov [edi+deflate_state.heap+2*eax],dx
|
||||
mov [edi+deflate_state.heap+4*eax],edx
|
||||
|
||||
; Create a new node father of n and m
|
||||
;;mov edx,[m]
|
||||
@ -1040,16 +1033,16 @@ align 4
|
||||
;end if
|
||||
; and insert the new node in the heap
|
||||
mov ecx,[node]
|
||||
mov [edi+deflate_state.heap+2*SMALLEST],cx
|
||||
mov [edi+deflate_state.heap+4*SMALLEST],ecx
|
||||
inc dword[node]
|
||||
stdcall pqdownheap, edi, [tree], SMALLEST
|
||||
cmp dword[edi+deflate_state.heap_len],2
|
||||
jge .cycle3 ;while (..>=..)
|
||||
|
||||
mov cx,[edi+deflate_state.heap+2*SMALLEST]
|
||||
mov ecx,[edi+deflate_state.heap+4*SMALLEST]
|
||||
dec dword[edi+deflate_state.heap_max]
|
||||
mov eax,[edi+deflate_state.heap_max]
|
||||
mov [edi+deflate_state.heap+2*eax],cx
|
||||
mov [edi+deflate_state.heap+4*eax],ecx
|
||||
|
||||
; At this point, the fields freq and dad are set. We can now
|
||||
; generate the bit lengths.
|
||||
@ -1083,7 +1076,6 @@ locals
|
||||
min_count dd 4 ;int ;min repeat count
|
||||
endl
|
||||
mov edi,[s]
|
||||
zlib_debug 'scan_tree'
|
||||
mov eax,[tree]
|
||||
movzx eax,word[eax+Len]
|
||||
mov [nextlen],eax
|
||||
@ -1204,7 +1196,6 @@ locals
|
||||
min_count dd 4 ;int ;min repeat count
|
||||
endl
|
||||
mov edi,[s]
|
||||
zlib_debug 'send_tree'
|
||||
; *** tree[max_code+1].Len = -1 ;guard already set
|
||||
mov eax,[tree]
|
||||
movzx eax,word[eax+Len]
|
||||
@ -1214,7 +1205,6 @@ endl
|
||||
jnz .cycle0 ;if (..==0)
|
||||
mov dword[max_count],138
|
||||
mov dword[min_count],3
|
||||
|
||||
align 4
|
||||
.cycle0: ;for (..;..<=..;..)
|
||||
cmp ecx,[max_code]
|
||||
@ -1322,8 +1312,7 @@ endp
|
||||
; Construct the Huffman tree for the bit lengths and return the index in
|
||||
; bl_order of the last bit length code to send.
|
||||
|
||||
;int (s)
|
||||
; deflate_state* s
|
||||
;int (deflate_state* s)
|
||||
align 4
|
||||
proc build_bl_tree uses edi, s:dword
|
||||
locals
|
||||
@ -1385,7 +1374,6 @@ endp
|
||||
align 4
|
||||
proc send_all_trees uses eax ebx ecx edi, s:dword, lcodes:dword, dcodes:dword, blcodes:dword
|
||||
;ecx = index in bl_order
|
||||
zlib_debug 'send_all_trees'
|
||||
cmp dword[lcodes],257
|
||||
jl @f
|
||||
cmp dword[dcodes],1
|
||||
@ -1479,20 +1467,20 @@ endp
|
||||
; ===========================================================================
|
||||
; Flush the bits in the bit buffer to pending output (leaves at most 7 bits)
|
||||
|
||||
;void (s)
|
||||
; deflate_state* s
|
||||
align 4
|
||||
proc _tr_flush_bits, s:dword
|
||||
stdcall bi_flush, [s]
|
||||
ret
|
||||
endp
|
||||
;void (deflate_state* s)
|
||||
;align 4
|
||||
;proc _tr_flush_bits, s:dword
|
||||
; stdcall bi_flush, [s]
|
||||
; ret
|
||||
;endp
|
||||
|
||||
_tr_flush_bits equ bi_flush
|
||||
|
||||
; ===========================================================================
|
||||
; Send one empty static block to give enough lookahead for inflate.
|
||||
; This takes 10 bits, of which 7 may remain in the bit buffer.
|
||||
|
||||
;void (s)
|
||||
; deflate_state* s
|
||||
;void (deflate_state* s)
|
||||
align 4
|
||||
proc _tr_align uses edi, s:dword
|
||||
mov edi,[s]
|
||||
@ -1523,7 +1511,6 @@ locals
|
||||
endl
|
||||
; Build the Huffman trees unless a stored block is forced
|
||||
mov edi,[s]
|
||||
zlib_debug '_tr_flush_block'
|
||||
cmp word[edi+deflate_state.level],0
|
||||
jle .end0 ;if (..>0)
|
||||
|
||||
@ -1728,10 +1715,9 @@ if TRUNCATE_BLOCK eq 1
|
||||
; Try to guess if it is profitable to stop the current block here
|
||||
mov eax,[edi+deflate_state.last_lit]
|
||||
and eax,0x1fff
|
||||
cmp eax,0
|
||||
jne .end1
|
||||
jnz .end1
|
||||
cmp word[edi+deflate_state.level],2
|
||||
jle .end1 ;if (..==.. && ..>..)
|
||||
jle .end1 ;if (..==0 && ..>..)
|
||||
; Compute an upper bound for the compressed length
|
||||
; ulg out_length = (ulg)s->last_lit*8L;
|
||||
; ulg in_length = (ulg)((long)s->strstart - s->block_start);
|
||||
@ -1775,7 +1761,6 @@ locals
|
||||
lc dd ? ;int ;match length or unmatched char (if dist == 0)
|
||||
lx dd 0 ;unsigned ;running index in l_buf
|
||||
u_code dd ? ;unsigned ;the code to send
|
||||
extra dd ? ;int ;number of extra bits to send
|
||||
endl
|
||||
mov edi,[s]
|
||||
cmp dword[edi+deflate_state.last_lit],0
|
||||
@ -1805,18 +1790,14 @@ endl
|
||||
add eax,LITERALS+1
|
||||
send_code edi, eax, [ltree] ;send the length code
|
||||
mov eax,[u_code]
|
||||
shl eax,2
|
||||
add eax,extra_lbits
|
||||
mov eax,[eax]
|
||||
mov [extra],eax
|
||||
cmp eax,0
|
||||
je @f ;if (..!=0)
|
||||
mov eax,[4*eax+extra_lbits]
|
||||
test eax,eax
|
||||
jz @f ;if (..!=0)
|
||||
push eax ;extra
|
||||
mov eax,[u_code]
|
||||
shl eax,2
|
||||
add eax,base_length
|
||||
mov eax,[eax]
|
||||
mov eax,[4*eax+base_length]
|
||||
sub [lc],eax
|
||||
stdcall send_bits, edi, [lc], [extra] ;send the extra length bits
|
||||
stdcall send_bits, edi, [lc] ;, ... ;send the extra length bits
|
||||
@@:
|
||||
dec dword[dist] ;dist is now the match distance - 1
|
||||
d_code [dist]
|
||||
@ -1827,18 +1808,14 @@ endl
|
||||
@@:
|
||||
send_code edi, [u_code], [dtree] ;send the distance code
|
||||
mov eax,[u_code]
|
||||
shl eax,2
|
||||
add eax,extra_dbits
|
||||
mov eax,[eax]
|
||||
mov [extra],eax
|
||||
cmp eax,0
|
||||
je .end1 ;if (..!=0)
|
||||
mov eax,[4*eax+extra_dbits]
|
||||
test eax,eax
|
||||
jz .end1 ;if (..!=0)
|
||||
push eax ;extra
|
||||
mov eax,[u_code]
|
||||
shl eax,2
|
||||
add eax,base_dist
|
||||
mov eax,[eax]
|
||||
mov eax,[4*eax+base_dist]
|
||||
sub [dist],eax
|
||||
stdcall send_bits, edi, [dist], [extra] ;send the extra distance bits
|
||||
stdcall send_bits, edi, [dist] ;, ... ;send the extra distance bits
|
||||
.end1: ;literal or match pair ?
|
||||
|
||||
; Check that the overlay between pending_buf and d_buf+l_buf is ok:
|
||||
@ -1954,7 +1931,6 @@ endp
|
||||
; int len ;its bit length
|
||||
align 4
|
||||
proc bi_reverse uses ebx, p1code:dword, len:dword
|
||||
zlib_debug 'bi_reverse'
|
||||
xor eax,eax
|
||||
@@: ;do
|
||||
mov ebx,[p1code]
|
||||
@ -1998,8 +1974,7 @@ endp
|
||||
; ===========================================================================
|
||||
; Flush the bit buffer and align the output on a byte boundary
|
||||
|
||||
;void (s)
|
||||
; deflate_state* s
|
||||
;void (deflate_state* s)
|
||||
align 4
|
||||
proc bi_windup uses eax ecx edi, s:dword
|
||||
mov edi,[s]
|
||||
|
@ -26,6 +26,7 @@ macro zlib_assert fmt,p1
|
||||
{
|
||||
local .end_t
|
||||
local .m_fmt
|
||||
pushf
|
||||
jmp .end_t
|
||||
.m_fmt db fmt,13,10,0
|
||||
align 4
|
||||
@ -35,6 +36,7 @@ if p1 eq
|
||||
else
|
||||
stdcall str_format_dbg, buf_param,.m_fmt,p1
|
||||
end if
|
||||
popf
|
||||
}
|
||||
|
||||
include 'zlib.inc'
|
||||
|
@ -137,14 +137,23 @@ endp
|
||||
align 4
|
||||
proc zmemcpy uses ecx edi esi, dest:dword, source:dword, len:dword
|
||||
mov ecx,[len]
|
||||
cmp ecx,0
|
||||
jle @f
|
||||
test ecx,ecx
|
||||
jz .end0
|
||||
mov edi,[dest]
|
||||
mov esi,[source]
|
||||
bt ecx,0 ;multiple of 2 ?
|
||||
jnc @f
|
||||
rep movsb
|
||||
jmp .end0
|
||||
@@:
|
||||
zlib_debug 'zmemcpy size = %d',ecx
|
||||
bt ecx,1 ;multiple of 4 ?
|
||||
jnc @f
|
||||
shr ecx,1
|
||||
rep movsw
|
||||
jmp .end0
|
||||
@@:
|
||||
shr ecx,2
|
||||
rep movsd
|
||||
.end0:
|
||||
ret
|
||||
endp
|
||||
|
Loading…
Reference in New Issue
Block a user