| ;/* inffas32.asm is a hand tuned assembler version of inffast.c -- fast decoding |
| ; * |
| ; * inffas32.asm is derived from inffas86.c, with translation of assembly code |
| ; * |
| ; * Copyright (C) 1995-2003 Mark Adler |
| ; * For conditions of distribution and use, see copyright notice in zlib.h |
| ; * |
| ; * Copyright (C) 2003 Chris Anderson <christop@charm.net> |
| ; * Please use the copyright conditions above. |
| ; * |
| ; * Mar-13-2003 -- Most of this is derived from inffast.S which is derived from |
| ; * the gcc -S output of zlib-1.2.0/inffast.c. Zlib-1.2.0 is in beta release at |
| ; * the moment. I have successfully compiled and tested this code with gcc2.96, |
| ; * gcc3.2, icc5.0, msvc6.0. It is very close to the speed of inffast.S |
| ; * compiled with gcc -DNO_MMX, but inffast.S is still faster on the P3 with MMX |
| ; * enabled. I will attempt to merge the MMX code into this version. Newer |
| ; * versions of this and inffast.S can be found at |
| ; * http://www.eetbeetee.com/zlib/ and http://www.charm.net/~christop/zlib/ |
| ; * |
| ; * 2005 : modification by Gilles Vollant |
| ; */ |
| ; For Visual C++ 4.x and higher and ML 6.x and higher |
| ; ml.exe is in directory \MASM611C of Win95 DDK |
| ; ml.exe is also distributed in http://www.masm32.com/masmdl.htm |
| ; and in VC++2003 toolkit at http://msdn.microsoft.com/visualc/vctoolkit2003/ |
| ; |
| ; |
| ; compile with command line option |
| ; ml /coff /Zi /c /Flinffas32.lst inffas32.asm |
| |
| ; if you define NO_GUNZIP (see inflate.h), compile with |
| ; ml /coff /Zi /c /Flinffas32.lst /DNO_GUNZIP inffas32.asm |
| |
| |
| ; zlib1222sup is 0 for zlib 1.2.2.1 and lower |
| ; zlib1222sup is 8 for zlib 1.2.2.2 and higher (with addition of dmax and head |
| ; in inflate_state in inflate.h) |
| ; Extra bytes added to the inflate_state field offsets defined further down. |
| zlib1222sup equ 8 |
| |
| ; Values stored into state->mode by _inflate_fast. |
| ; The gzip-enabled pair (11/26) is selected when GUNZIP is defined or when |
| ; NO_GUNZIP is not defined; otherwise the no-gzip pair (3/17) is used. |
| ; NOTE(review): these numbers must match the inflate_mode enum of the zlib |
| ; version being built -- confirm against inflate.h. |
| IFDEF GUNZIP |
| INFLATE_MODE_TYPE equ 11 |
| INFLATE_MODE_BAD equ 26 |
| ELSEIFNDEF NO_GUNZIP |
| INFLATE_MODE_TYPE equ 11 |
| INFLATE_MODE_BAD equ 26 |
| ELSE |
| INFLATE_MODE_TYPE equ 3 |
| INFLATE_MODE_BAD equ 17 |
| ENDIF |
| |
| |
| ; 75 "inffast.S" |
| ;FILE "inffast.S" |
| |
| ;;;GLOBAL _inflate_fast |
| |
| ;;;SECTION .text |
| |
| |
| |
| ; Enable the Pentium (privileged) instruction set and the MMX instructions; |
| ; the routine below uses cpuid, emms, movd/movq and other MMX opcodes. |
| .586p |
| .mmx |
| |
| name inflate_fast_x86 |
| .MODEL FLAT |
| |
| ; Writable flag consulted and updated by _inflate_fast: |
| ;   initial value 1 -> the CPU has not been probed yet |
| ;   2               -> use the MMX decoding loop |
| ;   3               -> use the integer decoding loop |
| ; NOTE(review): _DATA is not closed with "ends" before _TEXT is opened, so |
| ; _TEXT is nested inside it -- confirm this is intended. |
| _DATA segment |
| inflate_fast_use_mmx: |
| dd 1 |
| |
| |
| _TEXT segment |
| |
| |
| |
| ALIGN 4 |
| ; Unlabeled, zero-terminated banner string embedded in the code segment. |
| db 'Fast decoding Code from Chris Anderson', 0 |
| |
| ; Zero-terminated error messages; _inflate_fast stores the address of one of |
| ; these into the stream structure (offset 24) when it flags bad input. |
| ALIGN 4 |
| invalid_literal_length_code_msg: |
| db 'invalid literal/length code', 0 |
| |
| ALIGN 4 |
| invalid_distance_code_msg: |
| db 'invalid distance code', 0 |
| |
| ALIGN 4 |
| invalid_distance_too_far_msg: |
| db 'invalid distance too far back', 0 |
| |
| |
| ALIGN 4 |
| ; inflate_fast_mask[n] = (1 SHL n) - 1 for n = 0..32 (33 dwords). |
| ; Indexed as [inflate_fast_mask+eax*4] by the MMX loop to keep the low n bits. |
| inflate_fast_mask: |
| dd 000000000h, 000000001h, 000000003h, 000000007h |
| dd 00000000Fh, 00000001Fh, 00000003Fh, 00000007Fh |
| dd 0000000FFh, 0000001FFh, 0000003FFh, 0000007FFh |
| dd 000000FFFh, 000001FFFh, 000003FFFh, 000007FFFh |
| dd 00000FFFFh, 00001FFFFh, 00003FFFFh, 00007FFFFh |
| dd 0000FFFFFh, 0001FFFFFh, 0003FFFFFh, 0007FFFFFh |
| dd 000FFFFFFh, 001FFFFFFh, 003FFFFFFh, 007FFFFFFh |
| dd 00FFFFFFFh, 01FFFFFFFh, 03FFFFFFFh, 07FFFFFFFh |
| dd 0FFFFFFFFh |
| |
| |
| ; Byte offsets of the inflate_state fields accessed by _inflate_fast. |
| ; Every offset except mode_state is shifted by zlib1222sup. |
| mode_state equ 0 ;/* state->mode */ |
| wsize_state equ (zlib1222sup+32) ;/* state->wsize */ |
| write_state equ (zlib1222sup+40) ;/* state->write */ |
| window_state equ (zlib1222sup+44) ;/* state->window */ |
| hold_state equ (zlib1222sup+48) ;/* state->hold */ |
| bits_state equ (zlib1222sup+52) ;/* state->bits */ |
| lencode_state equ (zlib1222sup+68) ;/* state->lencode */ |
| distcode_state equ (zlib1222sup+72) ;/* state->distcode */ |
| lenbits_state equ (zlib1222sup+76) ;/* state->lenbits */ |
| distbits_state equ (zlib1222sup+80) ;/* state->distbits */ |
| |
| |
| ;;SECTION .text |
| ; 205 "inffast.S" |
| ;GLOBAL inflate_fast_use_mmx |
| |
| ;SECTION .data |
| |
| |
| ; GLOBAL inflate_fast_use_mmx:object |
| ;.size inflate_fast_use_mmx, 4 |
| ; 226 "inffast.S" |
| ;SECTION .text |
| |
| ALIGN 4 |
| ;---------------------------------------------------------------------- |
| ; _inflate_fast(strm, start) |
| ; |
| ; Fast inner decoding loop: decodes literal/length and distance codes and |
| ; copies matches until an end-of-block code or invalid data is found, or |
| ; until input or output space runs low. |
| ; |
| ; Arguments are read from the stack and the routine ends with a plain ret: |
| ;   first argument  = strm  (pointer to the stream structure) |
| ;   second argument = start |
| ; NOTE(review): the stream structure is accessed with hard-coded offsets |
| ; (0 next_in, 4 avail_in, 12 next_out, 16 avail_out, 24 msg, 28 state); the |
| ; field names are assumed from zlib.h -- confirm for the zlib version in use. |
| ; |
| ; edi, esi, ebp, ebx and EFLAGS are saved on entry and restored on exit. |
| ; |
| ; Stack frame after the prologue (esp-relative): |
| ;   [esp+0]   lmask   = (1 SHL state->lenbits) - 1 |
| ;   [esp+4]   dmask   = (1 SHL state->distbits) - 1 |
| ;   [esp+8]   lcode   = state->lencode |
| ;   [esp+12]  dcode   = state->distcode |
| ;   [esp+16]  end     = next_out + avail_out - 257 |
| ;   [esp+20]  last    = next_in + avail_in - 11 |
| ;   [esp+24]  len     (integer loop only) |
| ;   [esp+28]  buf     12-byte local copy of the input tail |
| ;   [esp+40]  beg     = next_out - (start - avail_out) |
| ;   [esp+44]  in      saved input pointer |
| ;   [esp+48]  write   = state->write |
| ;   [esp+52]  wsize   = state->wsize |
| ;   [esp+56]  window  = state->window |
| ;   [esp+60]  out     = next_out |
| ;   [esp+88]  strm,  [esp+92] start |
| ; |
| ; Register roles, integer loop: esi = in, edi = out, ebp = hold, bl = bits. |
| ; Register roles, MMX loop: esi = in, edi = out, mm0 = hold, ebp = bits, |
| ;   mm1 = number of bits still to be shifted out of mm0, ebx = lcode (or the |
| ;   distance while a match is processed), edx = len, |
| ;   mm3/mm4 = lmask, mm2/mm5 = dmask. |
| ; |
| ; Table entries are dwords: al = op, ah = bits used by the code, and the |
| ; upper 16 bits = value. |
| ;---------------------------------------------------------------------- |
| _inflate_fast proc near |
| .FPO (16, 4, 0, 0, 1, 0) |
| push edi |
| push esi |
| push ebp |
| push ebx |
| pushfd |
| sub esp,64 |
| ; string instructions below must run forward |
| cld |
| |
| ; esi = strm, edi = strm->state |
| mov esi, [esp+88] |
| mov edi, [esi+28] |
| |
| ; in = next_in, last = next_in + avail_in - 11 |
| mov edx, [esi+4] |
| mov eax, [esi+0] |
| |
| add edx,eax |
| sub edx,11 |
| |
| mov [esp+44],eax |
| mov [esp+20],edx |
| |
| ; beg = next_out - (start - avail_out), end = next_out + avail_out - 257 |
| mov ebp, [esp+92] |
| mov ecx, [esi+16] |
| mov ebx, [esi+12] |
| |
| sub ebp,ecx |
| neg ebp |
| add ebp,ebx |
| |
| sub ecx,257 |
| add ecx,ebx |
| |
| mov [esp+60],ebx |
| mov [esp+40],ebp |
| mov [esp+16],ecx |
| ; 285 "inffast.S" |
| ; cache the table pointers and build the index masks |
| mov eax, [edi+lencode_state] |
| mov ecx, [edi+distcode_state] |
| |
| mov [esp+8],eax |
| mov [esp+12],ecx |
| |
| mov eax,1 |
| mov ecx, [edi+lenbits_state] |
| shl eax,cl |
| dec eax |
| mov [esp+0],eax |
| |
| mov eax,1 |
| mov ecx, [edi+distbits_state] |
| shl eax,cl |
| dec eax |
| mov [esp+4],eax |
| |
| mov eax, [edi+wsize_state] |
| mov ecx, [edi+write_state] |
| mov edx, [edi+window_state] |
| |
| mov [esp+52],eax |
| mov [esp+48],ecx |
| mov [esp+56],edx |
| |
| ; ebp = hold, ebx = bits |
| mov ebp, [edi+hold_state] |
| mov ebx, [edi+bits_state] |
| ; 321 "inffast.S" |
| mov esi, [esp+44] |
| mov ecx, [esp+20] |
| cmp ecx,esi |
| ja L_align_long |
| |
| ; last <= in: copy the remaining input (ecx = last + 11 - in bytes) into |
| ; the 12-byte local buffer, zero-fill the rest, and decode from there. |
| ; last is set to the buffer start, so the loop test fails after one pass. |
| add ecx,11 |
| sub ecx,esi |
| mov eax,12 |
| sub eax,ecx |
| lea edi, [esp+28] |
| rep movsb |
| mov ecx,eax |
| xor eax,eax |
| rep stosb |
| lea esi, [esp+28] |
| mov [esp+20],esi |
| jmp L_is_aligned |
| |
| ; Feed single bytes into hold until the input pointer is 4-byte aligned. |
| L_align_long: |
| test esi,3 |
| jz L_is_aligned |
| xor eax,eax |
| mov al, [esi] |
| inc esi |
| mov ecx,ebx |
| add ebx,8 |
| shl eax,cl |
| or ebp,eax |
| jmp L_align_long |
| |
| L_is_aligned: |
| mov edi, [esp+60] |
| ; 366 "inffast.S" |
| ; Dispatch on inflate_fast_use_mmx: 2 -> MMX loop, above 2 -> integer loop, |
| ; anything lower -> probe the CPU first and then re-dispatch. |
| L_check_mmx: |
| cmp dword ptr [inflate_fast_use_mmx],2 |
| je L_init_mmx |
| ja L_do_loop |
| |
| push eax |
| push ebx |
| push ecx |
| push edx |
| ; Try to toggle EFLAGS bit 21 (0200000h); if it does not change, cpuid is |
| ; treated as unavailable and MMX is not used. |
| pushfd |
| mov eax, [esp] |
| xor dword ptr [esp],0200000h |
| popfd |
| pushfd |
| pop edx |
| xor edx,eax |
| jz L_dont_use_mmx |
| ; cpuid leaf 0: require the vendor id "Genu" / "ntel" / "ineI" |
| xor eax,eax |
| cpuid |
| cmp ebx,0756e6547h |
| jne L_dont_use_mmx |
| cmp ecx,06c65746eh |
| jne L_dont_use_mmx |
| cmp edx,049656e69h |
| jne L_dont_use_mmx |
| ; cpuid leaf 1: require bits 8..11 of eax (family) == 6 and edx bit 23 set |
| mov eax,1 |
| cpuid |
| shr eax,8 |
| and eax,15 |
| cmp eax,6 |
| jne L_dont_use_mmx |
| test edx,0800000h |
| jnz L_use_mmx |
| jmp L_dont_use_mmx |
| L_use_mmx: |
| mov dword ptr [inflate_fast_use_mmx],2 |
| jmp L_check_mmx_pop |
| L_dont_use_mmx: |
| mov dword ptr [inflate_fast_use_mmx],3 |
| L_check_mmx_pop: |
| pop edx |
| pop ecx |
| pop ebx |
| pop eax |
| jmp L_check_mmx |
| ; 426 "inffast.S" |
| ;---------------------------------------------------------------------- |
| ; Integer decoding loop |
| ;---------------------------------------------------------------------- |
| ALIGN 4 |
| L_do_loop: |
| ; 437 "inffast.S" |
| ; refill: with 15 or fewer bits in hold, append 16 input bits |
| cmp bl,15 |
| ja L_get_length_code |
| |
| xor eax,eax |
| lodsw |
| mov cl,bl |
| add bl,16 |
| shl eax,cl |
| or ebp,eax |
| |
| L_get_length_code: |
| ; eax = lcode[hold & lmask] |
| mov edx, [esp+0] |
| mov ecx, [esp+8] |
| and edx,ebp |
| mov eax, [ecx+edx*4] |
| |
| L_dolen: |
| ; consume the code bits (ah) from hold |
| mov cl,ah |
| sub bl,ah |
| shr ebp,cl |
| |
| ; op == 0: literal -- store the low byte of the value |
| test al,al |
| jnz L_test_for_length_base |
| |
| shr eax,16 |
| stosb |
| |
| L_while_test: |
| ; continue while out < end and in < last |
| cmp [esp+16],edi |
| jbe L_break_loop |
| |
| cmp [esp+20],esi |
| ja L_do_loop |
| jmp L_break_loop |
| |
| L_test_for_length_base: |
| ; 502 "inffast.S" |
| ; edx = value, cl = op |
| mov edx,eax |
| shr edx,16 |
| mov cl,al |
| |
| ; op bit 16 set: edx is a length base, low 4 bits of op = extra bit count |
| test al,16 |
| jz L_test_for_second_level_length |
| and cl,15 |
| jz L_save_len |
| cmp bl,cl |
| jae L_add_bits_to_len |
| |
| ; not enough bits for the extra field: append 16 more (cl preserved in ch) |
| mov ch,cl |
| xor eax,eax |
| lodsw |
| mov cl,bl |
| add bl,16 |
| shl eax,cl |
| or ebp,eax |
| mov cl,ch |
| |
| L_add_bits_to_len: |
| ; len = base + (hold & ((1 SHL cl) - 1)), then drop those bits |
| mov eax,1 |
| shl eax,cl |
| dec eax |
| sub bl,cl |
| and eax,ebp |
| shr ebp,cl |
| add edx,eax |
| |
| L_save_len: |
| mov [esp+24],edx |
| |
| L_decode_distance: |
| ; 549 "inffast.S" |
| cmp bl,15 |
| ja L_get_distance_code |
| |
| xor eax,eax |
| lodsw |
| mov cl,bl |
| add bl,16 |
| shl eax,cl |
| or ebp,eax |
| |
| L_get_distance_code: |
| ; eax = dcode[hold & dmask] |
| mov edx, [esp+4] |
| mov ecx, [esp+12] |
| and edx,ebp |
| mov eax, [ecx+edx*4] |
| |
| L_dodist: |
| ; edx = value (distance base); consume the code bits |
| mov edx,eax |
| shr edx,16 |
| mov cl,ah |
| sub bl,ah |
| shr ebp,cl |
| ; 584 "inffast.S" |
| mov cl,al |
| |
| test al,16 |
| jz L_test_for_second_level_dist |
| and cl,15 |
| jz L_check_dist_one |
| cmp bl,cl |
| jae L_add_bits_to_dist |
| |
| mov ch,cl |
| xor eax,eax |
| lodsw |
| mov cl,bl |
| add bl,16 |
| shl eax,cl |
| or ebp,eax |
| mov cl,ch |
| |
| L_add_bits_to_dist: |
| ; dist = base + extra bits; falls through into L_check_window |
| mov eax,1 |
| shl eax,cl |
| dec eax |
| sub bl,cl |
| and eax,ebp |
| shr ebp,cl |
| add edx,eax |
| |
| L_check_window: |
| ; 625 "inffast.S" |
| ; save in; eax = out - beg; if dist exceeds it the source lies in the window |
| mov [esp+44],esi |
| mov eax,edi |
| sub eax, [esp+40] |
| |
| cmp eax,edx |
| jb L_clip_window |
| |
| ; copy from out - dist: three bytes unconditionally, then len - 3 more |
| mov ecx, [esp+24] |
| mov esi,edi |
| sub esi,edx |
| |
| sub ecx,3 |
| mov al, [esi] |
| mov [edi],al |
| mov al, [esi+1] |
| mov dl, [esi+2] |
| add esi,3 |
| mov [edi+1],al |
| mov [edi+2],dl |
| add edi,3 |
| rep movsb |
| |
| mov esi, [esp+44] |
| jmp L_while_test |
| |
| ALIGN 4 |
| L_check_dist_one: |
| ; no extra distance bits: if dist == 1 and out != beg, replicate the |
| ; previous output byte len times with stosb instead of copying |
| cmp edx,1 |
| jne L_check_window |
| cmp [esp+40],edi |
| je L_check_window |
| |
| dec edi |
| mov ecx, [esp+24] |
| mov al, [edi] |
| sub ecx,3 |
| |
| mov [edi+1],al |
| mov [edi+2],al |
| mov [edi+3],al |
| add edi,4 |
| rep stosb |
| |
| jmp L_while_test |
| |
| ALIGN 4 |
| L_test_for_second_level_length: |
| ; op bit 64 set: end of block or invalid code; otherwise follow the link |
| ; to a second-level entry: lcode[value + (hold & ((1 SHL op) - 1))] |
| test al,64 |
| jnz L_test_for_end_of_block |
| |
| mov eax,1 |
| shl eax,cl |
| dec eax |
| and eax,ebp |
| add eax,edx |
| mov edx, [esp+8] |
| mov eax, [edx+eax*4] |
| jmp L_dolen |
| |
| ALIGN 4 |
| L_test_for_second_level_dist: |
| ; same as above for the distance table; bit 64 here is always an error |
| test al,64 |
| jnz L_invalid_distance_code |
| |
| mov eax,1 |
| shl eax,cl |
| dec eax |
| and eax,ebp |
| add eax,edx |
| mov edx, [esp+12] |
| mov eax, [edx+eax*4] |
| jmp L_dodist |
| |
| ALIGN 4 |
| L_clip_window: |
| ; 721 "inffast.S" |
| ; ecx = dist - (out - beg) = number of bytes that must come from the window |
| mov ecx,eax |
| mov eax, [esp+52] |
| neg ecx |
| mov esi, [esp+56] |
| |
| ; dist > wsize is reported as an error |
| cmp eax,edx |
| jb L_invalid_distance_too_far |
| |
| add ecx,edx |
| cmp dword ptr [esp+48],0 |
| jne L_wrap_around_window |
| |
| ; write == 0: source = window + wsize - ecx |
| sub eax,ecx |
| add esi,eax |
| ; 749 "inffast.S" |
| ; if len <= ecx everything comes from the window; otherwise copy ecx bytes |
| ; from the window and the remaining len - ecx from out - dist |
| mov eax, [esp+24] |
| cmp eax,ecx |
| jbe L_do_copy1 |
| |
| sub eax,ecx |
| rep movsb |
| mov esi,edi |
| sub esi,edx |
| jmp L_do_copy1 |
| |
| L_wrap_around_window: |
| ; 793 "inffast.S" |
| ; write != 0: if ecx <= write the source is one contiguous run |
| mov eax, [esp+48] |
| cmp ecx,eax |
| jbe L_contiguous_in_window |
| |
| ; source starts at window + wsize + write - ecx; ecx - write bytes are |
| ; available there before wrapping to the start of the window |
| add esi, [esp+52] |
| add esi,eax |
| sub esi,ecx |
| sub ecx,eax |
| |
| mov eax, [esp+24] |
| cmp eax,ecx |
| jbe L_do_copy1 |
| |
| sub eax,ecx |
| rep movsb |
| ; continue from the start of the window for up to write bytes |
| mov esi, [esp+56] |
| mov ecx, [esp+48] |
| cmp eax,ecx |
| jbe L_do_copy1 |
| |
| sub eax,ecx |
| rep movsb |
| mov esi,edi |
| sub esi,edx |
| jmp L_do_copy1 |
| |
| L_contiguous_in_window: |
| ; 836 "inffast.S" |
| ; source = window + write - ecx |
| add esi,eax |
| sub esi,ecx |
| |
| mov eax, [esp+24] |
| cmp eax,ecx |
| jbe L_do_copy1 |
| |
| sub eax,ecx |
| rep movsb |
| mov esi,edi |
| sub esi,edx |
| |
| L_do_copy1: |
| ; 862 "inffast.S" |
| ; copy the remaining eax bytes, then restore the input pointer |
| mov ecx,eax |
| rep movsb |
| |
| mov esi, [esp+44] |
| jmp L_while_test |
| ; 878 "inffast.S" |
| ;---------------------------------------------------------------------- |
| ; MMX decoding loop |
| ;---------------------------------------------------------------------- |
| ALIGN 4 |
| L_init_mmx: |
| emms |
| |
| ; mm0 = hold, ebp = bits |
| movd mm0,ebp |
| mov ebp,ebx |
| ; 896 "inffast.S" |
| ; mm4 = mm3 = lmask, mm5 = mm2 = dmask, mm1 = 0, ebx = lcode |
| movd mm4,dword ptr [esp+0] |
| movq mm3,mm4 |
| movd mm5,dword ptr [esp+4] |
| movq mm2,mm5 |
| pxor mm1,mm1 |
| mov ebx, [esp+8] |
| jmp L_do_loop_mmx |
| |
| ALIGN 4 |
| L_do_loop_mmx: |
| ; drop the bits consumed by the previous code |
| psrlq mm0,mm1 |
| |
| ; refill: with 32 or fewer bits in hold, append 32 input bits |
| cmp ebp,32 |
| ja L_get_length_code_mmx |
| |
| movd mm6,ebp |
| movd mm7,dword ptr [esi] |
| add esi,4 |
| psllq mm7,mm6 |
| add ebp,32 |
| por mm0,mm7 |
| |
| L_get_length_code_mmx: |
| ; eax = lcode[hold & lmask]; mm4 is restored from mm3 afterwards |
| pand mm4,mm0 |
| movd eax,mm4 |
| movq mm4,mm3 |
| mov eax, [ebx+eax*4] |
| |
| L_dolen_mmx: |
| ; mm1 = code bits (shifted out of mm0 later), bits -= code bits |
| movzx ecx,ah |
| movd mm1,ecx |
| sub ebp,ecx |
| |
| test al,al |
| jnz L_test_for_length_base_mmx |
| |
| ; literal |
| shr eax,16 |
| stosb |
| |
| L_while_test_mmx: |
| ; continue while out < end and in < last |
| cmp [esp+16],edi |
| jbe L_break_loop |
| |
| cmp [esp+20],esi |
| ja L_do_loop_mmx |
| jmp L_break_loop |
| |
| L_test_for_length_base_mmx: |
| ; edx = value (length base) |
| mov edx,eax |
| shr edx,16 |
| |
| test al,16 |
| jz L_test_for_second_level_length_mmx |
| and eax,15 |
| jz L_decode_distance_mmx |
| |
| ; drop the code bits, then add the eax extra bits to the length |
| psrlq mm0,mm1 |
| movd mm1,eax |
| movd ecx,mm0 |
| sub ebp,eax |
| and ecx, [inflate_fast_mask+eax*4] |
| add edx,ecx |
| |
| L_decode_distance_mmx: |
| psrlq mm0,mm1 |
| |
| cmp ebp,32 |
| ja L_get_dist_code_mmx |
| |
| movd mm6,ebp |
| movd mm7,dword ptr [esi] |
| add esi,4 |
| psllq mm7,mm6 |
| add ebp,32 |
| por mm0,mm7 |
| |
| L_get_dist_code_mmx: |
| ; eax = dcode[hold & dmask]; mm5 is restored from mm2 afterwards |
| mov ebx, [esp+12] |
| pand mm5,mm0 |
| movd eax,mm5 |
| movq mm5,mm2 |
| mov eax, [ebx+eax*4] |
| |
| L_dodist_mmx: |
| ; ebx = value (distance base), mm1 = code bits |
| movzx ecx,ah |
| mov ebx,eax |
| shr ebx,16 |
| sub ebp,ecx |
| movd mm1,ecx |
| |
| test al,16 |
| jz L_test_for_second_level_dist_mmx |
| and eax,15 |
| jz L_check_dist_one_mmx |
| |
| L_add_bits_to_dist_mmx: |
| ; drop the code bits, then add the eax extra bits to the distance |
| psrlq mm0,mm1 |
| movd mm1,eax |
| movd ecx,mm0 |
| sub ebp,eax |
| and ecx, [inflate_fast_mask+eax*4] |
| add ebx,ecx |
| |
| L_check_window_mmx: |
| ; save in; eax = out - beg; if dist exceeds it the source lies in the window |
| mov [esp+44],esi |
| mov eax,edi |
| sub eax, [esp+40] |
| |
| cmp eax,ebx |
| jb L_clip_window_mmx |
| |
| ; copy from out - dist: three bytes unconditionally, then len - 3 more |
| mov ecx,edx |
| mov esi,edi |
| sub esi,ebx |
| |
| sub ecx,3 |
| mov al, [esi] |
| mov [edi],al |
| mov al, [esi+1] |
| mov dl, [esi+2] |
| add esi,3 |
| mov [edi+1],al |
| mov [edi+2],dl |
| add edi,3 |
| rep movsb |
| |
| ; restore in and the lcode pointer |
| mov esi, [esp+44] |
| mov ebx, [esp+8] |
| jmp L_while_test_mmx |
| |
| ALIGN 4 |
| L_check_dist_one_mmx: |
| ; dist == 1 and out != beg: replicate the previous output byte |
| cmp ebx,1 |
| jne L_check_window_mmx |
| cmp [esp+40],edi |
| je L_check_window_mmx |
| |
| dec edi |
| mov ecx,edx |
| mov al, [edi] |
| sub ecx,3 |
| |
| mov [edi+1],al |
| mov [edi+2],al |
| mov [edi+3],al |
| add edi,4 |
| rep stosb |
| |
| mov ebx, [esp+8] |
| jmp L_while_test_mmx |
| |
| ALIGN 4 |
| L_test_for_second_level_length_mmx: |
| ; bit 64: end of block or invalid; otherwise second-level lookup in lcode |
| test al,64 |
| jnz L_test_for_end_of_block |
| |
| and eax,15 |
| psrlq mm0,mm1 |
| movd ecx,mm0 |
| and ecx, [inflate_fast_mask+eax*4] |
| add ecx,edx |
| mov eax, [ebx+ecx*4] |
| jmp L_dolen_mmx |
| |
| ALIGN 4 |
| L_test_for_second_level_dist_mmx: |
| ; bit 64: invalid distance code; otherwise second-level lookup in dcode |
| test al,64 |
| jnz L_invalid_distance_code |
| |
| and eax,15 |
| psrlq mm0,mm1 |
| movd ecx,mm0 |
| and ecx, [inflate_fast_mask+eax*4] |
| mov eax, [esp+12] |
| add ecx,ebx |
| mov eax, [eax+ecx*4] |
| jmp L_dodist_mmx |
| |
| ALIGN 4 |
| L_clip_window_mmx: |
| ; ecx = dist - (out - beg) = number of bytes that must come from the window |
| mov ecx,eax |
| mov eax, [esp+52] |
| neg ecx |
| mov esi, [esp+56] |
| |
| ; dist > wsize is reported as an error |
| cmp eax,ebx |
| jb L_invalid_distance_too_far |
| |
| add ecx,ebx |
| cmp dword ptr [esp+48],0 |
| jne L_wrap_around_window_mmx |
| |
| ; write == 0: source = window + wsize - ecx |
| sub eax,ecx |
| add esi,eax |
| |
| cmp edx,ecx |
| jbe L_do_copy1_mmx |
| |
| sub edx,ecx |
| rep movsb |
| mov esi,edi |
| sub esi,ebx |
| jmp L_do_copy1_mmx |
| |
| L_wrap_around_window_mmx: |
| ; write != 0: if ecx <= write the source is one contiguous run |
| mov eax, [esp+48] |
| cmp ecx,eax |
| jbe L_contiguous_in_window_mmx |
| |
| ; source starts at window + wsize + write - ecx |
| add esi, [esp+52] |
| add esi,eax |
| sub esi,ecx |
| sub ecx,eax |
| |
| cmp edx,ecx |
| jbe L_do_copy1_mmx |
| |
| sub edx,ecx |
| rep movsb |
| ; continue from the start of the window for up to write bytes |
| mov esi, [esp+56] |
| mov ecx, [esp+48] |
| cmp edx,ecx |
| jbe L_do_copy1_mmx |
| |
| sub edx,ecx |
| rep movsb |
| mov esi,edi |
| sub esi,ebx |
| jmp L_do_copy1_mmx |
| |
| L_contiguous_in_window_mmx: |
| ; source = window + write - ecx |
| add esi,eax |
| sub esi,ecx |
| |
| cmp edx,ecx |
| jbe L_do_copy1_mmx |
| |
| sub edx,ecx |
| rep movsb |
| mov esi,edi |
| sub esi,ebx |
| |
| L_do_copy1_mmx: |
| ; copy the remaining edx bytes, then restore in and the lcode pointer |
| mov ecx,edx |
| rep movsb |
| |
| mov esi, [esp+44] |
| mov ebx, [esp+8] |
| jmp L_while_test_mmx |
| ; 1174 "inffast.S" |
| ;---------------------------------------------------------------------- |
| ; Exit paths shared by both loops. |
| ; ecx = message pointer (0 for none), edx = new state->mode |
| ;---------------------------------------------------------------------- |
| L_invalid_distance_code: |
| mov ecx, invalid_distance_code_msg |
| mov edx,INFLATE_MODE_BAD |
| jmp L_update_stream_state |
| |
| L_test_for_end_of_block: |
| ; op bit 32 set: end of block; otherwise the literal/length code is invalid |
| test al,32 |
| jz L_invalid_literal_length_code |
| |
| mov ecx,0 |
| mov edx,INFLATE_MODE_TYPE |
| jmp L_update_stream_state |
| |
| L_invalid_literal_length_code: |
| mov ecx, invalid_literal_length_code_msg |
| mov edx,INFLATE_MODE_BAD |
| jmp L_update_stream_state |
| |
| L_invalid_distance_too_far: |
| ; esi was used as the copy source; restore the saved input pointer |
| mov esi, [esp+44] |
| mov ecx, invalid_distance_too_far_msg |
| mov edx,INFLATE_MODE_BAD |
| |
| L_update_stream_state: |
| ; store the message at strm+24 (if any) and the new mode |
| mov eax, [esp+88] |
| test ecx,ecx |
| jz L_skip_msg |
| mov [eax+24],ecx |
| L_skip_msg: |
| mov eax, [eax+28] |
| mov [eax+mode_state],edx |
| jmp L_break_loop |
| |
| ALIGN 4 |
| L_break_loop: |
| ; 1243 "inffast.S" |
| ; the MMX loop keeps the bit count in ebp; move it to ebx |
| cmp dword ptr [inflate_fast_use_mmx],2 |
| jne L_update_next_in |
| |
| mov ebx,ebp |
| |
| L_update_next_in: |
| ; 1266 "inffast.S" |
| ; give back whole unused bytes: in -= bits SHR 3, bits = bits AND 7 |
| mov eax, [esp+88] |
| mov ecx,ebx |
| mov edx, [eax+28] |
| shr ecx,3 |
| sub esi,ecx |
| shl ecx,3 |
| sub ebx,ecx |
| mov [eax+12],edi |
| mov [edx+bits_state],ebx |
| mov ecx,ebx |
| |
| ; if decoding ran from the local buffer, translate in back into the |
| ; caller's input buffer and recompute last from the stream fields |
| lea ebx, [esp+28] |
| cmp [esp+20],ebx |
| jne L_buf_not_used |
| |
| sub esi,ebx |
| mov ebx, [eax+0] |
| mov [esp+20],ebx |
| add esi,ebx |
| mov ebx, [eax+4] |
| sub ebx,11 |
| add [esp+20],ebx |
| |
| L_buf_not_used: |
| mov [eax+0],esi |
| |
| ; ebx = (1 SHL bits) - 1 |
| mov ebx,1 |
| shl ebx,cl |
| dec ebx |
| |
| cmp dword ptr [inflate_fast_use_mmx],2 |
| jne L_update_hold |
| |
| ; MMX path: apply the pending shift and fetch the low 32 bits of hold |
| psrlq mm0,mm1 |
| movd ebp,mm0 |
| |
| emms |
| |
| L_update_hold: |
| ; state->hold = hold AND mask |
| and ebp,ebx |
| mov [edx+hold_state],ebp |
| |
| ; strm+4 (avail_in) = 11 + (last - in), computed without going negative |
| mov ebx, [esp+20] |
| cmp ebx,esi |
| jbe L_last_is_smaller |
| |
| sub ebx,esi |
| add ebx,11 |
| mov [eax+4],ebx |
| jmp L_fixup_out |
| L_last_is_smaller: |
| sub esi,ebx |
| neg esi |
| add esi,11 |
| mov [eax+4],esi |
| |
| L_fixup_out: |
| ; strm+16 (avail_out) = 257 + (end - out), computed the same way |
| mov ebx, [esp+16] |
| cmp ebx,edi |
| jbe L_end_is_smaller |
| |
| sub ebx,edi |
| add ebx,257 |
| mov [eax+16],ebx |
| jmp L_done |
| L_end_is_smaller: |
| sub edi,ebx |
| neg edi |
| add edi,257 |
| mov [eax+16],edi |
| |
| L_done: |
| ; release the frame and restore the saved flags and registers |
| add esp,64 |
| popfd |
| pop ebx |
| pop ebp |
| pop esi |
| pop edi |
| ret |
| _inflate_fast endp |
| |
| ; Close the code segment and end the module. |
| _TEXT ends |
| end |