wword.obj src added

git-svn-id: svn://kolibrios.org@2329 a494cfbc-eb01-0410-851d-a64ba20cac60
This commit is contained in:
Albom 2011-12-25 14:04:41 +00:00
parent 6bd8780b1a
commit bb704ae063
4 changed files with 266 additions and 0 deletions

View File

@ -0,0 +1,4 @@
del wword.obj
fasm wword.asm
kpack wword.obj
pause

View File

@ -0,0 +1,12 @@
wword.obj
==============
Извлечение текста из файлов MS Word 8.0 и 9.0.
Библиотека написана на основе программы doc2txt.
Автор doc2txt - Иван Рощин, http://www.ivr.da.ru
==============
Александр Богомаз aka Albom
albom85@yandex.ru
http://albom85.narod.ru

View File

@ -0,0 +1,241 @@
format MS COFF
public EXPORTS
section '.flat' code readable writable align 16
version:
mov eax, 10
ret
; int __stdcall convert (const char filename[], char buffer[], int mode)
convert:
mov eax, [esp+4]
mov dword [filename], eax
mov eax, [esp+8]
mov dword [buffer], eax
mov eax, [esp+12]
mov dword [mode], eax
pushad
mov eax, 68
mov ebx, 11
int 0x40
mov dword [file_in], 5
mov dword [file_in+4], 0
mov dword [file_in+8], 0
mov dword [file_in+12], 0
mov dword [file_in+16], bdvk
mov byte [file_in+20], 0
mov eax, [filename]
mov dword [file_in+21], eax
mov eax, 70
mov ebx, file_in
int 0x40
mov dword eax, [bdvk+32]
mov dword [buf_len], eax
mov eax, 68
mov ebx, 12
mov ecx, [buf_len]
int 0x40
mov [buf], eax
cmp eax, 0
jne _mem_ok
popad
mov eax, -1
ret 12
_mem_ok:
mov dword [file_in], 0
mov dword [file_in+4], 0x600
mov dword [file_in+8], 0
mov eax, [buf_len]
sub eax, 0x600
mov [buf_len], eax
mov dword [file_in+12], eax
mov eax, [buf]
mov dword [file_in+16], eax
mov byte [file_in+20], 0
mov eax, [filename]
mov dword [file_in+21], eax
mov eax, 70
mov ebx, file_in
int 0x40
call translate
mov eax, 68
mov ebx, 13
mov ecx, [buf]
int 0x40
popad
mov eax, [result]
ret 12
translate:
pushad
xor ebx, ebx
mov [result], 0
mov ecx, [buf] ; ¢å®¤­®© ¡ãä¥à
mov edx, [buffer] ; ¢ë室­®© ¡ãä¥à
_translate_loop:
cmp ebx, [buf_len]
je _translate_end
mov byte al, [ecx]
inc ecx
inc ebx
mov byte ah, [ecx]
cmp ah, 0
jne _translate_next1
cmp al, 0
je _translate_end
cmp al, 13
jne _translate_no13
mov byte [edx], 0x0d
inc edx
mov byte [edx], 0x0a
inc edx
mov byte [edx], 32
inc edx
mov byte [edx], 32
inc edx
mov byte [edx], 32
inc edx
mov al, 32
jmp _translate_copy
_translate_no13:
cmp al, 0x1f
jg _translate_eng_1
inc ecx
inc ebx
jmp _translate_loop
_translate_eng_1:
cmp al, 0x7f
jle _translate_eng_2
inc ecx
inc ebx
jmp _translate_loop
_translate_eng_2:
jmp _translate_copy
_translate_next1:
cmp ah, 4
jne _translate_next2
cmp al, 0x2f
jb _translate_rus_s
and eax, 0xff
add eax, rus_big
sub eax, 0x10
mov al, [eax]
jmp _translate_copy
_translate_rus_s:
and eax, 0xff
add eax, rus_small
sub eax, 0x30
mov al, [eax]
jmp _translate_copy
_translate_next2:
cmp ah, 0x20
jne _translate_next3
_translate_next3:
_translate_copy:
mov byte [edx], al
inc ecx
inc edx
inc ebx
inc [result]
jmp _translate_loop
_translate_end:
popad
ret
align 16
EXPORTS:
dd szVersion, version
dd szConvert, convert
dd 0, 0
szVersion db 'version',0
szConvert db 'convert',0
buf dd 0
buf_len dd 0
result dd 0
mode dd 0
buffer dd 0
filename dd 0
rus_big db '€<>ƒ„…†‡ˆ‰ŠŒ<E280B9>Ž<EFBFBD><C5BD>“”•˜™šœ<E280BA>žŸ'
rus_small db ' ¡¢£¤¥¦§¨©ª«¬­®¯àáâãäåæçèéêëìíîï'
section '.data' data readable writable align 16
file_in rd 1
rd 1
rd 1
rd 1
rd 1
rb 1
rd 1
bdvk rd 1
rb 1
rb 3
rb 4
rb 4
rb 4
rb 4
rb 4
rb 4
rd 1
rd 1

View File

@ -0,0 +1,9 @@
// Версия. 10 означает 0.1 (100 - 1.0, ...)
int version();
// filename - полный путь к доку
// buffer - буфер, должет быть не меньше размера дока
// mode - режим, пока не реализовано, указывать 0
// возвращаемое значение - число байт, записанных в буфер
int __stdcall convert (const char filename[], char buffer[], int mode);