forked from KolibriOS/kolibrios
53 lines
1.0 KiB
NASM
53 lines
1.0 KiB
NASM
|
/* Copyright (C) 1995 DJ Delorie, see COPYING.DJ for details */
|
||
|
##include<libc/asm.h>
|
||
|
# .file "memset.s"
|
||
|
.text
|
||
|
.global _memset
|
||
|
.align 4
|
||
|
_memset:
|
||
|
pushl %ebp
|
||
|
movl %esp,%ebp
|
||
|
pushl %edi
|
||
|
movl 8(%ebp),%edi
|
||
|
movl 12(%ebp),%eax
|
||
|
movl 16(%ebp),%ecx
|
||
|
cld
|
||
|
|
||
|
# We will handle memsets of <= 15 bytes one byte at a time.
|
||
|
# This avoids some extra overhead for small memsets, and
|
||
|
# knowing we are setting > 15 bytes eliminates some annoying
|
||
|
# checks in the "long move" case.
|
||
|
cmpl $15,%ecx
|
||
|
jle L3
|
||
|
|
||
|
# Otherwise, tile the byte value out into %eax.
|
||
|
# 0x41 -> 0x41414141, etc.
|
||
|
movb %al,%ah
|
||
|
movl %eax,%edx
|
||
|
sall $16,%eax
|
||
|
movw %dx,%ax
|
||
|
jmp L2
|
||
|
|
||
|
# Handle any cruft necessary to get %edi long-aligned.
|
||
|
L1: stosb
|
||
|
decl %ecx
|
||
|
L2: testl $3,%edi
|
||
|
jnz L1
|
||
|
|
||
|
# Now slam out all of the longs.
|
||
|
movl %ecx,%edx
|
||
|
shrl $2,%ecx
|
||
|
rep
|
||
|
stosl
|
||
|
|
||
|
# Finally, handle any trailing cruft. We know the high three bytes
|
||
|
# of %ecx must be zero, so just put the "slop count" in the low byte.
|
||
|
movb %dl,%cl
|
||
|
andb $3,%cl
|
||
|
L3: rep
|
||
|
stosb
|
||
|
popl %edi
|
||
|
movl 8(%ebp),%eax
|
||
|
leave
|
||
|
ret
|