Home | History | Annotate | Line # | Download | only in string
      1 /*	$NetBSD: memset.S,v 1.5 2014/05/23 03:17:31 uebayasi Exp $	*/
      2 
      3 /*-
      4  * Copyright (c) 2003 The NetBSD Foundation, Inc.
      5  * All rights reserved.
      6  *
      7  * This code is derived from software contributed to The NetBSD Foundation
      8  * by David Laight.
      9  *
     10  * Redistribution and use in source and binary forms, with or without
     11  * modification, are permitted provided that the following conditions
     12  * are met:
     13  * 1. Redistributions of source code must retain the above copyright
     14  *    notice, this list of conditions and the following disclaimer.
     15  * 2. Redistributions in binary form must reproduce the above copyright
     16  *    notice, this list of conditions and the following disclaimer in the
     17  *    documentation and/or other materials provided with the distribution.
     18  *
     19  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29  * POSSIBILITY OF SUCH DAMAGE.
     30  */
     31 
     32 #include <machine/asm.h>
     33 
     34 #if defined(LIBC_SCCS)
     35 	RCSID("$NetBSD: memset.S,v 1.5 2014/05/23 03:17:31 uebayasi Exp $")
     36 #endif
     37 
     38 #ifdef BZERO
     39 ENTRY(bzero)
     40 #else
     41 ENTRY(memset)
     42 #endif
        	/*
        	 * One source builds two routines, selected by the BZERO macro:
        	 *   BZERO defined: bzero  - buffer at 4(%esp), length at 8(%esp);
        	 *                  the fill value is always zero.
        	 *   otherwise:     memset - buffer at 4(%esp), fill byte at 8(%esp),
        	 *                  length at 12(%esp); the buffer address is
        	 *                  returned in %eax.
        	 *
        	 * Register roles below: %edi = destination (saved on the stack and
        	 * restored before each ret), %ecx = byte/word count, %eax = fill
        	 * pattern, %edx = scratch.
        	 *
        	 * stosb/stosl only walk upwards when the direction flag is clear;
        	 * nothing here clears it, so that is assumed on entry.
        	 */
     43 #ifdef BZERO
     44 	movl	8(%esp),%ecx
     45 	xor	%eax,%eax
     46 #else
     47 	movl	12(%esp),%ecx
     48 	movzbl	8(%esp),%eax		/* unsigned char, zero extend */
     49 #endif
     50 	cmpl	$0x0f,%ecx		/* avoid mispredicted branch... */
        	/*
        	 * The flags from the cmpl above are consumed by the jbe further
        	 * down; the pushl and movl in between do not modify them.
        	 */
     51 
     52 	pushl	%edi
     53 	movl	8(%esp),%edi		/* buffer: 4(%esp) at entry, +4 for the push */
     54 
     55 	/*
     56 	 * if the string is too short, it's really not worth the overhead
     57 	 * of aligning to word boundaries, etc.  So we jump to a plain
     58 	 * unaligned set.
     59 	 *
     60 	 * NB aligning the transfer is actually pointless on my athlon 700,
     61 	 * It does make a difference to a PII though.
     62 	 *
     63 	 * The PII, PIII and PIV all seem to have a massive performance
     64 	 * drop when the initial target address is an odd multiple of 4.
     65 	 */
     66 	jbe	.Lby_bytes		/* length <= 15 (unsigned compare) */
     67 
     68 #ifndef BZERO
     69 	movb	%al,%ah			/* copy char to all bytes in word */
     70 	movl	%eax,%edx		/* %edx = 0x0000cccc */
     71 	sall	$16,%eax		/* %eax = 0xcccc0000 */
     72 	orl	%edx,%eax		/* %eax = 0xcccccccc */
     73 #endif
     74 
     75 	movl	%edi,%edx		/* detect misalignment */
     76 	neg	%edx
     77 	andl	$7,%edx			/* bytes up to the next 8-byte boundary */
     78 	jnz	.Lalign
     79 .Laligned:
        	/*
        	 * The shrl below drops (length % 4) bytes from the word count, so
        	 * the final four bytes of the buffer are stored first with a
        	 * single, possibly unaligned, write.  The length is at least 9
        	 * on every path that reaches this label.
        	 */
     80 	movl	%eax,-4(%edi,%ecx)	/* zap last 4 bytes */
     81 	shrl	$2,%ecx			/* store by words (zero for bzero) */
     82 	rep
     83 	stosl
     84 .Ldone:
        	/* NOTE(review): no branch to .Ldone is visible in this file. */
     85 #ifndef BZERO
     86 	movl	8(%esp),%eax		/* return address of buffer */
     87 #endif
     88 	pop	%edi
     89 	ret
     90 
     91 .Lalign:
        	/*
        	 * Reached only when length > 15 and %edx is 1..7.  The two
        	 * stores below cover every byte that is skipped when %edi is
        	 * advanced by %edx, and the remaining count stays >= 9.
        	 */
     92 	movl	%eax,(%edi)		/* zap first 8 bytes */
     93 	movl	%eax,4(%edi)
     94 	subl	%edx,%ecx		/* remove from main count */
     95 	add	%edx,%edi		/* %edi is now 8-byte aligned */
     96 	jmp	.Laligned
     97 
     98 .Lby_bytes:
        	/* Short buffers: store %al %ecx times; does nothing when %ecx is 0. */
     99 	rep
    100 	stosb
    101 
    102 #ifndef BZERO
    103 	movl	8(%esp),%eax		/* return address of buffer */
    104 #endif
    105 	popl	%edi
    106 	ret
    107 #ifdef BZERO
    108 END(bzero)
    109 #else
    110 END(memset)
    111 #endif
    112