/* memchr.S revision 1.1 */
/*
 * Written by J.T. Conklin <jtc (at) acorntoolworks.com>
 * Public domain.
 */

#include <machine/asm.h>

/* Emit the revision stamp only when LIBC_SCCS is defined. */
#if defined(LIBC_SCCS)
	RCSID("$NetBSD: memchr.S,v 1.1 2005/12/20 19:28:51 christos Exp $")
#endif

/*
 * void *memchr(const void *s, int c, size_t n)
 *
 * Return the address of the first byte equal to (unsigned char)c among
 * the first n bytes at s, or 0 if there is no such byte.
 *
 * ABI:    System V AMD64
 * In:     %rdi = s, %sil = c (only the low byte is used), %rdx = n
 * Out:    %rax = address of the match, or 0
 * Clobb:  %rcx, %rdx, %rsi, %rdi, %r8, %r9, flags
 *
 * Register roles:
 *   %rdi  next byte to examine
 *   %rdx  number of bytes still to examine
 *   %cl   ch; from .Lword_aligned on, %rcx holds ch in all 8 bytes
 *   %r8   0x0101010101010101
 *   %r9   0x8080808080808080
 *   %rsi  scratch for the word under test
 */
ENTRY(memchr)
	movzbl	%sil,%ecx		/* %rcx = (unsigned char)c */

	testq	%rdx,%rdx		/* nbytes == 0? */
	je	.Lzero

	/*
	 * Align to word boundary: compare one byte at a time until %rdi
	 * is a multiple of 8, so the word loop only does aligned loads.
	 * Consider unrolling loop?
	 */
.Lalign:
	testb	$7,%dil
	je	.Lword_aligned
	movq	%rdi,%rax		/* return value if this byte matches */
	cmpb	(%rdi),%cl
	je	.Ldone
	incq	%rdi
	decq	%rdx
	jnz	.Lalign
	jmp	.Lzero			/* ran out of bytes before aligning */

.Lword_aligned:
	movabsq	$0x0101010101010101,%r8
	movabsq	$0x8080808080808080,%r9

	/*
	 * Copy char to all bytes in word.  ch < 0x100, so the multiply
	 * cannot carry from one byte into the next; %cl still holds ch.
	 */
	imulq	%r8,%rcx

	_ALIGN_TEXT
.Lloop:
	cmpq	$7,%rdx			/* fewer than 8 bytes left? */
	jbe	.Lbyte
	movq	(%rdi),%rsi
	addq	$8,%rdi
	xorq	%rcx,%rsi		/* bytes equal to ch become 0 */
	subq	$8,%rdx
	subq	%r8,%rsi		/* a 0 byte wraps and sets its top bit */
	testq	%r9,%rsi
	je	.Lloop

	/*
	 * The test above never misses a byte equal to ch, but it can
	 * also fire when no byte matches (a byte whose XOR with ch has
	 * its top bit set keeps that bit after the subtraction).  Check
	 * the eight bytes individually and return to the loop if none
	 * of them is equal to ch.  %rdi already points past the word.
	 */

	leaq	-8(%rdi),%rax
	cmpb	-8(%rdi),%cl		/* 1st byte == ch? */
	je	.Ldone

	leaq	-7(%rdi),%rax
	cmpb	-7(%rdi),%cl		/* 2nd byte == ch? */
	je	.Ldone

	leaq	-6(%rdi),%rax
	cmpb	-6(%rdi),%cl		/* 3rd byte == ch? */
	je	.Ldone

	leaq	-5(%rdi),%rax
	cmpb	-5(%rdi),%cl		/* 4th byte == ch? */
	je	.Ldone

	leaq	-4(%rdi),%rax
	cmpb	-4(%rdi),%cl		/* 5th byte == ch? */
	je	.Ldone

	leaq	-3(%rdi),%rax
	cmpb	-3(%rdi),%cl		/* 6th byte == ch? */
	je	.Ldone

	leaq	-2(%rdi),%rax
	cmpb	-2(%rdi),%cl		/* 7th byte == ch? */
	je	.Ldone

	leaq	-1(%rdi),%rax
	cmpb	-1(%rdi),%cl		/* 8th byte == ch? */
	jne	.Lloop			/* false positive: keep scanning */
	ret

	/* Fewer than 8 bytes remain: finish one byte at a time. */
.Lbyte:
	testq	%rdx,%rdx
	je	.Lzero
.Lbyte_loop:
	movq	%rdi,%rax		/* return value if this byte matches */
	cmpb	(%rdi),%cl
	je	.Ldone
	incq	%rdi
	decq	%rdx
	jnz	.Lbyte_loop

.Lzero:
	xorl	%eax,%eax		/* not found: return 0 */

.Ldone:
	ret