Home | History | Annotate | Line # | Download | only in sparc32
      1 dnl  SPARC mpn_addmul_1 -- Multiply a limb vector with a limb and add the
      2 dnl  result to a second limb vector.
      3 
      4 dnl  Copyright 1992-1994, 2000 Free Software Foundation, Inc.
      5 
      6 dnl  This file is part of the GNU MP Library.
      7 dnl
      8 dnl  The GNU MP Library is free software; you can redistribute it and/or modify
      9 dnl  it under the terms of either:
     10 dnl
     11 dnl    * the GNU Lesser General Public License as published by the Free
     12 dnl      Software Foundation; either version 3 of the License, or (at your
     13 dnl      option) any later version.
     14 dnl
     15 dnl  or
     16 dnl
     17 dnl    * the GNU General Public License as published by the Free Software
     18 dnl      Foundation; either version 2 of the License, or (at your option) any
     19 dnl      later version.
     20 dnl
     21 dnl  or both in parallel, as here.
     22 dnl
     23 dnl  The GNU MP Library is distributed in the hope that it will be useful, but
     24 dnl  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
     25 dnl  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
     26 dnl  for more details.
     27 dnl
     28 dnl  You should have received copies of the GNU General Public License and the
     29 dnl  GNU Lesser General Public License along with the GNU MP Library.  If not,
     30 dnl  see https://www.gnu.org/licenses/.
     31 
     32 
     33 include(`../config.m4')
     34 
     35 C INPUT PARAMETERS
     36 C res_ptr	o0
     37 C s1_ptr	o1
     38 C size		o2
     39 C s2_limb	o3
        C
        C OPERATION
        C For each of the `size' 32-bit limbs, multiply the limb at s1_ptr by
        C s2_limb, add the product plus the running carry limb to the limb at
        C res_ptr, and store the low 32 bits back at res_ptr.  The final carry
        C limb is returned in o0.
        C
        C The first limb is loaded and processed before the loop counter is ever
        C tested, so the code as written requires size >= 1.
        C
        C Two code paths are used, selected on the unsigned value of s2_limb:
        C   s2_limb <= 0xfff   12 multiply steps per limb, s2_limb in %y
        C   s2_limb >  0xfff   32 multiply steps per limb, s1 limb in %y
        C
        C REGISTER USE AFTER SETUP
        C o0	carry limb between iterations; return value
        C o1	one past the end of the s1 block
        C o2	negative byte offset, stepped by 4 up to zero
        C o3	s2_limb
        C o4	end of the res block minus 4 (o2 is advanced before res is accessed)
        C o5	alternately the current s1 limb and the current res limb
        C g1-g4	scratch
     40 
     41 ASM_START()
     42 PROLOGUE(mpn_addmul_1)
     43 	C Make S1_PTR and RES_PTR point at the end of their blocks
     44 	C and put (- 4 x SIZE) in index/loop counter.
     45 	sll	%o2,2,%o2	C o2 = size in bytes
     46 	add	%o0,%o2,%o4	C RES_PTR in o4 since o0 is retval
     47 	add	%o1,%o2,%o1	C o1 = end of s1 block
     48 	sub	%g0,%o2,%o2	C o2 = -(4 x size)
     49 
     50 	cmp	%o3,0xfff
     51 	bgu	L(large)	C unsigned: s2_limb needs more than 12 bits
     52 	nop			C branch delay slot
     53 
        	C Small multiplier path: s2_limb <= 0xfff.
     54 	ld	[%o1+%o2],%o5	C o5 = first s1 limb
     55 	mov	0,%o0		C carry limb = 0
     56 	b	L(0)
     57 	 add	%o4,-4,%o4	C (delay slot) bias res pointer by one limb
     58 L(loop0):
        	C Finish the previous limb (o5 = res limb, g1 = product low + carry)
        	C while fetching the next s1 limb.
     59 	addcc	%o5,%g1,%g1	C add res limb, carry out in icc.C
     60 	ld	[%o1+%o2],%o5	C o5 = next s1 limb
     61 	addx	%o0,%g0,%o0	C fold that carry into the carry limb
     62 	st	%g1,[%o4+%o2]	C store finished res limb
     63 L(0):	wr	%g0,%o3,%y	C y = s2_limb (multiplier)
     64 	sra	%o5,31,%g2	C g2 = mask of ones iff s1 limb has bit 31 set
     65 	and	%o3,%g2,%g2	C g2 = s2_limb iff s1 limb bit 31 set, else 0
     66 	andcc	%g1,0,%g1	C g1 = 0 and condition codes reset for mulscc
        	C 12 multiply steps, one per multiplier bit, with o5 as multiplicand.
     67 	mulscc	%g1,%o5,%g1
     68 	mulscc	%g1,%o5,%g1
     69 	mulscc	%g1,%o5,%g1
     70 	mulscc	%g1,%o5,%g1
     71 	mulscc	%g1,%o5,%g1
     72 	mulscc	%g1,%o5,%g1
     73 	mulscc	%g1,%o5,%g1
     74 	mulscc	%g1,%o5,%g1
     75 	mulscc	%g1,%o5,%g1
     76 	mulscc	%g1,%o5,%g1
     77 	mulscc	%g1,%o5,%g1
     78 	mulscc	%g1,%o5,%g1
     79 	mulscc	%g1,0,%g1	C final step: shift only, nothing added
        	C The product now sits in g1 (bits 12 and up) and the top 12 bits
        	C of y (bits 0-11); realign it into a high limb and a low limb.
     80 	sra	%g1,20,%g4	C g4 = high limb (signed)
     81 	sll	%g1,12,%g1
     82 	rd	%y,%g3
     83 	srl	%g3,20,%g3
     84 	or	%g1,%g3,%g1	C g1 = low limb
     85 
     86 	addcc	%g1,%o0,%g1	C low limb + incoming carry limb
     87 	addx	%g2,%g4,%o0	C add sign-compensation and cy to hi limb
     88 	addcc	%o2,4,%o2	C loop counter
     89 	bne	L(loop0)
     90 	 ld	[%o4+%o2],%o5	C (delay slot) o5 = res limb for the limb just multiplied
     91 
        	C Last limb: same tail as the top of the loop, then return.
     92 	addcc	%o5,%g1,%g1
     93 	addx	%o0,%g0,%o0	C o0 = final carry limb (return value)
     94 	retl
     95 	st	%g1,[%o4+%o2]	C (delay slot) store last res limb
     96 
        	C Large multiplier path: s2_limb > 0xfff.  The roles are swapped:
        	C the s1 limb goes in y and s2_limb is the mulscc multiplicand.
     97 L(large):
     98 	ld	[%o1+%o2],%o5	C o5 = first s1 limb
     99 	mov	0,%o0		C carry limb = 0
    100 	sra	%o3,31,%g4	C g4 = mask of ones iff S2_LIMB < 0
    101 	b	L(1)
    102 	 add	%o4,-4,%o4	C (delay slot) bias res pointer by one limb
    103 L(loop):
        	C Finish the previous limb (o5 = res limb, g3 = product low + carry)
        	C while fetching the next s1 limb.
    104 	addcc	%o5,%g3,%g3	C add res limb, carry out in icc.C
    105 	ld	[%o1+%o2],%o5	C o5 = next s1 limb
    106 	addx	%o0,%g0,%o0	C fold that carry into the carry limb
    107 	st	%g3,[%o4+%o2]	C store finished res limb
        	C NOTE(review): only two instructions separate this wr from the first
        	C mulscc, versus three in the small path.  Confirm against the SPARC V8
        	C delayed-write rule for WRY on the targeted implementations.
    108 L(1):	wr	%g0,%o5,%y	C y = s1 limb (multiplier)
    109 	and	%o5,%g4,%g2	C g2 = s1 limb iff s2_limb < 0, else 0
    110 	andcc	%g0,%g0,%g1	C g1 = 0 and condition codes reset for mulscc
        	C 32 multiply steps, one per multiplier bit, with o3 as multiplicand.
    111 	mulscc	%g1,%o3,%g1
    112 	mulscc	%g1,%o3,%g1
    113 	mulscc	%g1,%o3,%g1
    114 	mulscc	%g1,%o3,%g1
    115 	mulscc	%g1,%o3,%g1
    116 	mulscc	%g1,%o3,%g1
    117 	mulscc	%g1,%o3,%g1
    118 	mulscc	%g1,%o3,%g1
    119 	mulscc	%g1,%o3,%g1
    120 	mulscc	%g1,%o3,%g1
    121 	mulscc	%g1,%o3,%g1
    122 	mulscc	%g1,%o3,%g1
    123 	mulscc	%g1,%o3,%g1
    124 	mulscc	%g1,%o3,%g1
    125 	mulscc	%g1,%o3,%g1
    126 	mulscc	%g1,%o3,%g1
    127 	mulscc	%g1,%o3,%g1
    128 	mulscc	%g1,%o3,%g1
    129 	mulscc	%g1,%o3,%g1
    130 	mulscc	%g1,%o3,%g1
    131 	mulscc	%g1,%o3,%g1
    132 	mulscc	%g1,%o3,%g1
    133 	mulscc	%g1,%o3,%g1
    134 	mulscc	%g1,%o3,%g1
    135 	mulscc	%g1,%o3,%g1
    136 	mulscc	%g1,%o3,%g1
    137 	mulscc	%g1,%o3,%g1
    138 	mulscc	%g1,%o3,%g1
    139 	mulscc	%g1,%o3,%g1
    140 	mulscc	%g1,%o3,%g1
    141 	mulscc	%g1,%o3,%g1
    142 	mulscc	%g1,%o3,%g1
    143 	mulscc	%g1,%g0,%g1	C final step: shift only, nothing added
    144 	rd	%y,%g3		C g3 = low limb of product; g1 = high limb
    145 	addcc	%g3,%o0,%g3	C low limb + incoming carry limb
    146 	addx	%g2,%g1,%o0	C new carry limb = sign-compensation + high limb + cy
    147 	addcc	%o2,4,%o2	C advance index; Z set after the last limb
    148 	bne	L(loop)
    149 	 ld	[%o4+%o2],%o5	C (delay slot) o5 = res limb for the limb just multiplied
    150 
        	C Last limb: same tail as the top of the loop, then return.
    151 	addcc	%o5,%g3,%g3
    152 	addx	%o0,%g0,%o0	C o0 = final carry limb (return value)
    153 	retl
    154 	st	%g3,[%o4+%o2]	C (delay slot) store last res limb
    155 EPILOGUE(mpn_addmul_1)
    156