Home | History | Annotate | Line # | Download | only in mips
      1 #include "mips_arch.h"
      2 
      3 #ifdef MIPSEB
        # MSB and LSB are byte offsets inside an 8-byte field.  Further down they
        # are added to the addresses given to ldl (+MSB) and ldr (+LSB) when a
        # doubleword is fetched from memory.  With MIPSEB defined (presumably the
        # big-endian build) the most significant byte is the one at offset 0.
      4 # define MSB 0
      5 # define LSB 7
      6 #else
        # Without MIPSEB the two offsets are mirrored.
      7 # define MSB 7
      8 # define LSB 0
      9 #endif
     10 
     11 .text
     12 .set	noat		# $1 is used explicitly as a scratch register below
     13 .set	noreorder	# individual functions switch reorder on/off as needed
     14 
     15 .align	5
        #-----------------------------------------------------------------
        # poly1305_init
        #   Clears the hash part of the context and, when a key pointer is
        #   given, stores the masked key material behind it.
        #
        #   In:    $4 = context block
        #          $5 = pointer to 16 key bytes, or 0 to clear the hash only
        #   Out:   $2 = 0 (always)
        #   Context offsets written here:
        #          0, 8, 16   hash value, set to zero
        #          24         first key dword  & 0x0ffffffc0fffffff
        #          32         second key dword & 0x0ffffffc0ffffffc  (r1)
        #          40         s1 = r1 + (r1 >> 2)
        #   Scratch: $8-$11, plus $1 and $24 on the non-R2 byte swap path;
        #            $2 doubles as scratch there before it gets the result.
        #-----------------------------------------------------------------
     16 .globl	poly1305_init
     17 .ent	poly1305_init
     18 poly1305_init:
     19 	.frame	$29,0,$31
     20 	.set	reorder		# let the assembler deal with delay slots here
     21 
     22 	sd	$0,0($4)		# zero the three hash dwords
     23 	sd	$0,8($4)
     24 	sd	$0,16($4)
     25 
     26 	beqz	$5,.Lno_key	# null key pointer: nothing more to store
     27 
        # Fetch the two key dwords.  The ldl/ldr pairs do not require $5 to be
        # 8-byte aligned; the R6 build uses plain ld instead.
     28 #if defined(_MIPS_ARCH_MIPS64R6)
     29 	ld	$8,0($5)
     30 	ld	$9,8($5)
     31 #else
     32 	ldl	$8,0+MSB($5)
     33 	ldl	$9,8+MSB($5)
     34 	ldr	$8,0+LSB($5)
     35 	ldr	$9,8+LSB($5)
     36 #endif
        # Under MIPSEB both dwords are byte-reversed.  Lines that carry an extra
        # leading blank work on the second dword ($9), interleaved with the
        # same step for the first one ($8).
     37 #ifdef	MIPSEB
     38 # if defined(_MIPS_ARCH_MIPS64R2)
     39 	dsbh	$8,$8		# byte swap
     40 	 dsbh	$9,$9
     41 	dshd	$8,$8
     42 	 dshd	$9,$9
     43 # else
        # Shift-and-mask fallback: first reverse the four bytes inside each
        # 32-bit half, then exchange the two halves.
     44 	ori	$10,$0,0xFF
     45 	dsll	$1,$10,32
     46 	or	$10,$1		# 0x000000FF000000FF
     47 
     48 	and	$11,$8,$10	# byte swap
     49 	 and	$2,$9,$10
     50 	dsrl	$1,$8,24
     51 	 dsrl	$24,$9,24
     52 	dsll	$11,24		# lowest byte of each half moves to the top
     53 	 dsll	$2,24
     54 	and	$1,$10		# top byte of each half moves to the bottom
     55 	 and	$24,$10
     56 	dsll	$10,8			# 0x0000FF000000FF00
     57 	or	$11,$1
     58 	 or	$2,$24
     59 	and	$1,$8,$10
     60 	 and	$24,$9,$10
     61 	dsrl	$8,8
     62 	 dsrl	$9,8
     63 	dsll	$1,8		# the two middle bytes of each half trade places
     64 	 dsll	$24,8
     65 	and	$8,$10
     66 	 and	$9,$10
     67 	or	$11,$1
     68 	 or	$2,$24
     69 	or	$8,$11
     70 	 or	$9,$2
     71 	dsrl	$11,$8,32	# exchange upper and lower 32-bit halves
     72 	 dsrl	$2,$9,32
     73 	dsll	$8,32
     74 	 dsll	$9,32
     75 	or	$8,$11
     76 	 or	$9,$2
     77 # endif
     78 #endif
        # Build the key mask: (((1 << 32) - 63) << 28) - 1.
     79 	li	$10,1
     80 	dsll	$10,32
     81 	daddiu	$10,-63
     82 	dsll	$10,28
     83 	daddiu	$10,-1		# 0ffffffc0fffffff
     84 
     85 	and	$8,$10
     86 	daddiu	$10,-3		# 0ffffffc0ffffffc
     87 	and	$9,$10
     88 
     89 	sd	$8,24($4)
     90 	dsrl	$10,$9,2
     91 	sd	$9,32($4)
     92 	daddu	$10,$9		# s1 = r1 + (r1 >> 2)
     93 	sd	$10,40($4)
     94 
     95 .Lno_key:
     96 	li	$2,0			# return 0
     97 	jr	$31
     98 .end	poly1305_init
     99 .align	5
        #-----------------------------------------------------------------
        # poly1305_blocks
        #   Public entry in front of poly1305_blocks_internal.
        #
        #   In:    $6 = input length in bytes; $4, $5 and $7 are not touched
        #          here and reach poly1305_blocks_internal unchanged.
        #   $6 is replaced by $6 >> 4, the count of whole 16-byte blocks.
        #   A zero count returns immediately.  Otherwise control moves on with
        #   a plain branch (not a call), so poly1305_blocks_internal returns
        #   directly to this function's caller through $31.
        #-----------------------------------------------------------------
    100 .globl	poly1305_blocks
    101 .ent	poly1305_blocks
    102 poly1305_blocks:
    103 	.set	noreorder		# delay slots are filled by hand below
    104 	dsrl	$6,4			# number of complete blocks
    105 	bnez	$6,poly1305_blocks_internal
    106 	nop				# branch delay slot
    107 	jr	$31
    108 	nop				# jump delay slot
    109 .end	poly1305_blocks
    110 
    111 .align	5
        #-----------------------------------------------------------------
        # poly1305_blocks_internal
        #   Absorbs $6 blocks of 16 bytes into the hash held in the context.
        #   No .globl is given for this symbol in this file; it is reached by
        #   the branch in poly1305_blocks.
        #
        #   In:    $4 = context (hash at 0/8/16, key at 24/32/40)
        #          $5 = input pointer, advanced by 16 per block
        #          $6 = block count; the loop body runs before the count is
        #               tested, so it must be non-zero on entry
        #          $7 = value added to the top hash limb for every block
        #               (presumably the pad bit -- confirm with the caller)
        #   Out:   updated hash written back to 0/8/16 of the context
        #   Registers inside the loop:
        #          $12,$13,$14  hash limbs h0,h1,h2
        #          $15,$16      key dwords r0,r1       $17  s1 (context +40)
        #          $8,$9        input dwords, later low/middle product limbs
        #          $25          top product limb
        #          $1,$2,$10,$11,$24  temporaries
        #   $16 and $17 are saved in a 48-byte stack frame and restored on exit.
        #
        #   NOTE(review): dmultu/mflo/mfhi appear with parenthesised operand
        #   lists; these are presumably macros from mips_arch.h, which is not
        #   visible here.  The comments below assume mflo/mfhi deliver the
        #   low/high 64 bits of the product into their first operand.
        #   Lines with an extra leading blank are independent additions placed
        #   between a multiply and the reads of its result.
        #-----------------------------------------------------------------
    112 .ent	poly1305_blocks_internal
    113 poly1305_blocks_internal:
    114 	.frame	$29,6*8,$31
    115 	.mask	0x00030000,-8
    116 	.set	noreorder
    117 	dsubu	$29,6*8		# open the 48-byte frame
    118 	sd	$17,40($29)
    119 	sd	$16,32($29)
    120 	.set	reorder
    121 
    122 	ld	$12,0($4)		# load hash value
    123 	ld	$13,8($4)
    124 	ld	$14,16($4)
    125 
    126 	ld	$15,24($4)		# load key
    127 	ld	$16,32($4)
    128 	ld	$17,40($4)
    129 
    130 .Loop:
    131 #if defined(_MIPS_ARCH_MIPS64R6)
    132 	ld	$8,0($5)		# load input
    133 	ld	$9,8($5)
    134 #else
    135 	ldl	$8,0+MSB($5)	# load input
    136 	ldl	$9,8+MSB($5)
    137 	ldr	$8,0+LSB($5)
    138 	ldr	$9,8+LSB($5)
    139 #endif
    140 	daddiu	$6,-1		# one block fewer to go
    141 	daddiu	$5,16		# step to the next block
        # Same byte reversal as in poly1305_init, applied to the input dwords.
    142 #ifdef	MIPSEB
    143 # if defined(_MIPS_ARCH_MIPS64R2)
    144 	dsbh	$8,$8		# byte swap
    145 	 dsbh	$9,$9
    146 	dshd	$8,$8
    147 	 dshd	$9,$9
    148 # else
    149 	ori	$10,$0,0xFF
    150 	dsll	$1,$10,32
    151 	or	$10,$1		# 0x000000FF000000FF
    152 
    153 	and	$11,$8,$10	# byte swap
    154 	 and	$2,$9,$10
    155 	dsrl	$1,$8,24
    156 	 dsrl	$24,$9,24
    157 	dsll	$11,24
    158 	 dsll	$2,24
    159 	and	$1,$10
    160 	 and	$24,$10
    161 	dsll	$10,8			# 0x0000FF000000FF00
    162 	or	$11,$1
    163 	 or	$2,$24
    164 	and	$1,$8,$10
    165 	 and	$24,$9,$10
    166 	dsrl	$8,8
    167 	 dsrl	$9,8
    168 	dsll	$1,8
    169 	 dsll	$24,8
    170 	and	$8,$10
    171 	 and	$9,$10
    172 	or	$11,$1
    173 	 or	$2,$24
    174 	or	$8,$11
    175 	 or	$9,$2
    176 	dsrl	$11,$8,32	# exchange upper and lower 32-bit halves
    177 	 dsrl	$2,$9,32
    178 	dsll	$8,32
    179 	 dsll	$9,32
    180 	or	$8,$11
    181 	 or	$9,$2
    182 # endif
    183 #endif
    184 	daddu	$12,$8		# accumulate input
    185 	daddu	$13,$9
    186 	sltu	$10,$12,$8	# carry out of the h0 addition
    187 	sltu	$11,$13,$9	# carry out of the h1 addition
    188 	daddu	$13,$10		# fold the h0 carry into h1
    189 
    190 	dmultu	($15,$12)		# h0*r0
    191 	 daddu	$14,$7		# h2 += $7
    192 	 sltu	$10,$13,$10	# carry produced by folding into h1
    193 	mflo	($8,$15,$12)
    194 	mfhi	($9,$15,$12)
    195 
    196 	dmultu	($17,$13)		# h1*5*r1
    197 	 daddu	$10,$11		# combine both h1 carries ...
    198 	 daddu	$14,$10		# ... and add them to h2
    199 	mflo	($10,$17,$13)
    200 	mfhi	($11,$17,$13)
    201 
    202 	dmultu	($16,$12)		# h0*r1
    203 	 daddu	$8,$10
    204 	 daddu	$9,$11
    205 	mflo	($1,$16,$12)
    206 	mfhi	($25,$16,$12)
    207 	 sltu	$10,$8,$10	# carry from the low limb
    208 	 daddu	$9,$10
    209 
    210 	dmultu	($15,$13)		# h1*r0
    211 	 daddu	$9,$1
    212 	 sltu	$1,$9,$1	# carry from the middle limb
    213 	mflo	($10,$15,$13)
    214 	mfhi	($11,$15,$13)
    215 	 daddu	$25,$1
    216 
    217 	dmultu	($17,$14)		# h2*5*r1
    218 	 daddu	$9,$10
    219 	 daddu	$25,$11
    220 	mflo	($1,$17,$14)	# only the low half of this product is read
    221 
    222 	dmultu	($15,$14)		# h2*r0
    223 	 sltu	$10,$9,$10
    224 	 daddu	$25,$10
    225 	mflo	($2,$15,$14)	# only the low half of this product is read
    226 
    227 	daddu	$9,$1
    228 	daddu	$25,$2
    229 	sltu	$1,$9,$1
    230 	daddu	$25,$1
    231 
        # Split the top limb: its low two bits stay as h2, and the rest is
        # folded back into the low limb as ($25 & ~3) + ($25 >> 2), i.e. five
        # times ($25 >> 2), with the carries rippling up through h1 and h2.
    232 	li	$10,-4		# final reduction
    233 	and	$10,$25
    234 	dsrl	$11,$25,2
    235 	andi	$14,$25,3
    236 	daddu	$10,$11
    237 	daddu	$12,$8,$10
    238 	sltu	$10,$12,$10
    239 	daddu	$13,$9,$10
    240 	sltu	$10,$13,$10
    241 	daddu	$14,$14,$10
    242 
    243 	bnez	$6,.Loop	# more blocks pending
    244 
    245 	sd	$12,0($4)		# store hash value
    246 	sd	$13,8($4)
    247 	sd	$14,16($4)
    248 
    249 	.set	noreorder
    250 	ld	$17,40($29)		# epilogue
    251 	ld	$16,32($29)
    252 	jr	$31
    253 	daddu	$29,6*8		# delay slot: release the frame
    254 .end	poly1305_blocks_internal
    255 .align	5
        #-----------------------------------------------------------------
        # poly1305_emit
        #   Produces the 16-byte tag from the hash stored in the context.
        #
        #   In:    $4 = context (hash dwords read from 0, 8, 16)
        #          $5 = output buffer, 16 bytes written with byte stores
        #          $6 = nonce, read as four 32-bit words with lwu; no byte
        #               swapping is applied to them in this routine
        #   Out:   tag bytes at 0..15($5), least significant byte first.
        #          $2 is used as scratch and not set to a result value.
        #   Scratch: $1, $2, $8-$11
        #-----------------------------------------------------------------
    256 .globl	poly1305_emit
    257 .ent	poly1305_emit
    258 poly1305_emit:
    259 	.frame	$29,0,$31
    260 	.set	reorder		# let the assembler deal with delay slots here
    261 
    262 	ld	$10,0($4)
    263 	ld	$11,8($4)
    264 	ld	$1,16($4)
    265 
        # Form hash + 5 across all three limbs.  A carry that reaches bit 2 of
        # the top limb selects the incremented value, otherwise the hash is
        # kept unchanged.
    266 	daddiu	$8,$10,5		# compare to modulus
    267 	sltiu	$2,$8,5		# carry out of the low dword
    268 	daddu	$9,$11,$2
    269 	sltu	$2,$9,$2	# carry out of the second dword
    270 	daddu	$1,$1,$2
    271 
        # Turn the carry into a select mask.  This assumes the top limb is small
        # enough that ($1 >> 2) is 0 or 1 -- TODO confirm against the reduction
        # in poly1305_blocks_internal.
    272 	dsrl	$1,2			# see if it carried/borrowed
    273 	dsubu	$1,$0,$1	# 0, or all ones when the shifted value was 1
    274 	nor	$2,$0,$1	# complement of that mask
    275 
    276 	and	$8,$1		# keep hash+5 where the mask is set ...
    277 	and	$10,$2		# ... and the original hash elsewhere
    278 	and	$9,$1
    279 	and	$11,$2
    280 	or	$8,$10
    281 	or	$9,$11
    282 
    283 	lwu	$10,0($6)		# load nonce
    284 	lwu	$11,4($6)
    285 	lwu	$1,8($6)
    286 	lwu	$2,12($6)
    287 	dsll	$11,32
    288 	dsll	$2,32
    289 	or	$10,$11		# words 0 and 1 as one dword
    290 	or	$1,$2		# words 2 and 3 as one dword
    291 
    292 	daddu	$8,$10		# accumulate nonce
    293 	daddu	$9,$1
    294 	sltu	$10,$8,$10	# carry out of the low dword
    295 	daddu	$9,$10		# a carry out of the high dword is dropped
    296 
        # Byte-by-byte stores, with shifts for later bytes interleaved with the
        # stores of earlier ones.  Bytes 0..7 come from $8, 8..15 from $9.
    297 	dsrl	$10,$8,8		# write mac value
    298 	dsrl	$11,$8,16
    299 	dsrl	$1,$8,24
    300 	sb	$8,0($5)
    301 	dsrl	$2,$8,32
    302 	sb	$10,1($5)
    303 	dsrl	$10,$8,40
    304 	sb	$11,2($5)
    305 	dsrl	$11,$8,48
    306 	sb	$1,3($5)
    307 	dsrl	$1,$8,56
    308 	sb	$2,4($5)
    309 	dsrl	$2,$9,8
    310 	sb	$10,5($5)
    311 	dsrl	$10,$9,16
    312 	sb	$11,6($5)
    313 	dsrl	$11,$9,24
    314 	sb	$1,7($5)
    315 
    316 	sb	$9,8($5)
    317 	dsrl	$1,$9,32
    318 	sb	$2,9($5)
    319 	dsrl	$2,$9,40
    320 	sb	$10,10($5)
    321 	dsrl	$10,$9,48
    322 	sb	$11,11($5)
    323 	dsrl	$11,$9,56
    324 	sb	$1,12($5)
    325 	sb	$2,13($5)
    326 	sb	$10,14($5)
    327 	sb	$11,15($5)
    328 
    329 	jr	$31
    330 .end	poly1305_emit
    331 .rdata
        # Identification string, emitted into the .rdata section; nothing in
        # this file refers to it.
    332 .asciiz	"Poly1305 for MIPS64, CRYPTOGAMS by <appro (at) openssl.org>"
    333 .align	2
    334