Home | History | Annotate | Line # | Download | only in arm
lib1funcs.S revision 1.8
      1 @ libgcc routines for ARM cpu.
      2 @ Division routines, written by Richard Earnshaw, (rearnsha@armltd.co.uk)
      3 
      4 /* Copyright (C) 1995-2019 Free Software Foundation, Inc.
      5 
      6 This file is free software; you can redistribute it and/or modify it
      7 under the terms of the GNU General Public License as published by the
      8 Free Software Foundation; either version 3, or (at your option) any
      9 later version.
     10 
     11 This file is distributed in the hope that it will be useful, but
     12 WITHOUT ANY WARRANTY; without even the implied warranty of
     13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
     14 General Public License for more details.
     15 
     16 Under Section 7 of GPL version 3, you are granted additional
     17 permissions described in the GCC Runtime Library Exception, version
     18 3.1, as published by the Free Software Foundation.
     19 
     20 You should have received a copy of the GNU General Public License and
     21 a copy of the GCC Runtime Library Exception along with this program;
     22 see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
     23 <http://www.gnu.org/licenses/>.  */
     24 
     25 /* An executable stack is *not* required for these functions.  */
     26 #if defined(__ELF__) && defined(__linux__)
     27 .section .note.GNU-stack,"",%progbits
     28 .previous
     29 #endif  /* __ELF__ and __linux__ */
     30 
     31 #ifdef __ARM_EABI__
     32 /* Some attributes that are common to all routines in this file.  */
     33 	/* Tag_ABI_align_needed: This code does not require 8-byte
     34 	   alignment from the caller.  */
     35 	/* .eabi_attribute 24, 0  -- default setting.  */
     36 	/* Tag_ABI_align_preserved: This code preserves 8-byte
     37 	   alignment in any callee.  */
     38 	.eabi_attribute 25, 1
     39 #endif /* __ARM_EABI__ */
     40 /* ------------------------------------------------------------------------ */
     41 
     42 /* We need to know what prefix to add to function names.  */
     43 
     44 #ifndef __USER_LABEL_PREFIX__
     45 #error  __USER_LABEL_PREFIX__ not defined
     46 #endif
     47 
     48 /* ANSI concatenation macros.  */
     49 
     50 #define CONCAT1(a, b) CONCAT2(a, b)
     51 #define CONCAT2(a, b) a ## b
     52 
     53 /* Use the right prefix for global labels.  */
     54 
     55 #define SYM(x) CONCAT1 (__USER_LABEL_PREFIX__, x)
     56 
     57 #ifdef __ELF__
     58 #ifdef __thumb__
     59 #define __PLT__  /* Not supported in Thumb assembler (for now).  */
     60 #elif defined __vxworks && !defined __PIC__
     61 #define __PLT__ /* Not supported by the kernel loader.  */
     62 #else
     63 #define __PLT__ (PLT)
     64 #endif
     65 #define TYPE(x) .type SYM(x),function
     66 #define SIZE(x) .size SYM(x), . - SYM(x)
     67 #define LSYM(x) .x
     68 #else
     69 #define __PLT__
     70 #define TYPE(x)
     71 #define SIZE(x)
     72 #define LSYM(x) x
     73 #endif
     74 
     75 /* Function end macros.  Variants for interworking.  */
     76 
     77 /* There are times when we might prefer Thumb1 code even if ARM code is
     78    permitted, for example, the code might be smaller, or there might be
     79    interworking problems with switching to ARM state if interworking is
     80    disabled.  */
     81 #if (defined(__thumb__)			\
     82      && !defined(__thumb2__)		\
     83      && (!defined(__THUMB_INTERWORK__)	\
     84 	 || defined (__OPTIMIZE_SIZE__)	\
     85 	 || !__ARM_ARCH_ISA_ARM))
     86 # define __prefer_thumb__
     87 #endif
     88 
     89 #if !__ARM_ARCH_ISA_ARM && __ARM_ARCH_ISA_THUMB == 1
     90 #define NOT_ISA_TARGET_32BIT 1
     91 #endif
     92 
     93 /* How to return from a function call depends on the architecture variant.  */
     94 
     95 #if (__ARM_ARCH > 4) || defined(__ARM_ARCH_4T__)
     96 
     97 # define RET		bx	lr
     98 # define RETc(x)	bx##x	lr
     99 
    100 /* Special precautions for interworking on armv4t.  */
    101 # if (__ARM_ARCH == 4)
    102 
    103 /* Always use bx, not ldr pc.  */
    104 #  if (defined(__thumb__) || defined(__THUMB_INTERWORK__))
    105 #    define __INTERWORKING__
    106 #   endif /* __THUMB__ || __THUMB_INTERWORK__ */
    107 
    108 /* Include thumb stub before arm mode code.  */
    109 #  if defined(__thumb__) && !defined(__THUMB_INTERWORK__)
    110 #   define __INTERWORKING_STUBS__
    111 #  endif /* __thumb__ && !__THUMB_INTERWORK__ */
    112 
    113 #endif /* __ARM_ARCH == 4 */
    114 
    115 #else
    116 
    117 # define RET		mov	pc, lr
    118 # define RETc(x)	mov##x	pc, lr
    119 
    120 #endif
    121 
    122 .macro	cfi_pop		advance, reg, cfa_offset
    123 #ifdef __ELF__
    124 	.pushsection	.debug_frame
    125 	.byte	0x4		/* DW_CFA_advance_loc4 */
    126 	.4byte	\advance
    127 	.byte	(0xc0 | \reg)	/* DW_CFA_restore */
    128 	.byte	0xe		/* DW_CFA_def_cfa_offset */
    129 	.uleb128 \cfa_offset
    130 	.popsection
    131 #endif
    132 .endm
    133 .macro	cfi_push	advance, reg, offset, cfa_offset
    134 #ifdef __ELF__
    135 	.pushsection	.debug_frame
    136 	.byte	0x4		/* DW_CFA_advance_loc4 */
    137 	.4byte	\advance
    138 	.byte	(0x80 | \reg)	/* DW_CFA_offset */
    139 	.uleb128 (\offset / -4)
    140 	.byte	0xe		/* DW_CFA_def_cfa_offset */
    141 	.uleb128 \cfa_offset
    142 	.popsection
    143 #endif
    144 .endm
    145 .macro cfi_start	start_label, end_label
    146 #ifdef __ELF__
    147 	.pushsection	.debug_frame
    148 LSYM(Lstart_frame):
    149 	.4byte	LSYM(Lend_cie) - LSYM(Lstart_cie) @ Length of CIE
    150 LSYM(Lstart_cie):
    151         .4byte	0xffffffff	@ CIE Identifier Tag
    152         .byte	0x1	@ CIE Version
    153         .ascii	"\0"	@ CIE Augmentation
    154         .uleb128 0x1	@ CIE Code Alignment Factor
    155         .sleb128 -4	@ CIE Data Alignment Factor
    156         .byte	0xe	@ CIE RA Column
    157         .byte	0xc	@ DW_CFA_def_cfa
    158         .uleb128 0xd
    159         .uleb128 0x0
    160 
    161 	.align 2
    162 LSYM(Lend_cie):
    163 	.4byte	LSYM(Lend_fde)-LSYM(Lstart_fde)	@ FDE Length
    164 LSYM(Lstart_fde):
    165 	.4byte	LSYM(Lstart_frame)	@ FDE CIE offset
    166 	.4byte	\start_label	@ FDE initial location
    167 	.4byte	\end_label-\start_label	@ FDE address range
    168 	.popsection
    169 #endif
    170 .endm
    171 .macro cfi_end	end_label
    172 #ifdef __ELF__
    173 	.pushsection	.debug_frame
    174 	.align	2
    175 LSYM(Lend_fde):
    176 	.popsection
    177 \end_label:
    178 #endif
    179 .endm
    180 
    181 /* Don't pass dirn, it's there just to get token pasting right.  */
    182 
    183 .macro	RETLDM	regs=, cond=, unwind=, dirn=ia
    184 #if defined (__INTERWORKING__)
    185 	.ifc "\regs",""
    186 	ldr\cond	lr, [sp], #8
    187 	.else
    188 # if defined(__thumb2__)
    189 	pop\cond	{\regs, lr}
    190 # else
    191 	ldm\cond\dirn	sp!, {\regs, lr}
    192 # endif
    193 	.endif
    194 	.ifnc "\unwind", ""
    195 	/* Mark LR as restored.  */
    196 97:	cfi_pop 97b - \unwind, 0xe, 0x0
    197 	.endif
    198 	bx\cond	lr
    199 #else
    200 	/* Caller is responsible for providing IT instruction.  */
    201 	.ifc "\regs",""
    202 	ldr\cond	pc, [sp], #8
    203 	.else
    204 # if defined(__thumb2__)
    205 	pop\cond	{\regs, pc}
    206 # else
    207 	ldm\cond\dirn	sp!, {\regs, pc}
    208 # endif
    209 	.endif
    210 #endif
    211 .endm
    212 
    213 /* The Unified assembly syntax allows the same code to be assembled for both
    214    ARM and Thumb-2.  However this is only supported by recent gas, so define
    215    a set of macros to allow ARM code on older assemblers.  */
    216 #if defined(__thumb2__)
    217 .macro do_it cond, suffix=""
    218 	it\suffix	\cond
    219 .endm
    220 .macro shift1 op, arg0, arg1, arg2
    221 	\op	\arg0, \arg1, \arg2
    222 .endm
    223 #define do_push	push
    224 #define do_pop	pop
    225 #define COND(op1, op2, cond) op1 ## op2 ## cond
    226 /* Perform an arithmetic operation with a variable shift operand.  This
    227    requires two instructions and a scratch register on Thumb-2.  */
    228 .macro shiftop name, dest, src1, src2, shiftop, shiftreg, tmp
    229 	\shiftop \tmp, \src2, \shiftreg
    230 	\name \dest, \src1, \tmp
    231 .endm
    232 #else
    233 .macro do_it cond, suffix=""
    234 .endm
    235 .macro shift1 op, arg0, arg1, arg2
    236 	mov	\arg0, \arg1, \op \arg2
    237 .endm
    238 #define do_push	stmfd sp!,
    239 #define do_pop	ldmfd sp!,
    240 #define COND(op1, op2, cond) op1 ## cond ## op2
    241 .macro shiftop name, dest, src1, src2, shiftop, shiftreg, tmp
    242 	\name \dest, \src1, \src2, \shiftop \shiftreg
    243 .endm
    244 #endif
    245 
    246 #ifdef __ARM_EABI__
    247 .macro ARM_LDIV0 name signed
    248 	cmp	r0, #0
    249 	.ifc	\signed, unsigned
    250 	movne	r0, #0xffffffff
    251 	.else
    252 	movgt	r0, #0x7fffffff
    253 	movlt	r0, #0x80000000
    254 	.endif
    255 	b	SYM (__aeabi_idiv0) __PLT__
    256 .endm
    257 #else
    258 .macro ARM_LDIV0 name signed
    259 	str	lr, [sp, #-8]!
    260 98:	cfi_push 98b - __\name, 0xe, -0x8, 0x8
    261 	bl	SYM (__div0) __PLT__
    262 	mov	r0, #0			@ About as wrong as it could be.
    263 	RETLDM	unwind=98b
    264 .endm
    265 #endif
    266 
    267 
    268 #ifdef __ARM_EABI__
    269 .macro THUMB_LDIV0 name signed
    270 #ifdef NOT_ISA_TARGET_32BIT
    271 
    272 	push	{r0, lr}
    273 	mov	r0, #0
    274 	bl	SYM(__aeabi_idiv0)
    275 	@ We know we are not on armv4t, so pop pc is safe.
    276 	pop	{r1, pc}
    277 
    278 #elif defined(__thumb2__)
    279 	.syntax unified
    280 	.ifc \signed, unsigned
    281 	cbz	r0, 1f
    282 	mov	r0, #0xffffffff
    283 1:
    284 	.else
    285 	cmp	r0, #0
    286 	do_it	gt
    287 	movgt	r0, #0x7fffffff
    288 	do_it	lt
    289 	movlt	r0, #0x80000000
    290 	.endif
    291 	b.w	SYM(__aeabi_idiv0) __PLT__
    292 #else
    293 	.align	2
    294 	bx	pc
    295 	nop
    296 	.arm
    297 	cmp	r0, #0
    298 	.ifc	\signed, unsigned
    299 	movne	r0, #0xffffffff
    300 	.else
    301 	movgt	r0, #0x7fffffff
    302 	movlt	r0, #0x80000000
    303 	.endif
    304 	b	SYM(__aeabi_idiv0) __PLT__
    305 	.thumb
    306 #endif
    307 .endm
    308 #else
    309 .macro THUMB_LDIV0 name signed
    310 	push	{ r1, lr }
    311 98:	cfi_push 98b - __\name, 0xe, -0x4, 0x8
    312 	bl	SYM (__div0)
    313 	mov	r0, #0			@ About as wrong as it could be.
    314 #if defined (__INTERWORKING__)
    315 	pop	{ r1, r2 }
    316 	bx	r2
    317 #else
    318 	pop	{ r1, pc }
    319 #endif
    320 .endm
    321 #endif
    322 
    323 .macro FUNC_END name
    324 	SIZE (__\name)
    325 .endm
    326 
    327 .macro DIV_FUNC_END name signed
    328 	cfi_start	__\name, LSYM(Lend_div0)
    329 LSYM(Ldiv0):
    330 #ifdef __thumb__
    331 	THUMB_LDIV0 \name \signed
    332 #else
    333 	ARM_LDIV0 \name \signed
    334 #endif
    335 	cfi_end	LSYM(Lend_div0)
    336 	FUNC_END \name
    337 .endm
    338 
    339 .macro THUMB_FUNC_START name
    340 	.globl	SYM (\name)
    341 	TYPE	(\name)
    342 	.thumb_func
    343 SYM (\name):
    344 .endm
    345 
    346 /* Function start macros.  Variants for ARM and Thumb.  */
    347 
    348 #ifdef __thumb__
    349 #define THUMB_FUNC .thumb_func
    350 #define THUMB_CODE .force_thumb
    351 # if defined(__thumb2__)
    352 #define THUMB_SYNTAX .syntax divided
    353 # else
    354 #define THUMB_SYNTAX
    355 # endif
    356 #else
    357 #define THUMB_FUNC
    358 #define THUMB_CODE
    359 #define THUMB_SYNTAX
    360 #endif
    361 
    362 .macro FUNC_START name
    363 	.text
    364 	.globl SYM (__\name)
    365 	TYPE (__\name)
    366 	.align 0
    367 	THUMB_CODE
    368 	THUMB_FUNC
    369 	THUMB_SYNTAX
    370 SYM (__\name):
    371 .endm
    372 
    373 .macro ARM_SYM_START name
    374        TYPE (\name)
    375        .align 0
    376 SYM (\name):
    377 .endm
    378 
    379 .macro SYM_END name
    380        SIZE (\name)
    381 .endm
    382 
    383 /* Special function that will always be coded in ARM assembly, even if
    384    in Thumb-only compilation.  */
    385 
    386 #if defined(__thumb2__)
    387 
    388 /* For Thumb-2 we build everything in thumb mode.  */
    389 .macro ARM_FUNC_START name
    390        FUNC_START \name
    391        .syntax unified
    392 .endm
    393 #define EQUIV .thumb_set
    394 .macro  ARM_CALL name
    395 	bl	__\name
    396 .endm
    397 
    398 #elif defined(__INTERWORKING_STUBS__)
    399 
    400 .macro	ARM_FUNC_START name
    401 	FUNC_START \name
    402 	bx	pc
    403 	nop
    404 	.arm
    405 /* A hook to tell gdb that we've switched to ARM mode.  Also used to call
    406    directly from other local arm routines.  */
    407 _L__\name:
    408 .endm
    409 #define EQUIV .thumb_set
    410 /* Branch directly to a function declared with ARM_FUNC_START.
    411    Must be called in arm mode.  */
    412 .macro  ARM_CALL name
    413 	bl	_L__\name
    414 .endm
    415 
    416 #else /* !(__INTERWORKING_STUBS__ || __thumb2__) */
    417 
    418 #ifdef NOT_ISA_TARGET_32BIT
    419 #define EQUIV .thumb_set
    420 #else
    421 .macro	ARM_FUNC_START name
    422 	.text
    423 	.globl SYM (__\name)
    424 	TYPE (__\name)
    425 	.align 0
    426 	.arm
    427 SYM (__\name):
    428 .endm
    429 #define EQUIV .set
    430 .macro  ARM_CALL name
    431 	bl	__\name
    432 .endm
    433 #endif
    434 
    435 #endif
    436 
    437 .macro	FUNC_ALIAS new old
    438 	.globl	SYM (__\new)
    439 #if defined (__thumb__)
    440 	.thumb_set	SYM (__\new), SYM (__\old)
    441 #else
    442 	.set	SYM (__\new), SYM (__\old)
    443 #endif
    444 .endm
    445 
    446 #ifndef NOT_ISA_TARGET_32BIT
    447 .macro	ARM_FUNC_ALIAS new old
    448 	.globl	SYM (__\new)
    449 	EQUIV	SYM (__\new), SYM (__\old)
    450 #if defined(__INTERWORKING_STUBS__)
    451 	.set	SYM (_L__\new), SYM (_L__\old)
    452 #endif
    453 .endm
    454 #endif
    455 
    456 #ifdef __ARMEB__
    457 #define xxh r0
    458 #define xxl r1
    459 #define yyh r2
    460 #define yyl r3
    461 #else
    462 #define xxh r1
    463 #define xxl r0
    464 #define yyh r3
    465 #define yyl r2
    466 #endif
    467 
    468 #ifdef __ARM_EABI__
    469 .macro	WEAK name
    470 	.weak SYM (__\name)
    471 .endm
    472 #endif
    473 
    474 #ifdef __thumb__
    475 /* Register aliases.  */
    476 
    477 work		.req	r4	@ XXXX is this safe ?
    478 dividend	.req	r0
    479 divisor		.req	r1
    480 overdone	.req	r2
    481 result		.req	r2
    482 curbit		.req	r3
    483 #endif
    484 #if 0
    485 ip		.req	r12
    486 sp		.req	r13
    487 lr		.req	r14
    488 pc		.req	r15
    489 #endif
    490 
    491 /* ------------------------------------------------------------------------ */
    492 /*		Bodies of the division and modulo routines.		    */
    493 /* ------------------------------------------------------------------------ */
    494 .macro ARM_DIV_BODY dividend, divisor, result, curbit
    495 
    496 #if defined (__ARM_FEATURE_CLZ) && ! defined (__OPTIMIZE_SIZE__)
    497 
    498 #if defined (__thumb2__)
    499 	clz	\curbit, \dividend
    500 	clz	\result, \divisor
    501 	sub	\curbit, \result, \curbit
    502 	rsb	\curbit, \curbit, #31
    503 	adr	\result, 1f
    504 	add	\curbit, \result, \curbit, lsl #4
    505 	mov	\result, #0
    506 	mov	pc, \curbit
    507 .p2align 3
    508 1:
    509 	.set	shift, 32
    510 	.rept	32
    511 	.set	shift, shift - 1
    512 	cmp.w	\dividend, \divisor, lsl #shift
    513 	nop.n
    514 	adc.w	\result, \result, \result
    515 	it	cs
    516 	subcs.w	\dividend, \dividend, \divisor, lsl #shift
    517 	.endr
    518 #else
    519 	clz	\curbit, \dividend
    520 	clz	\result, \divisor
    521 	sub	\curbit, \result, \curbit
    522 	rsbs	\curbit, \curbit, #31
    523 	addne	\curbit, \curbit, \curbit, lsl #1
    524 	mov	\result, #0
    525 	addne	pc, pc, \curbit, lsl #2
    526 	nop
    527 	.set	shift, 32
    528 	.rept	32
    529 	.set	shift, shift - 1
    530 	cmp	\dividend, \divisor, lsl #shift
    531 	adc	\result, \result, \result
    532 	subcs	\dividend, \dividend, \divisor, lsl #shift
    533 	.endr
    534 #endif
    535 
    536 #else /* !defined (__ARM_FEATURE_CLZ) || defined (__OPTIMIZE_SIZE__) */
    537 #if defined (__ARM_FEATURE_CLZ)
    538 
    539 	clz	\curbit, \divisor
    540 	clz	\result, \dividend
    541 	sub	\result, \curbit, \result
    542 	mov	\curbit, #1
    543 	mov	\divisor, \divisor, lsl \result
    544 	mov	\curbit, \curbit, lsl \result
    545 	mov	\result, #0
    546 
    547 #else /* !defined (__ARM_FEATURE_CLZ) */
    548 
    549 	@ Initially shift the divisor left 3 bits if possible,
    550 	@ set curbit accordingly.  This allows for curbit to be located
    551 	@ at the left end of each 4-bit nibbles in the division loop
    552 	@ to save one loop in most cases.
    553 	tst	\divisor, #0xe0000000
    554 	moveq	\divisor, \divisor, lsl #3
    555 	moveq	\curbit, #8
    556 	movne	\curbit, #1
    557 
    558 	@ Unless the divisor is very big, shift it up in multiples of
    559 	@ four bits, since this is the amount of unwinding in the main
    560 	@ division loop.  Continue shifting until the divisor is
    561 	@ larger than the dividend.
    562 1:	cmp	\divisor, #0x10000000
    563 	cmplo	\divisor, \dividend
    564 	movlo	\divisor, \divisor, lsl #4
    565 	movlo	\curbit, \curbit, lsl #4
    566 	blo	1b
    567 
    568 	@ For very big divisors, we must shift it a bit at a time, or
    569 	@ we will be in danger of overflowing.
    570 1:	cmp	\divisor, #0x80000000
    571 	cmplo	\divisor, \dividend
    572 	movlo	\divisor, \divisor, lsl #1
    573 	movlo	\curbit, \curbit, lsl #1
    574 	blo	1b
    575 
    576 	mov	\result, #0
    577 
    578 #endif /* !defined (__ARM_FEATURE_CLZ) */
    579 
    580 	@ Division loop
    581 1:	cmp	\dividend, \divisor
    582 	do_it	hs, t
    583 	subhs	\dividend, \dividend, \divisor
    584 	orrhs	\result,   \result,   \curbit
    585 	cmp	\dividend, \divisor,  lsr #1
    586 	do_it	hs, t
    587 	subhs	\dividend, \dividend, \divisor, lsr #1
    588 	orrhs	\result,   \result,   \curbit,  lsr #1
    589 	cmp	\dividend, \divisor,  lsr #2
    590 	do_it	hs, t
    591 	subhs	\dividend, \dividend, \divisor, lsr #2
    592 	orrhs	\result,   \result,   \curbit,  lsr #2
    593 	cmp	\dividend, \divisor,  lsr #3
    594 	do_it	hs, t
    595 	subhs	\dividend, \dividend, \divisor, lsr #3
    596 	orrhs	\result,   \result,   \curbit,  lsr #3
    597 	cmp	\dividend, #0			@ Early termination?
    598 	do_it	ne, t
    599 	movnes	\curbit,   \curbit,  lsr #4	@ No, any more bits to do?
    600 	movne	\divisor,  \divisor, lsr #4
    601 	bne	1b
    602 
    603 #endif /* !defined (__ARM_FEATURE_CLZ) || defined (__OPTIMIZE_SIZE__) */
    604 
    605 .endm
    606 /* ------------------------------------------------------------------------ */
    607 .macro ARM_DIV2_ORDER divisor, order
    608 
    609 #if defined (__ARM_FEATURE_CLZ)
    610 
    611 	clz	\order, \divisor
    612 	rsb	\order, \order, #31
    613 
    614 #else
    615 
    616 	cmp	\divisor, #(1 << 16)
    617 	movhs	\divisor, \divisor, lsr #16
    618 	movhs	\order, #16
    619 	movlo	\order, #0
    620 
    621 	cmp	\divisor, #(1 << 8)
    622 	movhs	\divisor, \divisor, lsr #8
    623 	addhs	\order, \order, #8
    624 
    625 	cmp	\divisor, #(1 << 4)
    626 	movhs	\divisor, \divisor, lsr #4
    627 	addhs	\order, \order, #4
    628 
    629 	cmp	\divisor, #(1 << 2)
    630 	addhi	\order, \order, #3
    631 	addls	\order, \order, \divisor, lsr #1
    632 
    633 #endif
    634 
    635 .endm
    636 /* ------------------------------------------------------------------------ */
    637 .macro ARM_MOD_BODY dividend, divisor, order, spare
    638 
    639 #if defined(__ARM_FEATURE_CLZ) && ! defined (__OPTIMIZE_SIZE__)
    640 
    641 	clz	\order, \divisor
    642 	clz	\spare, \dividend
    643 	sub	\order, \order, \spare
    644 	rsbs	\order, \order, #31
    645 	addne	pc, pc, \order, lsl #3
    646 	nop
    647 	.set	shift, 32
    648 	.rept	32
    649 	.set	shift, shift - 1
    650 	cmp	\dividend, \divisor, lsl #shift
    651 	subcs	\dividend, \dividend, \divisor, lsl #shift
    652 	.endr
    653 
    654 #else /* !defined (__ARM_FEATURE_CLZ) || defined (__OPTIMIZE_SIZE__) */
    655 #if defined (__ARM_FEATURE_CLZ)
    656 
    657 	clz	\order, \divisor
    658 	clz	\spare, \dividend
    659 	sub	\order, \order, \spare
    660 	mov	\divisor, \divisor, lsl \order
    661 
    662 #else /* !defined (__ARM_FEATURE_CLZ) */
    663 
    664 	mov	\order, #0
    665 
    666 	@ Unless the divisor is very big, shift it up in multiples of
    667 	@ four bits, since this is the amount of unwinding in the main
    668 	@ division loop.  Continue shifting until the divisor is
    669 	@ larger than the dividend.
    670 1:	cmp	\divisor, #0x10000000
    671 	cmplo	\divisor, \dividend
    672 	movlo	\divisor, \divisor, lsl #4
    673 	addlo	\order, \order, #4
    674 	blo	1b
    675 
    676 	@ For very big divisors, we must shift it a bit at a time, or
    677 	@ we will be in danger of overflowing.
    678 1:	cmp	\divisor, #0x80000000
    679 	cmplo	\divisor, \dividend
    680 	movlo	\divisor, \divisor, lsl #1
    681 	addlo	\order, \order, #1
    682 	blo	1b
    683 
    684 #endif /* !defined (__ARM_FEATURE_CLZ) */
    685 
    686 	@ Perform all needed substractions to keep only the reminder.
    687 	@ Do comparisons in batch of 4 first.
    688 	subs	\order, \order, #3		@ yes, 3 is intended here
    689 	blt	2f
    690 
    691 1:	cmp	\dividend, \divisor
    692 	subhs	\dividend, \dividend, \divisor
    693 	cmp	\dividend, \divisor,  lsr #1
    694 	subhs	\dividend, \dividend, \divisor, lsr #1
    695 	cmp	\dividend, \divisor,  lsr #2
    696 	subhs	\dividend, \dividend, \divisor, lsr #2
    697 	cmp	\dividend, \divisor,  lsr #3
    698 	subhs	\dividend, \dividend, \divisor, lsr #3
    699 	cmp	\dividend, #1
    700 	mov	\divisor, \divisor, lsr #4
    701 	subges	\order, \order, #4
    702 	bge	1b
    703 
    704 	tst	\order, #3
    705 	teqne	\dividend, #0
    706 	beq	5f
    707 
    708 	@ Either 1, 2 or 3 comparison/substractions are left.
    709 2:	cmn	\order, #2
    710 	blt	4f
    711 	beq	3f
    712 	cmp	\dividend, \divisor
    713 	subhs	\dividend, \dividend, \divisor
    714 	mov	\divisor,  \divisor,  lsr #1
    715 3:	cmp	\dividend, \divisor
    716 	subhs	\dividend, \dividend, \divisor
    717 	mov	\divisor,  \divisor,  lsr #1
    718 4:	cmp	\dividend, \divisor
    719 	subhs	\dividend, \dividend, \divisor
    720 5:
    721 
    722 #endif /* !defined (__ARM_FEATURE_CLZ) || defined (__OPTIMIZE_SIZE__) */
    723 
    724 .endm
    725 /* ------------------------------------------------------------------------ */
    726 .macro THUMB_DIV_MOD_BODY modulo
    727 	@ Load the constant 0x10000000 into our work register.
    728 	mov	work, #1
    729 	lsl	work, #28
    730 LSYM(Loop1):
    731 	@ Unless the divisor is very big, shift it up in multiples of
    732 	@ four bits, since this is the amount of unwinding in the main
    733 	@ division loop.  Continue shifting until the divisor is
    734 	@ larger than the dividend.
    735 	cmp	divisor, work
    736 	bhs	LSYM(Lbignum)
    737 	cmp	divisor, dividend
    738 	bhs	LSYM(Lbignum)
    739 	lsl	divisor, #4
    740 	lsl	curbit,  #4
    741 	b	LSYM(Loop1)
    742 LSYM(Lbignum):
    743 	@ Set work to 0x80000000
    744 	lsl	work, #3
    745 LSYM(Loop2):
    746 	@ For very big divisors, we must shift it a bit at a time, or
    747 	@ we will be in danger of overflowing.
    748 	cmp	divisor, work
    749 	bhs	LSYM(Loop3)
    750 	cmp	divisor, dividend
    751 	bhs	LSYM(Loop3)
    752 	lsl	divisor, #1
    753 	lsl	curbit,  #1
    754 	b	LSYM(Loop2)
    755 LSYM(Loop3):
    756 	@ Test for possible subtractions ...
    757   .if \modulo
    758 	@ ... On the final pass, this may subtract too much from the dividend,
    759 	@ so keep track of which subtractions are done, we can fix them up
    760 	@ afterwards.
    761 	mov	overdone, #0
    762 	cmp	dividend, divisor
    763 	blo	LSYM(Lover1)
    764 	sub	dividend, dividend, divisor
    765 LSYM(Lover1):
    766 	lsr	work, divisor, #1
    767 	cmp	dividend, work
    768 	blo	LSYM(Lover2)
    769 	sub	dividend, dividend, work
    770 	mov	ip, curbit
    771 	mov	work, #1
    772 	ror	curbit, work
    773 	orr	overdone, curbit
    774 	mov	curbit, ip
    775 LSYM(Lover2):
    776 	lsr	work, divisor, #2
    777 	cmp	dividend, work
    778 	blo	LSYM(Lover3)
    779 	sub	dividend, dividend, work
    780 	mov	ip, curbit
    781 	mov	work, #2
    782 	ror	curbit, work
    783 	orr	overdone, curbit
    784 	mov	curbit, ip
    785 LSYM(Lover3):
    786 	lsr	work, divisor, #3
    787 	cmp	dividend, work
    788 	blo	LSYM(Lover4)
    789 	sub	dividend, dividend, work
    790 	mov	ip, curbit
    791 	mov	work, #3
    792 	ror	curbit, work
    793 	orr	overdone, curbit
    794 	mov	curbit, ip
    795 LSYM(Lover4):
    796 	mov	ip, curbit
    797   .else
    798 	@ ... and note which bits are done in the result.  On the final pass,
    799 	@ this may subtract too much from the dividend, but the result will be ok,
    800 	@ since the "bit" will have been shifted out at the bottom.
    801 	cmp	dividend, divisor
    802 	blo	LSYM(Lover1)
    803 	sub	dividend, dividend, divisor
    804 	orr	result, result, curbit
    805 LSYM(Lover1):
    806 	lsr	work, divisor, #1
    807 	cmp	dividend, work
    808 	blo	LSYM(Lover2)
    809 	sub	dividend, dividend, work
    810 	lsr	work, curbit, #1
    811 	orr	result, work
    812 LSYM(Lover2):
    813 	lsr	work, divisor, #2
    814 	cmp	dividend, work
    815 	blo	LSYM(Lover3)
    816 	sub	dividend, dividend, work
    817 	lsr	work, curbit, #2
    818 	orr	result, work
    819 LSYM(Lover3):
    820 	lsr	work, divisor, #3
    821 	cmp	dividend, work
    822 	blo	LSYM(Lover4)
    823 	sub	dividend, dividend, work
    824 	lsr	work, curbit, #3
    825 	orr	result, work
    826 LSYM(Lover4):
    827   .endif
    828 
    829 	cmp	dividend, #0			@ Early termination?
    830 	beq	LSYM(Lover5)
    831 	lsr	curbit,  #4			@ No, any more bits to do?
    832 	beq	LSYM(Lover5)
    833 	lsr	divisor, #4
    834 	b	LSYM(Loop3)
    835 LSYM(Lover5):
    836   .if \modulo
    837 	@ Any subtractions that we should not have done will be recorded in
    838 	@ the top three bits of "overdone".  Exactly which were not needed
    839 	@ are governed by the position of the bit, stored in ip.
    840 	mov	work, #0xe
    841 	lsl	work, #28
    842 	and	overdone, work
    843 	beq	LSYM(Lgot_result)
    844 
    845 	@ If we terminated early, because dividend became zero, then the
    846 	@ bit in ip will not be in the bottom nibble, and we should not
    847 	@ perform the additions below.  We must test for this though
    848 	@ (rather relying upon the TSTs to prevent the additions) since
    849 	@ the bit in ip could be in the top two bits which might then match
    850 	@ with one of the smaller RORs.
    851 	mov	curbit, ip
    852 	mov	work, #0x7
    853 	tst	curbit, work
    854 	beq	LSYM(Lgot_result)
    855 
    856 	mov	curbit, ip
    857 	mov	work, #3
    858 	ror	curbit, work
    859 	tst	overdone, curbit
    860 	beq	LSYM(Lover6)
    861 	lsr	work, divisor, #3
    862 	add	dividend, work
    863 LSYM(Lover6):
    864 	mov	curbit, ip
    865 	mov	work, #2
    866 	ror	curbit, work
    867 	tst	overdone, curbit
    868 	beq	LSYM(Lover7)
    869 	lsr	work, divisor, #2
    870 	add	dividend, work
    871 LSYM(Lover7):
    872 	mov	curbit, ip
    873 	mov	work, #1
    874 	ror	curbit, work
    875 	tst	overdone, curbit
    876 	beq	LSYM(Lgot_result)
    877 	lsr	work, divisor, #1
    878 	add	dividend, work
    879   .endif
    880 LSYM(Lgot_result):
    881 .endm
    882 
    883 /* If performance is preferred, the following functions are provided.  */
    884 #if defined(__prefer_thumb__) && !defined(__OPTIMIZE_SIZE__)
    885 
    886 /* Branch to div(n), and jump to label if curbit is lo than divisior.  */
    887 .macro BranchToDiv n, label
    888 	lsr	curbit, dividend, \n
    889 	cmp	curbit, divisor
    890 	blo	\label
    891 .endm
    892 
    893 /* Body of div(n).  Shift the divisor in n bits and compare the divisor
    894    and dividend.  Update the dividend as the substruction result.  */
    895 .macro DoDiv n
    896 	lsr	curbit, dividend, \n
    897 	cmp	curbit, divisor
    898 	bcc	1f
    899 	lsl	curbit, divisor, \n
    900 	sub	dividend, dividend, curbit
    901 
    902 1:	adc	result, result
    903 .endm
    904 
    905 /* The body of division with positive divisor.  Unless the divisor is very
    906    big, shift it up in multiples of four bits, since this is the amount of
    907    unwinding in the main division loop.  Continue shifting until the divisor
    908    is larger than the dividend.  */
    909 .macro THUMB1_Div_Positive
    910 	mov	result, #0
    911 	BranchToDiv #1, LSYM(Lthumb1_div1)
    912 	BranchToDiv #4, LSYM(Lthumb1_div4)
    913 	BranchToDiv #8, LSYM(Lthumb1_div8)
    914 	BranchToDiv #12, LSYM(Lthumb1_div12)
    915 	BranchToDiv #16, LSYM(Lthumb1_div16)
    916 LSYM(Lthumb1_div_large_positive):
    917 	mov	result, #0xff
    918 	lsl	divisor, divisor, #8
    919 	rev	result, result
    920 	lsr	curbit, dividend, #16
    921 	cmp	curbit, divisor
    922 	blo	1f
    923 	asr	result, #8
    924 	lsl	divisor, divisor, #8
    925 	beq	LSYM(Ldivbyzero_waypoint)
    926 
    927 1:	lsr	curbit, dividend, #12
    928 	cmp	curbit, divisor
    929 	blo	LSYM(Lthumb1_div12)
    930 	b	LSYM(Lthumb1_div16)
    931 LSYM(Lthumb1_div_loop):
    932 	lsr	divisor, divisor, #8
    933 LSYM(Lthumb1_div16):
    934 	Dodiv	#15
    935 	Dodiv	#14
    936 	Dodiv	#13
    937 	Dodiv	#12
    938 LSYM(Lthumb1_div12):
    939 	Dodiv	#11
    940 	Dodiv	#10
    941 	Dodiv	#9
    942 	Dodiv	#8
    943 	bcs	LSYM(Lthumb1_div_loop)
    944 LSYM(Lthumb1_div8):
    945 	Dodiv	#7
    946 	Dodiv	#6
    947 	Dodiv	#5
    948 LSYM(Lthumb1_div5):
    949 	Dodiv	#4
    950 LSYM(Lthumb1_div4):
    951 	Dodiv	#3
    952 LSYM(Lthumb1_div3):
    953 	Dodiv	#2
    954 LSYM(Lthumb1_div2):
    955 	Dodiv	#1
    956 LSYM(Lthumb1_div1):
    957 	sub	divisor, dividend, divisor
    958 	bcs	1f
    959 	cpy	divisor, dividend
    960 
    961 1:	adc	result, result
    962 	cpy	dividend, result
    963 	RET
    964 
    965 LSYM(Ldivbyzero_waypoint):
    966 	b	LSYM(Ldiv0)
    967 .endm
    968 
    969 /* The body of division with negative divisor.  Similar with
    970    THUMB1_Div_Positive except that the shift steps are in multiples
    971    of six bits.  */
    972 .macro THUMB1_Div_Negative
    973 	lsr	result, divisor, #31
    974 	beq	1f
    975 	neg	divisor, divisor
    976 
    977 1:	asr	curbit, dividend, #32
    978 	bcc	2f
    979 	neg	dividend, dividend
    980 
    981 2:	eor	curbit, result
    982 	mov	result, #0
    983 	cpy	ip, curbit
    984 	BranchToDiv #4, LSYM(Lthumb1_div_negative4)
    985 	BranchToDiv #8, LSYM(Lthumb1_div_negative8)
    986 LSYM(Lthumb1_div_large):
    987 	mov	result, #0xfc
    988 	lsl	divisor, divisor, #6
    989 	rev	result, result
    990 	lsr	curbit, dividend, #8
    991 	cmp	curbit, divisor
    992 	blo	LSYM(Lthumb1_div_negative8)
    993 
    994 	lsl	divisor, divisor, #6
    995 	asr	result, result, #6
    996 	cmp	curbit, divisor
    997 	blo	LSYM(Lthumb1_div_negative8)
    998 
    999 	lsl	divisor, divisor, #6
   1000 	asr	result, result, #6
   1001 	cmp	curbit, divisor
   1002 	blo	LSYM(Lthumb1_div_negative8)
   1003 
   1004 	lsl	divisor, divisor, #6
   1005 	beq	LSYM(Ldivbyzero_negative)
   1006 	asr	result, result, #6
   1007 	b	LSYM(Lthumb1_div_negative8)
   1008 LSYM(Lthumb1_div_negative_loop):
   1009 	lsr	divisor, divisor, #6
   1010 LSYM(Lthumb1_div_negative8):
   1011 	DoDiv	#7
   1012 	DoDiv	#6
   1013 	DoDiv	#5
   1014 	DoDiv	#4
   1015 LSYM(Lthumb1_div_negative4):
   1016 	DoDiv	#3
   1017 	DoDiv	#2
   1018 	bcs	LSYM(Lthumb1_div_negative_loop)
   1019 	DoDiv	#1
   1020 	sub	divisor, dividend, divisor
   1021 	bcs	1f
   1022 	cpy	divisor, dividend
   1023 
   1024 1:	cpy	curbit, ip
   1025 	adc	result, result
   1026 	asr	curbit, curbit, #1
   1027 	cpy	dividend, result
   1028 	bcc	2f
   1029 	neg	dividend, dividend
   1030 	cmp	curbit, #0
   1031 
   1032 2:	bpl	3f
   1033 	neg	divisor, divisor
   1034 
   1035 3:	RET
   1036 
   1037 LSYM(Ldivbyzero_negative):
   1038 	cpy	curbit, ip
   1039 	asr	curbit, curbit, #1
   1040 	bcc	LSYM(Ldiv0)
   1041 	neg	dividend, dividend
   1042 .endm
   1043 #endif /* ARM Thumb version.  */
   1044 
   1045 /* ------------------------------------------------------------------------ */
   1046 /*		Start of the Real Functions				    */
   1047 /* ------------------------------------------------------------------------ */
   1048 #ifdef L_udivsi3
   1049 
   1050 #if defined(__prefer_thumb__)
   1051 
   1052 	FUNC_START udivsi3
   1053 	FUNC_ALIAS aeabi_uidiv udivsi3
   1054 #if defined(__OPTIMIZE_SIZE__)
   1055 
   1056 	cmp	divisor, #0
   1057 	beq	LSYM(Ldiv0)
   1058 LSYM(udivsi3_skip_div0_test):
   1059 	mov	curbit, #1
   1060 	mov	result, #0
   1061 
   1062 	push	{ work }
   1063 	cmp	dividend, divisor
   1064 	blo	LSYM(Lgot_result)
   1065 
   1066 	THUMB_DIV_MOD_BODY 0
   1067 
   1068 	mov	r0, result
   1069 	pop	{ work }
   1070 	RET
   1071 
   1072 /* Implementation of aeabi_uidiv for ARMv6m.  This version is only
   1073    used in ARMv6-M when we need an efficient implementation.  */
   1074 #else
   1075 LSYM(udivsi3_skip_div0_test):
   1076 	THUMB1_Div_Positive
   1077 
   1078 #endif /* __OPTIMIZE_SIZE__ */
   1079 
   1080 #elif defined(__ARM_ARCH_EXT_IDIV__)
   1081 
   1082 	ARM_FUNC_START udivsi3
   1083 	ARM_FUNC_ALIAS aeabi_uidiv udivsi3
   1084 
   1085 	cmp	r1, #0
   1086 	beq	LSYM(Ldiv0)
   1087 
   1088 	udiv	r0, r0, r1
   1089 	RET
   1090 
   1091 #else /* ARM version/Thumb-2.  */
   1092 
   1093 	ARM_FUNC_START udivsi3
   1094 	ARM_FUNC_ALIAS aeabi_uidiv udivsi3
   1095 
   1096 	/* Note: if called via udivsi3_skip_div0_test, this will unnecessarily
   1097 	   check for division-by-zero a second time.  */
   1098 LSYM(udivsi3_skip_div0_test):
   1099 	subs	r2, r1, #1
   1100 	do_it	eq
   1101 	RETc(eq)
   1102 	bcc	LSYM(Ldiv0)
   1103 	cmp	r0, r1
   1104 	bls	11f
   1105 	tst	r1, r2
   1106 	beq	12f
   1107 
   1108 	ARM_DIV_BODY r0, r1, r2, r3
   1109 
   1110 	mov	r0, r2
   1111 	RET
   1112 
   1113 11:	do_it	eq, e
   1114 	moveq	r0, #1
   1115 	movne	r0, #0
   1116 	RET
   1117 
   1118 12:	ARM_DIV2_ORDER r1, r2
   1119 
   1120 	mov	r0, r0, lsr r2
   1121 	RET
   1122 
   1123 #endif /* ARM version */
   1124 
   1125 	DIV_FUNC_END udivsi3 unsigned
   1126 
   1127 #if defined(__prefer_thumb__)
   1128 FUNC_START aeabi_uidivmod
   1129 	cmp	r1, #0
   1130 	beq	LSYM(Ldiv0)
   1131 # if defined(__OPTIMIZE_SIZE__)
   1132 	push	{r0, r1, lr}
   1133 	bl	LSYM(udivsi3_skip_div0_test)
   1134 	POP	{r1, r2, r3}
   1135 	mul	r2, r0
   1136 	sub	r1, r1, r2
   1137 	bx	r3
   1138 # else
   1139 	/* Both the quotient and remainder are calculated simultaneously
   1140 	   in THUMB1_Div_Positive.  There is no need to calculate the
   1141 	   remainder again here.  */
   1142 	b	LSYM(udivsi3_skip_div0_test)
   1143 	RET
   1144 # endif /* __OPTIMIZE_SIZE__ */
   1145 
   1146 #elif defined(__ARM_ARCH_EXT_IDIV__)
   1147 ARM_FUNC_START aeabi_uidivmod
   1148 	cmp	r1, #0
   1149 	beq	LSYM(Ldiv0)
   1150 	mov     r2, r0
   1151 	udiv	r0, r0, r1
   1152 	mls     r1, r0, r1, r2
   1153 	RET
   1154 #else
   1155 ARM_FUNC_START aeabi_uidivmod
   1156 	cmp	r1, #0
   1157 	beq	LSYM(Ldiv0)
   1158 	stmfd	sp!, { r0, r1, lr }
   1159 	bl	LSYM(udivsi3_skip_div0_test)
   1160 	ldmfd	sp!, { r1, r2, lr }
   1161 	mul	r3, r2, r0
   1162 	sub	r1, r1, r3
   1163 	RET
   1164 #endif
   1165 	FUNC_END aeabi_uidivmod
   1166 
   1167 #endif /* L_udivsi3 */
   1168 /* ------------------------------------------------------------------------ */
   1169 #ifdef L_umodsi3
   1170 
   1171 #if defined(__ARM_ARCH_EXT_IDIV__) && __ARM_ARCH_ISA_THUMB != 1
   1172 
   1173 	ARM_FUNC_START umodsi3
   1174 
   1175 	cmp	r1, #0
   1176 	beq	LSYM(Ldiv0)
   1177 	udiv	r2, r0, r1
   1178 	mls     r0, r1, r2, r0
   1179 	RET
   1180 
   1181 #elif defined(__thumb__)
   1182 
   1183 	FUNC_START umodsi3
   1184 
   1185 	cmp	divisor, #0
   1186 	beq	LSYM(Ldiv0)
   1187 	mov	curbit, #1
   1188 	cmp	dividend, divisor
   1189 	bhs	LSYM(Lover10)
   1190 	RET
   1191 
   1192 LSYM(Lover10):
   1193 	push	{ work }
   1194 
   1195 	THUMB_DIV_MOD_BODY 1
   1196 
   1197 	pop	{ work }
   1198 	RET
   1199 
   1200 #else  /* ARM version.  */
   1201 
   1202 	FUNC_START umodsi3
   1203 
   1204 	subs	r2, r1, #1			@ compare divisor with 1
   1205 	bcc	LSYM(Ldiv0)
   1206 	cmpne	r0, r1				@ compare dividend with divisor
   1207 	moveq   r0, #0
   1208 	tsthi	r1, r2				@ see if divisor is power of 2
   1209 	andeq	r0, r0, r2
   1210 	RETc(ls)
   1211 
   1212 	ARM_MOD_BODY r0, r1, r2, r3
   1213 
   1214 	RET
   1215 
   1216 #endif /* ARM version.  */
   1217 
   1218 	DIV_FUNC_END umodsi3 unsigned
   1219 
   1220 #endif /* L_umodsi3 */
   1221 /* ------------------------------------------------------------------------ */
   1222 #ifdef L_divsi3
   1223 
   1224 #if defined(__prefer_thumb__)
   1225 
   1226 	FUNC_START divsi3
   1227 	FUNC_ALIAS aeabi_idiv divsi3
   1228 #if defined(__OPTIMIZE_SIZE__)
   1229 
   1230 	cmp	divisor, #0
   1231 	beq	LSYM(Ldiv0)
   1232 LSYM(divsi3_skip_div0_test):
   1233 	push	{ work }
   1234 	mov	work, dividend
   1235 	eor	work, divisor		@ Save the sign of the result.
   1236 	mov	ip, work
   1237 	mov	curbit, #1
   1238 	mov	result, #0
   1239 	cmp	divisor, #0
   1240 	bpl	LSYM(Lover10)
   1241 	neg	divisor, divisor	@ Loops below use unsigned.
   1242 LSYM(Lover10):
   1243 	cmp	dividend, #0
   1244 	bpl	LSYM(Lover11)
   1245 	neg	dividend, dividend
   1246 LSYM(Lover11):
   1247 	cmp	dividend, divisor
   1248 	blo	LSYM(Lgot_result)
   1249 
   1250 	THUMB_DIV_MOD_BODY 0
   1251 
   1252 	mov	r0, result
   1253 	mov	work, ip
   1254 	cmp	work, #0
   1255 	bpl	LSYM(Lover12)
   1256 	neg	r0, r0
   1257 LSYM(Lover12):
   1258 	pop	{ work }
   1259 	RET
   1260 
   1261 /* Implementation of aeabi_idiv for ARMv6m.  This version is only
   1262    used in ARMv6-M when we need an efficient implementation.  */
   1263 #else
   1264 LSYM(divsi3_skip_div0_test):
   1265 	cpy	curbit, dividend
   1266 	orr	curbit, divisor
   1267 	bmi	LSYM(Lthumb1_div_negative)
   1268 
   1269 LSYM(Lthumb1_div_positive):
   1270 	THUMB1_Div_Positive
   1271 
   1272 LSYM(Lthumb1_div_negative):
   1273 	THUMB1_Div_Negative
   1274 
   1275 #endif /* __OPTIMIZE_SIZE__ */
   1276 
   1277 #elif defined(__ARM_ARCH_EXT_IDIV__)
   1278 
   1279 	ARM_FUNC_START divsi3
   1280 	ARM_FUNC_ALIAS aeabi_idiv divsi3
   1281 
   1282 	cmp 	r1, #0
   1283 	beq	LSYM(Ldiv0)
   1284 	sdiv	r0, r0, r1
   1285 	RET
   1286 
   1287 #else /* ARM/Thumb-2 version.  */
   1288 
   1289 	ARM_FUNC_START divsi3
   1290 	ARM_FUNC_ALIAS aeabi_idiv divsi3
   1291 
   1292 	cmp	r1, #0
   1293 	beq	LSYM(Ldiv0)
   1294 LSYM(divsi3_skip_div0_test):
   1295 	eor	ip, r0, r1			@ save the sign of the result.
   1296 	do_it	mi
   1297 	rsbmi	r1, r1, #0			@ loops below use unsigned.
   1298 	subs	r2, r1, #1			@ division by 1 or -1 ?
   1299 	beq	10f
   1300 	movs	r3, r0
   1301 	do_it	mi
   1302 	rsbmi	r3, r0, #0			@ positive dividend value
   1303 	cmp	r3, r1
   1304 	bls	11f
   1305 	tst	r1, r2				@ divisor is power of 2 ?
   1306 	beq	12f
   1307 
   1308 	ARM_DIV_BODY r3, r1, r0, r2
   1309 
   1310 	cmp	ip, #0
   1311 	do_it	mi
   1312 	rsbmi	r0, r0, #0
   1313 	RET
   1314 
   1315 10:	teq	ip, r0				@ same sign ?
   1316 	do_it	mi
   1317 	rsbmi	r0, r0, #0
   1318 	RET
   1319 
   1320 11:	do_it	lo
   1321 	movlo	r0, #0
   1322 	do_it	eq,t
   1323 	moveq	r0, ip, asr #31
   1324 	orreq	r0, r0, #1
   1325 	RET
   1326 
   1327 12:	ARM_DIV2_ORDER r1, r2
   1328 
   1329 	cmp	ip, #0
   1330 	mov	r0, r3, lsr r2
   1331 	do_it	mi
   1332 	rsbmi	r0, r0, #0
   1333 	RET
   1334 
   1335 #endif /* ARM version */
   1336 
   1337 	DIV_FUNC_END divsi3 signed
   1338 
   1339 #if defined(__prefer_thumb__)
   1340 FUNC_START aeabi_idivmod
   1341 	cmp	r1, #0
   1342 	beq	LSYM(Ldiv0)
   1343 # if defined(__OPTIMIZE_SIZE__)
   1344 	push	{r0, r1, lr}
   1345 	bl	LSYM(divsi3_skip_div0_test)
   1346 	POP	{r1, r2, r3}
   1347 	mul	r2, r0
   1348 	sub	r1, r1, r2
   1349 	bx	r3
   1350 # else
   1351 	/* Both the quotient and remainder are calculated simultaneously
   1352 	   in THUMB1_Div_Positive and THUMB1_Div_Negative.  There is no
   1353 	   need to calculate the remainder again here.  */
   1354 	b	LSYM(divsi3_skip_div0_test)
   1355 	RET
   1356 # endif /* __OPTIMIZE_SIZE__ */
   1357 
   1358 #elif defined(__ARM_ARCH_EXT_IDIV__)
   1359 ARM_FUNC_START aeabi_idivmod
   1360 	cmp 	r1, #0
   1361 	beq	LSYM(Ldiv0)
   1362 	mov     r2, r0
   1363 	sdiv	r0, r0, r1
   1364 	mls     r1, r0, r1, r2
   1365 	RET
   1366 #else
   1367 ARM_FUNC_START aeabi_idivmod
   1368 	cmp	r1, #0
   1369 	beq	LSYM(Ldiv0)
   1370 	stmfd	sp!, { r0, r1, lr }
   1371 	bl	LSYM(divsi3_skip_div0_test)
   1372 	ldmfd	sp!, { r1, r2, lr }
   1373 	mul	r3, r2, r0
   1374 	sub	r1, r1, r3
   1375 	RET
   1376 #endif
   1377 	FUNC_END aeabi_idivmod
   1378 
   1379 #endif /* L_divsi3 */
   1380 /* ------------------------------------------------------------------------ */
   1381 #ifdef L_modsi3
   1382 
   1383 #if defined(__ARM_ARCH_EXT_IDIV__) && __ARM_ARCH_ISA_THUMB != 1
   1384 
   1385 	ARM_FUNC_START modsi3
   1386 
   1387 	cmp	r1, #0
   1388 	beq	LSYM(Ldiv0)
   1389 
   1390 	sdiv	r2, r0, r1
   1391 	mls     r0, r1, r2, r0
   1392 	RET
   1393 
   1394 #elif defined(__thumb__)
   1395 
   1396 	FUNC_START modsi3
   1397 
   1398 	mov	curbit, #1
   1399 	cmp	divisor, #0
   1400 	beq	LSYM(Ldiv0)
   1401 	bpl	LSYM(Lover10)
   1402 	neg	divisor, divisor		@ Loops below use unsigned.
   1403 LSYM(Lover10):
   1404 	push	{ work }
   1405 	@ Need to save the sign of the dividend, unfortunately, we need
   1406 	@ work later on.  Must do this after saving the original value of
   1407 	@ the work register, because we will pop this value off first.
   1408 	push	{ dividend }
   1409 	cmp	dividend, #0
   1410 	bpl	LSYM(Lover11)
   1411 	neg	dividend, dividend
   1412 LSYM(Lover11):
   1413 	cmp	dividend, divisor
   1414 	blo	LSYM(Lgot_result)
   1415 
   1416 	THUMB_DIV_MOD_BODY 1
   1417 
   1418 	pop	{ work }
   1419 	cmp	work, #0
   1420 	bpl	LSYM(Lover12)
   1421 	neg	dividend, dividend
   1422 LSYM(Lover12):
   1423 	pop	{ work }
   1424 	RET
   1425 
   1426 #else /* ARM version.  */
   1427 
   1428 	FUNC_START modsi3
   1429 
   1430 	cmp	r1, #0
   1431 	beq	LSYM(Ldiv0)
   1432 	rsbmi	r1, r1, #0			@ loops below use unsigned.
   1433 	movs	ip, r0				@ preserve sign of dividend
   1434 	rsbmi	r0, r0, #0			@ if negative make positive
   1435 	subs	r2, r1, #1			@ compare divisor with 1
   1436 	cmpne	r0, r1				@ compare dividend with divisor
   1437 	moveq	r0, #0
   1438 	tsthi	r1, r2				@ see if divisor is power of 2
   1439 	andeq	r0, r0, r2
   1440 	bls	10f
   1441 
   1442 	ARM_MOD_BODY r0, r1, r2, r3
   1443 
   1444 10:	cmp	ip, #0
   1445 	rsbmi	r0, r0, #0
   1446 	RET
   1447 
   1448 #endif /* ARM version */
   1449 
   1450 	DIV_FUNC_END modsi3 signed
   1451 
   1452 #endif /* L_modsi3 */
   1453 /* ------------------------------------------------------------------------ */
   1454 #ifdef L_dvmd_tls
   1455 
   1456 #ifdef __ARM_EABI__
   1457 	WEAK aeabi_idiv0
   1458 	WEAK aeabi_ldiv0
   1459 	FUNC_START aeabi_idiv0
   1460 	FUNC_START aeabi_ldiv0
   1461 	RET
   1462 	FUNC_END aeabi_ldiv0
   1463 	FUNC_END aeabi_idiv0
   1464 #else
   1465 	FUNC_START div0
   1466 	RET
   1467 	FUNC_END div0
   1468 #endif
   1469 
   1470 #endif /* L_divmodsi_tools */
   1471 /* ------------------------------------------------------------------------ */
   1472 #ifdef L_dvmd_lnx
   1473 @ GNU/Linux division-by zero handler.  Used in place of L_dvmd_tls
   1474 
   1475 /* Constant taken from <asm/signal.h>.  */
   1476 #define SIGFPE	8
   1477 
   1478 #ifdef __ARM_EABI__
   1479 	cfi_start	__aeabi_ldiv0, LSYM(Lend_aeabi_ldiv0)
   1480 	WEAK aeabi_idiv0
   1481 	WEAK aeabi_ldiv0
   1482 	ARM_FUNC_START aeabi_idiv0
   1483 	ARM_FUNC_START aeabi_ldiv0
   1484 	do_push	{r1, lr}
   1485 98:	cfi_push 98b - __aeabi_ldiv0, 0xe, -0x4, 0x8
   1486 #else
   1487 	cfi_start	__div0, LSYM(Lend_div0)
   1488 	ARM_FUNC_START div0
   1489 	do_push	{r1, lr}
   1490 98:	cfi_push 98b - __div0, 0xe, -0x4, 0x8
   1491 #endif
   1492 
   1493 	mov	r0, #SIGFPE
   1494 	bl	SYM(raise) __PLT__
   1495 	RETLDM	r1 unwind=98b
   1496 
   1497 #ifdef __ARM_EABI__
   1498 	cfi_end	LSYM(Lend_aeabi_ldiv0)
   1499 	FUNC_END aeabi_ldiv0
   1500 	FUNC_END aeabi_idiv0
   1501 #else
   1502 	cfi_end	LSYM(Lend_div0)
   1503 	FUNC_END div0
   1504 #endif
   1505 
   1506 #endif /* L_dvmd_lnx */
   1507 #ifdef L_clear_cache
   1508 #if defined __ARM_EABI__ && defined __linux__
   1509 @ EABI GNU/Linux call to cacheflush syscall.
   1510 	ARM_FUNC_START clear_cache
   1511 	do_push	{r7}
   1512 #if __ARM_ARCH >= 7 || defined(__ARM_ARCH_6T2__)
   1513 	movw	r7, #2
   1514 	movt	r7, #0xf
   1515 #else
   1516 	mov	r7, #0xf0000
   1517 	add	r7, r7, #2
   1518 #endif
   1519 	mov	r2, #0
   1520 	swi	0
   1521 	do_pop	{r7}
   1522 	RET
   1523 	FUNC_END clear_cache
   1524 #else
   1525 #error "This is only for ARM EABI GNU/Linux"
   1526 #endif
   1527 #endif /* L_clear_cache */
   1528 
   1529 #ifdef L_speculation_barrier
   1530 	FUNC_START speculation_barrier
   1531 #if __ARM_ARCH >= 7
   1532 	isb
   1533 	dsb sy
   1534 #elif defined __ARM_EABI__ && defined __linux__
   1535 	/* We don't have a speculation barrier directly for this
   1536 	   platform/architecture variant.  But we can use a kernel
   1537 	   clear_cache service routine which will emit such instructions
   1538 	   if run on a later version of the architecture.  We don't
   1539 	   really want to flush the cache, but we must give it a valid
   1540 	   address, so just clear pc..pc+1.  */
   1541 #if defined __thumb__ && !defined __thumb2__
   1542 	push	{r7}
   1543 	mov	r7, #0xf
   1544 	lsl	r7, #16
   1545 	add	r7, #2
   1546 	adr	r0, . + 4
   1547 	add	r1, r0, #1
   1548 	mov	r2, #0
   1549 	svc	0
   1550 	pop	{r7}
   1551 #else
   1552 	do_push	{r7}
   1553 #ifdef __ARM_ARCH_6T2__
   1554 	movw	r7, #2
   1555 	movt	r7, #0xf
   1556 #else
   1557 	mov	r7, #0xf0000
   1558 	add	r7, r7, #2
   1559 #endif
   1560 	add	r0, pc, #0	/* ADR.  */
   1561 	add	r1, r0, #1
   1562 	mov	r2, #0
   1563 	svc	0
   1564 	do_pop	{r7}
   1565 #endif /* Thumb1 only */
   1566 #else
   1567 #warning "No speculation barrier defined for this platform"
   1568 #endif
   1569 	RET
   1570 	FUNC_END speculation_barrier
   1571 #endif
   1572 /* ------------------------------------------------------------------------ */
   1573 /* Dword shift operations.  */
   1574 /* All the following Dword shift variants rely on the fact that
   1575 	shft xxx, Reg
   1576    is in fact done as
   1577 	shft xxx, (Reg & 255)
   1578    so for Reg value in (32...63) and (-1...-31) we will get zero (in the
   1579    case of logical shifts) or the sign (for asr).  */
   1580 
   1581 #ifdef __ARMEB__
   1582 #define al	r1
   1583 #define ah	r0
   1584 #else
   1585 #define al	r0
   1586 #define ah	r1
   1587 #endif
   1588 
   1589 /* Prevent __aeabi double-word shifts from being produced on SymbianOS.  */
   1590 #ifndef __symbian__
   1591 
   1592 #ifdef L_lshrdi3
   1593 
   1594 	FUNC_START lshrdi3
   1595 	FUNC_ALIAS aeabi_llsr lshrdi3
   1596 
   1597 #ifdef __thumb__
   1598 	lsr	al, r2
   1599 	mov	r3, ah
   1600 	lsr	ah, r2
   1601 	mov	ip, r3
   1602 	sub	r2, #32
   1603 	lsr	r3, r2
   1604 	orr	al, r3
   1605 	neg	r2, r2
   1606 	mov	r3, ip
   1607 	lsl	r3, r2
   1608 	orr	al, r3
   1609 	RET
   1610 #else
   1611 	subs	r3, r2, #32
   1612 	rsb	ip, r2, #32
   1613 	movmi	al, al, lsr r2
   1614 	movpl	al, ah, lsr r3
   1615 	orrmi	al, al, ah, lsl ip
   1616 	mov	ah, ah, lsr r2
   1617 	RET
   1618 #endif
   1619 	FUNC_END aeabi_llsr
   1620 	FUNC_END lshrdi3
   1621 
   1622 #endif
   1623 
   1624 #ifdef L_ashrdi3
   1625 
   1626 	FUNC_START ashrdi3
   1627 	FUNC_ALIAS aeabi_lasr ashrdi3
   1628 
   1629 #ifdef __thumb__
   1630 	lsr	al, r2
   1631 	mov	r3, ah
   1632 	asr	ah, r2
   1633 	sub	r2, #32
   1634 	@ If r2 is negative at this point the following step would OR
   1635 	@ the sign bit into all of AL.  That's not what we want...
   1636 	bmi	1f
   1637 	mov	ip, r3
   1638 	asr	r3, r2
   1639 	orr	al, r3
   1640 	mov	r3, ip
   1641 1:
   1642 	neg	r2, r2
   1643 	lsl	r3, r2
   1644 	orr	al, r3
   1645 	RET
   1646 #else
   1647 	subs	r3, r2, #32
   1648 	rsb	ip, r2, #32
   1649 	movmi	al, al, lsr r2
   1650 	movpl	al, ah, asr r3
   1651 	orrmi	al, al, ah, lsl ip
   1652 	mov	ah, ah, asr r2
   1653 	RET
   1654 #endif
   1655 
   1656 	FUNC_END aeabi_lasr
   1657 	FUNC_END ashrdi3
   1658 
   1659 #endif
   1660 
   1661 #ifdef L_ashldi3
   1662 
   1663 	FUNC_START ashldi3
   1664 	FUNC_ALIAS aeabi_llsl ashldi3
   1665 
   1666 #ifdef __thumb__
   1667 	lsl	ah, r2
   1668 	mov	r3, al
   1669 	lsl	al, r2
   1670 	mov	ip, r3
   1671 	sub	r2, #32
   1672 	lsl	r3, r2
   1673 	orr	ah, r3
   1674 	neg	r2, r2
   1675 	mov	r3, ip
   1676 	lsr	r3, r2
   1677 	orr	ah, r3
   1678 	RET
   1679 #else
   1680 	subs	r3, r2, #32
   1681 	rsb	ip, r2, #32
   1682 	movmi	ah, ah, lsl r2
   1683 	movpl	ah, al, lsl r3
   1684 	orrmi	ah, ah, al, lsr ip
   1685 	mov	al, al, lsl r2
   1686 	RET
   1687 #endif
   1688 	FUNC_END aeabi_llsl
   1689 	FUNC_END ashldi3
   1690 
   1691 #endif
   1692 
   1693 #endif /* __symbian__ */
   1694 
   1695 #ifdef L_clzsi2
   1696 #ifdef NOT_ISA_TARGET_32BIT
   1697 FUNC_START clzsi2
   1698 	mov	r1, #28
   1699 	mov	r3, #1
   1700 	lsl	r3, r3, #16
   1701 	cmp	r0, r3 /* 0x10000 */
   1702 	bcc	2f
   1703 	lsr	r0, r0, #16
   1704 	sub	r1, r1, #16
   1705 2:	lsr	r3, r3, #8
   1706 	cmp	r0, r3 /* #0x100 */
   1707 	bcc	2f
   1708 	lsr	r0, r0, #8
   1709 	sub	r1, r1, #8
   1710 2:	lsr	r3, r3, #4
   1711 	cmp	r0, r3 /* #0x10 */
   1712 	bcc	2f
   1713 	lsr	r0, r0, #4
   1714 	sub	r1, r1, #4
   1715 2:	adr	r2, 1f
   1716 	ldrb	r0, [r2, r0]
   1717 	add	r0, r0, r1
   1718 	bx lr
   1719 .align 2
   1720 1:
   1721 .byte 4, 3, 2, 2, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0
   1722 	FUNC_END clzsi2
   1723 #else
   1724 ARM_FUNC_START clzsi2
   1725 # if defined (__ARM_FEATURE_CLZ)
   1726 	clz	r0, r0
   1727 	RET
   1728 # else
   1729 	mov	r1, #28
   1730 	cmp	r0, #0x10000
   1731 	do_it	cs, t
   1732 	movcs	r0, r0, lsr #16
   1733 	subcs	r1, r1, #16
   1734 	cmp	r0, #0x100
   1735 	do_it	cs, t
   1736 	movcs	r0, r0, lsr #8
   1737 	subcs	r1, r1, #8
   1738 	cmp	r0, #0x10
   1739 	do_it	cs, t
   1740 	movcs	r0, r0, lsr #4
   1741 	subcs	r1, r1, #4
   1742 	adr	r2, 1f
   1743 	ldrb	r0, [r2, r0]
   1744 	add	r0, r0, r1
   1745 	RET
   1746 .align 2
   1747 1:
   1748 .byte 4, 3, 2, 2, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0
   1749 # endif /* !defined (__ARM_FEATURE_CLZ) */
   1750 	FUNC_END clzsi2
   1751 #endif
   1752 #endif /* L_clzsi2 */
   1753 
   1754 #ifdef L_clzdi2
   1755 #if !defined (__ARM_FEATURE_CLZ)
   1756 
   1757 # ifdef NOT_ISA_TARGET_32BIT
   1758 FUNC_START clzdi2
   1759 	push	{r4, lr}
   1760 # else
   1761 ARM_FUNC_START clzdi2
   1762 	do_push	{r4, lr}
   1763 # endif
   1764 	cmp	xxh, #0
   1765 	bne	1f
   1766 # ifdef __ARMEB__
   1767 	mov	r0, xxl
   1768 	bl	__clzsi2
   1769 	add	r0, r0, #32
   1770 	b 2f
   1771 1:
   1772 	bl	__clzsi2
   1773 # else
   1774 	bl	__clzsi2
   1775 	add	r0, r0, #32
   1776 	b 2f
   1777 1:
   1778 	mov	r0, xxh
   1779 	bl	__clzsi2
   1780 # endif
   1781 2:
   1782 # ifdef NOT_ISA_TARGET_32BIT
   1783 	pop	{r4, pc}
   1784 # else
   1785 	RETLDM	r4
   1786 # endif
   1787 	FUNC_END clzdi2
   1788 
   1789 #else /* defined (__ARM_FEATURE_CLZ) */
   1790 
   1791 ARM_FUNC_START clzdi2
   1792 	cmp	xxh, #0
   1793 	do_it	eq, et
   1794 	clzeq	r0, xxl
   1795 	clzne	r0, xxh
   1796 	addeq	r0, r0, #32
   1797 	RET
   1798 	FUNC_END clzdi2
   1799 
   1800 #endif
   1801 #endif /* L_clzdi2 */
   1802 
   1803 #ifdef L_ctzsi2
   1804 #ifdef NOT_ISA_TARGET_32BIT
   1805 FUNC_START ctzsi2
   1806 	neg	r1, r0
   1807 	and	r0, r0, r1
   1808 	mov	r1, #28
   1809 	mov	r3, #1
   1810 	lsl	r3, r3, #16
   1811 	cmp	r0, r3 /* 0x10000 */
   1812 	bcc	2f
   1813 	lsr	r0, r0, #16
   1814 	sub	r1, r1, #16
   1815 2:	lsr	r3, r3, #8
   1816 	cmp	r0, r3 /* #0x100 */
   1817 	bcc	2f
   1818 	lsr	r0, r0, #8
   1819 	sub	r1, r1, #8
   1820 2:	lsr	r3, r3, #4
   1821 	cmp	r0, r3 /* #0x10 */
   1822 	bcc	2f
   1823 	lsr	r0, r0, #4
   1824 	sub	r1, r1, #4
   1825 2:	adr	r2, 1f
   1826 	ldrb	r0, [r2, r0]
   1827 	sub	r0, r0, r1
   1828 	bx lr
   1829 .align 2
   1830 1:
   1831 .byte	27, 28, 29, 29, 30, 30, 30, 30, 31, 31, 31, 31, 31, 31, 31, 31
   1832 	FUNC_END ctzsi2
   1833 #else
   1834 ARM_FUNC_START ctzsi2
   1835 	rsb	r1, r0, #0
   1836 	and	r0, r0, r1
   1837 # if defined (__ARM_FEATURE_CLZ)
   1838 	clz	r0, r0
   1839 	rsb	r0, r0, #31
   1840 	RET
   1841 # else
   1842 	mov	r1, #28
   1843 	cmp	r0, #0x10000
   1844 	do_it	cs, t
   1845 	movcs	r0, r0, lsr #16
   1846 	subcs	r1, r1, #16
   1847 	cmp	r0, #0x100
   1848 	do_it	cs, t
   1849 	movcs	r0, r0, lsr #8
   1850 	subcs	r1, r1, #8
   1851 	cmp	r0, #0x10
   1852 	do_it	cs, t
   1853 	movcs	r0, r0, lsr #4
   1854 	subcs	r1, r1, #4
   1855 	adr	r2, 1f
   1856 	ldrb	r0, [r2, r0]
   1857 	sub	r0, r0, r1
   1858 	RET
   1859 .align 2
   1860 1:
   1861 .byte	27, 28, 29, 29, 30, 30, 30, 30, 31, 31, 31, 31, 31, 31, 31, 31
   1862 # endif /* !defined (__ARM_FEATURE_CLZ) */
   1863 	FUNC_END ctzsi2
   1864 #endif
   1865 #endif /* L_clzsi2 */
   1866 
   1867 /* ------------------------------------------------------------------------ */
   1868 /* These next two sections are here despite the fact that they contain Thumb
   1869    assembler because their presence allows interworked code to be linked even
   1870    when the GCC library is this one.  */
   1871 
   1872 /* Do not build the interworking functions when the target architecture does
   1873    not support Thumb instructions.  (This can be a multilib option).  */
   1874 #if defined __ARM_ARCH_4T__ || defined __ARM_ARCH_5T__\
   1875       || defined __ARM_ARCH_5TE__ || defined __ARM_ARCH_5TEJ__ \
   1876       || __ARM_ARCH >= 6
   1877 
   1878 #if defined L_call_via_rX
   1879 
   1880 /* These labels & instructions are used by the Arm/Thumb interworking code.
   1881    The address of function to be called is loaded into a register and then
   1882    one of these labels is called via a BL instruction.  This puts the
   1883    return address into the link register with the bottom bit set, and the
   1884    code here switches to the correct mode before executing the function.  */
   1885 
   1886 	.text
   1887 	.align 0
   1888         .force_thumb
   1889 
   1890 .macro call_via register
   1891 	THUMB_FUNC_START _call_via_\register
   1892 
   1893 	bx	\register
   1894 	nop
   1895 
   1896 	SIZE	(_call_via_\register)
   1897 .endm
   1898 
   1899 	call_via r0
   1900 	call_via r1
   1901 	call_via r2
   1902 	call_via r3
   1903 	call_via r4
   1904 	call_via r5
   1905 	call_via r6
   1906 	call_via r7
   1907 	call_via r8
   1908 	call_via r9
   1909 	call_via sl
   1910 	call_via fp
   1911 	call_via ip
   1912 	call_via sp
   1913 	call_via lr
   1914 
   1915 #endif /* L_call_via_rX */
   1916 
   1917 /* Don't bother with the old interworking routines for Thumb-2.  */
   1918 /* ??? Maybe only omit these on "m" variants.  */
   1919 #if !defined(__thumb2__) && __ARM_ARCH_ISA_ARM
   1920 
   1921 #if defined L_interwork_call_via_rX
   1922 
   1923 /* These labels & instructions are used by the Arm/Thumb interworking code,
   1924    when the target address is in an unknown instruction set.  The address
   1925    of function to be called is loaded into a register and then one of these
   1926    labels is called via a BL instruction.  This puts the return address
   1927    into the link register with the bottom bit set, and the code here
   1928    switches to the correct mode before executing the function.  Unfortunately
   1929    the target code cannot be relied upon to return via a BX instruction, so
   1930    instead we have to store the resturn address on the stack and allow the
   1931    called function to return here instead.  Upon return we recover the real
   1932    return address and use a BX to get back to Thumb mode.
   1933 
   1934    There are three variations of this code.  The first,
   1935    _interwork_call_via_rN(), will push the return address onto the
   1936    stack and pop it in _arm_return().  It should only be used if all
   1937    arguments are passed in registers.
   1938 
   1939    The second, _interwork_r7_call_via_rN(), instead stores the return
   1940    address at [r7, #-4].  It is the caller's responsibility to ensure
   1941    that this address is valid and contains no useful data.
   1942 
   1943    The third, _interwork_r11_call_via_rN(), works in the same way but
   1944    uses r11 instead of r7.  It is useful if the caller does not really
   1945    need a frame pointer.  */
   1946 
   1947 	.text
   1948 	.align 0
   1949 
   1950 	.code   32
   1951 	.globl _arm_return
   1952 LSYM(Lstart_arm_return):
   1953 	cfi_start	LSYM(Lstart_arm_return) LSYM(Lend_arm_return)
   1954 	cfi_push	0, 0xe, -0x8, 0x8
   1955 	nop	@ This nop is for the benefit of debuggers, so that
   1956 		@ backtraces will use the correct unwind information.
   1957 _arm_return:
   1958 	RETLDM	unwind=LSYM(Lstart_arm_return)
   1959 	cfi_end	LSYM(Lend_arm_return)
   1960 
   1961 	.globl _arm_return_r7
   1962 _arm_return_r7:
   1963 	ldr	lr, [r7, #-4]
   1964 	bx	lr
   1965 
   1966 	.globl _arm_return_r11
   1967 _arm_return_r11:
   1968 	ldr	lr, [r11, #-4]
   1969 	bx	lr
   1970 
   1971 .macro interwork_with_frame frame, register, name, return
   1972 	.code	16
   1973 
   1974 	THUMB_FUNC_START \name
   1975 
   1976 	bx	pc
   1977 	nop
   1978 
   1979 	.code	32
   1980 	tst	\register, #1
   1981 	streq	lr, [\frame, #-4]
   1982 	adreq	lr, _arm_return_\frame
   1983 	bx	\register
   1984 
   1985 	SIZE	(\name)
   1986 .endm
   1987 
   1988 .macro interwork register
   1989 	.code	16
   1990 
   1991 	THUMB_FUNC_START _interwork_call_via_\register
   1992 
   1993 	bx	pc
   1994 	nop
   1995 
   1996 	.code	32
   1997 	.globl LSYM(Lchange_\register)
   1998 LSYM(Lchange_\register):
   1999 	tst	\register, #1
   2000 	streq	lr, [sp, #-8]!
   2001 	adreq	lr, _arm_return
   2002 	bx	\register
   2003 
   2004 	SIZE	(_interwork_call_via_\register)
   2005 
   2006 	interwork_with_frame r7,\register,_interwork_r7_call_via_\register
   2007 	interwork_with_frame r11,\register,_interwork_r11_call_via_\register
   2008 .endm
   2009 
   2010 	interwork r0
   2011 	interwork r1
   2012 	interwork r2
   2013 	interwork r3
   2014 	interwork r4
   2015 	interwork r5
   2016 	interwork r6
   2017 	interwork r7
   2018 	interwork r8
   2019 	interwork r9
   2020 	interwork sl
   2021 	interwork fp
   2022 	interwork ip
   2023 	interwork sp
   2024 
   2025 	/* The LR case has to be handled a little differently...  */
   2026 	.code 16
   2027 
   2028 	THUMB_FUNC_START _interwork_call_via_lr
   2029 
   2030 	bx 	pc
   2031 	nop
   2032 
   2033 	.code 32
   2034 	.globl .Lchange_lr
   2035 .Lchange_lr:
   2036 	tst	lr, #1
   2037 	stmeqdb	r13!, {lr, pc}
   2038 	mov	ip, lr
   2039 	adreq	lr, _arm_return
   2040 	bx	ip
   2041 
   2042 	SIZE	(_interwork_call_via_lr)
   2043 
   2044 #endif /* L_interwork_call_via_rX */
   2045 #endif /* !__thumb2__ */
   2046 
   2047 /* Functions to support compact pic switch tables in thumb1 state.
   2048    All these routines take an index into the table in r0.  The
   2049    table is at LR & ~1 (but this must be rounded up in the case
   2050    of 32-bit entires).  They are only permitted to clobber r12
   2051    and r14 and r0 must be preserved on exit.  */
   2052 #ifdef L_thumb1_case_sqi
   2053 
   2054 	.text
   2055 	.align 0
   2056         .force_thumb
   2057 	.syntax unified
   2058 	THUMB_FUNC_START __gnu_thumb1_case_sqi
   2059 	push	{r1}
   2060 	mov	r1, lr
   2061 	lsrs	r1, r1, #1
   2062 	lsls	r1, r1, #1
   2063 	ldrsb	r1, [r1, r0]
   2064 	lsls	r1, r1, #1
   2065 	add	lr, lr, r1
   2066 	pop	{r1}
   2067 	bx	lr
   2068 	SIZE (__gnu_thumb1_case_sqi)
   2069 #endif
   2070 
   2071 #ifdef L_thumb1_case_uqi
   2072 
   2073 	.text
   2074 	.align 0
   2075         .force_thumb
   2076 	.syntax unified
   2077 	THUMB_FUNC_START __gnu_thumb1_case_uqi
   2078 	push	{r1}
   2079 	mov	r1, lr
   2080 	lsrs	r1, r1, #1
   2081 	lsls	r1, r1, #1
   2082 	ldrb	r1, [r1, r0]
   2083 	lsls	r1, r1, #1
   2084 	add	lr, lr, r1
   2085 	pop	{r1}
   2086 	bx	lr
   2087 	SIZE (__gnu_thumb1_case_uqi)
   2088 #endif
   2089 
   2090 #ifdef L_thumb1_case_shi
   2091 
   2092 	.text
   2093 	.align 0
   2094         .force_thumb
   2095 	.syntax unified
   2096 	THUMB_FUNC_START __gnu_thumb1_case_shi
   2097 	push	{r0, r1}
   2098 	mov	r1, lr
   2099 	lsrs	r1, r1, #1
   2100 	lsls	r0, r0, #1
   2101 	lsls	r1, r1, #1
   2102 	ldrsh	r1, [r1, r0]
   2103 	lsls	r1, r1, #1
   2104 	add	lr, lr, r1
   2105 	pop	{r0, r1}
   2106 	bx	lr
   2107 	SIZE (__gnu_thumb1_case_shi)
   2108 #endif
   2109 
   2110 #ifdef L_thumb1_case_uhi
   2111 
   2112 	.text
   2113 	.align 0
   2114         .force_thumb
   2115 	.syntax unified
   2116 	THUMB_FUNC_START __gnu_thumb1_case_uhi
   2117 	push	{r0, r1}
   2118 	mov	r1, lr
   2119 	lsrs	r1, r1, #1
   2120 	lsls	r0, r0, #1
   2121 	lsls	r1, r1, #1
   2122 	ldrh	r1, [r1, r0]
   2123 	lsls	r1, r1, #1
   2124 	add	lr, lr, r1
   2125 	pop	{r0, r1}
   2126 	bx	lr
   2127 	SIZE (__gnu_thumb1_case_uhi)
   2128 #endif
   2129 
   2130 #ifdef L_thumb1_case_si
   2131 
   2132 	.text
   2133 	.align 0
   2134         .force_thumb
   2135 	.syntax unified
   2136 	THUMB_FUNC_START __gnu_thumb1_case_si
   2137 	push	{r0, r1}
   2138 	mov	r1, lr
   2139 	adds.n	r1, r1, #2	/* Align to word.  */
   2140 	lsrs	r1, r1, #2
   2141 	lsls	r0, r0, #2
   2142 	lsls	r1, r1, #2
   2143 	ldr	r0, [r1, r0]
   2144 	adds	r0, r0, r1
   2145 	mov	lr, r0
   2146 	pop	{r0, r1}
   2147 	mov	pc, lr		/* We know we were called from thumb code.  */
   2148 	SIZE (__gnu_thumb1_case_si)
   2149 #endif
   2150 
   2151 #endif /* Arch supports thumb.  */
   2152 
   2153 .macro CFI_START_FUNCTION
   2154 	.cfi_startproc
   2155 	.cfi_remember_state
   2156 .endm
   2157 
   2158 .macro CFI_END_FUNCTION
   2159 	.cfi_restore_state
   2160 	.cfi_endproc
   2161 .endm
   2162 
   2163 #ifndef __symbian__
   2164 /* The condition here must match the one in gcc/config/arm/elf.h and
   2165    libgcc/config/arm/t-elf.  */
   2166 #ifndef NOT_ISA_TARGET_32BIT
   2167 #include "ieee754-df.S"
   2168 #include "ieee754-sf.S"
   2169 #include "bpabi.S"
   2170 #else /* NOT_ISA_TARGET_32BIT */
   2171 #include "bpabi-v6m.S"
   2172 #endif /* NOT_ISA_TARGET_32BIT */
   2173 #endif /* !__symbian__ */
   2174