/* ===-- clzsi2.c - Implement __clzsi2 -------------------------------------===
 *
 *                     The LLVM Compiler Infrastructure
 *
 * This file is dual licensed under the MIT and the University of Illinois Open
 * Source Licenses. See LICENSE.TXT for details.
 *
 * ===----------------------------------------------------------------------===
 *
 * This file implements count leading zeros for 32-bit arguments.
 *
 * ===----------------------------------------------------------------------===
 */
#include "../assembly.h"

        .syntax unified
        .text
#if __ARM_ARCH_ISA_THUMB == 2
        .thumb
#endif

/*
 * __clzsi2: count the leading zero bits of a 32-bit value.
 *
 *   In:       r0 = n (assumed to be non-zero)
 *   Out:      r0 = number of leading zero bits in n
 *   Clobbers: nothing else when the CLZ instruction is used;
 *             r1, r2 and the condition flags on the fallback path.
 *
 * n == 0 is outside the contract and is not handled specially: the CLZ
 * instruction yields 32 for it, while the fallback sequence below yields 31.
 *
 * The return is done through the JMP() macro, which (like the
 * DEFINE_/END_COMPILERRT_* macros) comes from assembly.h.
 */
        .p2align 2
#if __ARM_ARCH_ISA_THUMB == 2
DEFINE_COMPILERRT_THUMB_FUNCTION(__clzsi2)
#else
DEFINE_COMPILERRT_FUNCTION(__clzsi2)
#endif
#ifdef __ARM_FEATURE_CLZ
        clz     r0, r0
        JMP(lr)
#else
        /* Assumption: n != 0 */

        /*
         * r0: n
         * r1: count of leading zeros in n + 1
         * r2: scratch register for shifted r0
         */
        mov     r1, 1

        /*
         * Basic block:
         * if ((r0 >> SHIFT) == 0)
         *   r1 += SHIFT;
         * else
         *   r0 >>= SHIFT;
         * for descending powers of two as SHIFT.
         *
         * lsrs sets Z from the shifted value; neither the IT instruction nor
         * the two conditional instructions modify the flags.
         *
         * The explicit "ite ne" keeps the sequence valid if it is ever
         * assembled as Thumb-2, where conditional instructions must sit in an
         * IT block. In ARM state the assembler accepts IT under unified
         * syntax and emits no code for it.
         *
         * The immediate is written without a leading '#': inside a
         * function-like preprocessor macro, '#' followed by a parameter name
         * would be the stringizing operator.
         */

#define BLOCK(shift) \
        lsrs    r2, r0, shift; \
        ite     ne; \
        movne   r0, r2; \
        addeq   r1, shift

        BLOCK(16)
        BLOCK(8)
        BLOCK(4)
        BLOCK(2)

#undef BLOCK

        /*
         * The basic block invariants at this point are (r0 >> 2) == 0 and
         * r0 != 0. This means 1 <= r0 <= 3 and 0 <= (r0 >> 1) <= 1.
         *
         * r0 | (r0 >> 1) == 0 | (r0 >> 1) == 1 | -(r0 >> 1) | 1 - (r0 >> 1)
         * ---+----------------+----------------+------------+--------------
         * 1  | 1              | 0              |  0         | 1
         * 2  | 0              | 1              | -1         | 0
         * 3  | 0              | 1              | -1         | 0
         *
         * The remaining contribution is 1 - (r0 >> 1). The leading 1 of that
         * term is already present in r1 (it was initialised to 1), so only
         * (r0 >> 1) has to be subtracted here.
         */
        sub     r0, r1, r0, lsr #1

        JMP(lr)
#endif /* __ARM_FEATURE_CLZ */
END_COMPILERRT_FUNCTION(__clzsi2)