Home | History | Annotate | Line # | Download | only in ia64
      1  1.1  cherry .file "__udivsi3.s"
      2  1.1  cherry 
      3  1.2  cherry // $NetBSD: udivsi3.S,v 1.2 2006/04/07 14:27:33 cherry Exp $
      4  1.1  cherry 
      5  1.1  cherry //-
      6  1.1  cherry // Copyright (c) 2000, Intel Corporation
      7  1.1  cherry // All rights reserved.
      8  1.1  cherry //
      9  1.1  cherry // Contributed 2/15/2000 by Marius Cornea, John Harrison, Cristina Iordache,
     10  1.1  cherry // Ted Kubaska, Bob Norin, and Shane Story of the Computational Software Lab,
     11  1.1  cherry // Intel Corporation.
     12  1.1  cherry //
     13  1.1  cherry // WARRANTY DISCLAIMER
     14  1.1  cherry //
     15  1.1  cherry // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
     16  1.1  cherry // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
     17  1.1  cherry // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
     18  1.1  cherry // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL INTEL OR ITS
     19  1.1  cherry // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
     20  1.1  cherry // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
     21  1.1  cherry // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
     22  1.1  cherry // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
     23  1.1  cherry // OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY OR TORT (INCLUDING
     24  1.1  cherry // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
     25  1.1  cherry // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     26  1.1  cherry //
     27  1.1  cherry // Intel Corporation is the author of this code, and requests that all
     28  1.1  cherry // problem reports or change requests be submitted to it directly at
     29  1.1  cherry // http://developer.intel.com/opensource.
     30  1.1  cherry //
     31  1.1  cherry 
     32  1.1  cherry .section .text
     33  1.1  cherry 
     34  1.1  cherry // 32-bit unsigned integer divide
     35  1.1  cherry 
     36  1.1  cherry .proc __udivsi3#
     37  1.1  cherry .align 32
     38  1.1  cherry .global __udivsi3#
     39  1.1  cherry .align 32
     40  1.1  cherry 
     41  1.1  cherry __udivsi3:
     42  1.1  cherry 
     43  1.1  cherry { .mii
     44  1.1  cherry   alloc r31=ar.pfs,2,0,0,0
     45  1.1  cherry   nop.i 0
     46  1.1  cherry   nop.i 0;;
     47  1.1  cherry } { .mii
     48  1.1  cherry   nop.m 0
     49  1.1  cherry 
     50  1.1  cherry   // 32-BIT UNSIGNED INTEGER DIVIDE BEGINS HERE
     51  1.1  cherry 
     52  1.1  cherry   // general register used:
     53  1.1  cherry   //    r32 - 32-bit unsigned integer dividend
     54  1.1  cherry   //    r33 - 32-bit unsigned integer divisor
     55  1.1  cherry   //    r8 - 32-bit unsigned integer result
     56  1.1  cherry   //    r2 - scratch register
     57  1.1  cherry   // floating-point registers used: f6, f7, f8, f9
     58  1.1  cherry   // predicate registers used: p6
     59  1.1  cherry 
     60  1.1  cherry   zxt4 r32=r32
     61  1.1  cherry   zxt4 r33=r33;;
     62  1.1  cherry } { .mmb
     63  1.1  cherry   setf.sig f6=r32
     64  1.1  cherry   setf.sig f7=r33
     65  1.1  cherry   nop.b 0;;
     66  1.1  cherry } { .mfi
     67  1.1  cherry   nop.m 0
     68  1.1  cherry   fcvt.xf f6=f6
     69  1.1  cherry   nop.i 0
     70  1.1  cherry } { .mfi
     71  1.1  cherry   nop.m 0
     72  1.1  cherry   fcvt.xf f7=f7
     73  1.1  cherry   mov r2 = 0x0ffdd;;
     74  1.1  cherry } { .mfi
     75  1.1  cherry   setf.exp f9 = r2
     76  1.1  cherry   // (1) y0
     77  1.1  cherry   frcpa.s1 f8,p6=f6,f7
     78  1.1  cherry   nop.i 0;;
     79  1.1  cherry } { .mfi
     80  1.1  cherry   nop.m 0
     81  1.1  cherry   // (2) q0 = a * y0
     82  1.1  cherry   (p6) fma.s1 f6=f6,f8,f0
     83  1.1  cherry   nop.i 0
     84  1.1  cherry } { .mfi
     85  1.1  cherry   nop.m 0
     86  1.1  cherry   // (3) e0 = 1 - b * y0
     87  1.1  cherry   (p6) fnma.s1 f7=f7,f8,f1
     88  1.1  cherry   nop.i 0;;
     89  1.1  cherry } { .mfi
     90  1.1  cherry   nop.m 0
     91  1.1  cherry   // (4) q1 = q0 + e0 * q0
     92  1.1  cherry   (p6) fma.s1 f6=f7,f6,f6
     93  1.1  cherry   nop.i 0
     94  1.1  cherry } { .mfi
     95  1.1  cherry   nop.m 0
     96  1.1  cherry   // (5) e1 = e0 * e0 + 2^-34
     97  1.1  cherry   (p6) fma.s1 f7=f7,f7,f9
     98  1.1  cherry   nop.i 0;;
     99  1.1  cherry } { .mfi
    100  1.1  cherry   nop.m 0
    101  1.1  cherry   // (6) q2 = q1 + e1 * q1
    102  1.1  cherry   (p6) fma.s1 f8=f7,f6,f6
    103  1.1  cherry   nop.i 0;;
    104  1.1  cherry } { .mfi
    105  1.1  cherry   nop.m 0
    106  1.1  cherry   // (7) q = trunc(q2)
    107  1.1  cherry   fcvt.fxu.trunc.s1 f8=f8
    108  1.1  cherry   nop.i 0;;
    109  1.1  cherry } { .mmi
    110  1.1  cherry   // quotient will be in the least significant 32 bits of r8 (if b != 0)
    111  1.1  cherry   getf.sig r8=f8
    112  1.1  cherry   nop.m 0
    113  1.1  cherry   nop.i 0;;
    114  1.1  cherry }
    115  1.1  cherry 
    116  1.1  cherry   // 32-BIT UNSIGNED INTEGER DIVIDE ENDS HERE
    117  1.1  cherry 
    118  1.1  cherry { .mmb
    119  1.1  cherry   nop.m 0
    120  1.1  cherry   nop.m 0
    121  1.1  cherry   br.ret.sptk b0;;
    122  1.1  cherry }
    123  1.1  cherry 
    124  1.1  cherry .endp __udivsi3
    125