Home | History | Annotate | Line # | Download | only in ia64
      1  1.1  cherry .file "__umoddi3.s"
      2  1.1  cherry 
      3  1.2  cherry // $NetBSD: umoddi3.S,v 1.2 2006/04/07 14:27:33 cherry Exp $
      4  1.1  cherry 
      5  1.1  cherry //-
      6  1.1  cherry // Copyright (c) 2000, Intel Corporation
      7  1.1  cherry // All rights reserved.
      8  1.1  cherry //
      9  1.1  cherry // Contributed 2/15/2000 by Marius Cornea, John Harrison, Cristina Iordache,
     10  1.1  cherry // Ted Kubaska, Bob Norin, and Shane Story of the Computational Software Lab,
     11  1.1  cherry // Intel Corporation.
     12  1.1  cherry //
     13  1.1  cherry // WARRANTY DISCLAIMER
     14  1.1  cherry //
     15  1.1  cherry // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
     16  1.1  cherry // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
     17  1.1  cherry // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
     18  1.1  cherry // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL INTEL OR ITS
     19  1.1  cherry // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
     20  1.1  cherry // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
     21  1.1  cherry // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
     22  1.1  cherry // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
     23  1.1  cherry // OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY OR TORT (INCLUDING
     24  1.1  cherry // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
     25  1.1  cherry // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     26  1.1  cherry //
     27  1.1  cherry // Intel Corporation is the author of this code, and requests that all
     28  1.1  cherry // problem reports or change requests be submitted to it directly at
     29  1.1  cherry // http://developer.intel.com/opensource.
     30  1.1  cherry //
     31  1.1  cherry 
     32  1.1  cherry .section .text
     33  1.1  cherry 
     34  1.1  cherry   // 64-bit unsigned integer remainder
                       //
                       // __umoddi3: computes r8 = a mod b for 64-bit unsigned integers,
                       // with a in r32 and b in r33.
                       //
                       // Outline: a and b are converted to floating point, frcpa supplies an
                       // initial approximation of 1/b, and fused multiply-add steps (2)-(10)
                       // refine a quotient approximation q3.  q3 is truncated to an unsigned
                       // integer q and the remainder is formed with an integer multiply-add
                       // as a + (-b) * q.
                       //
                       // No correction step follows the truncation, so the code relies on
                       // trunc(q3) already being the exact quotient
                       // (NOTE(review): presumably guaranteed by the refinement sequence --
                       // confirm against Intel's published IA-64 divide algorithms).
                       //
                       // The routine contains no explicit test for b == 0.
                       //
                       // Registers written: r8, r31, r33, f6-f12, p6.
     35  1.1  cherry 
     36  1.1  cherry .proc __umoddi3#
     37  1.1  cherry .align 32
     38  1.1  cherry .global __umoddi3#
                     // NOTE(review): this second .align 32 repeats the one above; nothing is
                     // emitted between them, so it looks redundant.
     39  1.1  cherry .align 32
     40  1.1  cherry 
     41  1.1  cherry __umoddi3:
     42  1.1  cherry 
     43  1.1  cherry { .mii
                       // r31 receives the previous ar.pfs; the frame is declared with
                       // 3 inputs, 0 locals, 0 outputs, 0 rotating registers.  Only r32 and
                       // r33 are read below.
     44  1.1  cherry   alloc r31=ar.pfs,3,0,0,0
     45  1.1  cherry   nop.i 0
     46  1.1  cherry   nop.i 0
     47  1.1  cherry } { .mmb
     48  1.1  cherry 
     49  1.1  cherry   // 64-BIT UNSIGNED INTEGER REMAINDER BEGINS HERE
     50  1.1  cherry 
     51  1.1  cherry   // general registers used:
     52  1.1  cherry   //    r32 - 64-bit unsigned integer dividend, called a below
     53  1.1  cherry   //    r33 - 64-bit unsigned integer divisor, called b below (overwritten with -b)
     54  1.1  cherry   //    r8 - 64-bit unsigned integer result
     55  1.1  cherry   // floating-point registers used: f6, f7, f8, f9, f10, f11, f12
     56  1.1  cherry   // predicate registers used: p6
     57  1.1  cherry 
     58  1.1  cherry   setf.sig f12=r32  // holds a in integer form (kept until step (12))
     59  1.1  cherry   setf.sig f7=r33   // b in integer form, converted to floating point below
     60  1.1  cherry   nop.b 0;;
     61  1.1  cherry } { .mfi
     62  1.1  cherry   // get 2's complement of b (r33 = -b, moved into f7 after step (9))
     63  1.1  cherry   sub r33=r0,r33
                       // f6 = a converted from unsigned integer to floating point
     64  1.1  cherry   fcvt.xuf.s1 f6=f12
     65  1.1  cherry   nop.i 0
     66  1.1  cherry } { .mfi
     67  1.1  cherry   nop.m 0
                       // f7 = b converted from unsigned integer to floating point
     68  1.1  cherry   fcvt.xuf.s1 f7=f7
     69  1.1  cherry   nop.i 0;;
     70  1.1  cherry } { .mfi
     71  1.1  cherry   nop.m 0
     72  1.1  cherry   // Step (1)
     73  1.1  cherry   // y0 = approximation of 1 / b in f8; frcpa also writes p6, which
                       // predicates steps (2) through (10)
     74  1.1  cherry   frcpa.s1 f8,p6=f6,f7
     75  1.1  cherry   nop.i 0;;
     76  1.1  cherry } { .mfi
     77  1.1  cherry   nop.m 0
     78  1.1  cherry   // Step (2)
     79  1.1  cherry   // q0 = a * y0 in f10
     80  1.1  cherry   (p6) fma.s1 f10=f6,f8,f0
     81  1.1  cherry   nop.i 0
     82  1.1  cherry } { .mfi
     83  1.1  cherry   nop.m 0
     84  1.1  cherry   // Step (3)
     85  1.1  cherry   // e0 = 1 - b * y0 in f9
     86  1.1  cherry   (p6) fnma.s1 f9=f7,f8,f1
     87  1.1  cherry   nop.i 0;;
     88  1.1  cherry } { .mfi
     89  1.1  cherry   nop.m 0
     90  1.1  cherry   // Step (4)
     91  1.1  cherry   // q1 = q0 + e0 * q0 in f10
     92  1.1  cherry   (p6) fma.s1 f10=f9,f10,f10
     93  1.1  cherry   nop.i 0
     94  1.1  cherry } { .mfi
     95  1.1  cherry   nop.m 0
     96  1.1  cherry   // Step (5)
     97  1.1  cherry   // e1 = e0 * e0 in f11
     98  1.1  cherry   (p6) fma.s1 f11=f9,f9,f0
     99  1.1  cherry   nop.i 0;;
    100  1.1  cherry } { .mfi
    101  1.1  cherry   nop.m 0
    102  1.1  cherry   // Step (6)
    103  1.1  cherry   // y1 = y0 + e0 * y0 in f8
    104  1.1  cherry   (p6) fma.s1 f8=f9,f8,f8
    105  1.1  cherry   nop.i 0;;
    106  1.1  cherry } { .mfi
    107  1.1  cherry   nop.m 0
    108  1.1  cherry   // Step (7)
    109  1.1  cherry   // q2 = q1 + e1 * q1 in f9 (e0 in f9 is no longer needed)
    110  1.1  cherry   (p6) fma.s1 f9=f11,f10,f10
    111  1.1  cherry   nop.i 0;;
    112  1.1  cherry } { .mfi
    113  1.1  cherry   nop.m 0
    114  1.1  cherry   // Step (8)
    115  1.1  cherry   // y2 = y1 + e1 * y1 in f8
    116  1.1  cherry   (p6) fma.s1 f8=f11,f8,f8
    117  1.1  cherry   nop.i 0;;
    118  1.1  cherry } { .mfi
    119  1.1  cherry   nop.m 0
    120  1.1  cherry   // Step (9)
    121  1.1  cherry   // r2 = a - b * q2 in f10 (last use of the floating-point b in f7)
    122  1.1  cherry   (p6) fnma.s1 f10=f7,f9,f6
    123  1.1  cherry   nop.i 0;;
    124  1.1  cherry } { .mfi
    125  1.1  cherry   // f7 = -b in integer form (r33 was negated above); replaces the
                       // floating-point b, which is not read again
    126  1.1  cherry   setf.sig f7=r33
    127  1.1  cherry   // Step (10)
    128  1.1  cherry   // q3 = q2 + r2 * y2 in f8
    129  1.1  cherry   (p6) fma.s1 f8=f10,f8,f9
    130  1.1  cherry   nop.i 0;;
    131  1.1  cherry } { .mfi
    132  1.1  cherry   nop.m 0
    133  1.1  cherry   // (11) q = trunc(q3), as an unsigned integer in f8 (not predicated on p6)
    134  1.1  cherry   fcvt.fxu.trunc.s1 f8=f8
    135  1.1  cherry   nop.i 0;;
    136  1.1  cherry }  { .mfi
    137  1.1  cherry   nop.m 0
    138  1.1  cherry   // (12) r = a + (-b) * q, low 64 bits of the integer multiply-add
    139  1.1  cherry   xma.l f8=f8,f7,f12
    140  1.1  cherry   nop.i 0;;
    141  1.1  cherry }  { .mib
                       // move the remainder into the result register r8
    142  1.1  cherry   getf.sig r8=f8
    143  1.1  cherry   nop.i 0
    144  1.1  cherry   nop.b 0
    145  1.1  cherry }
    146  1.1  cherry 
    147  1.1  cherry   // 64-BIT UNSIGNED INTEGER REMAINDER ENDS HERE
    148  1.1  cherry 
    149  1.1  cherry { .mib
    150  1.1  cherry   nop.m 0
    151  1.1  cherry   nop.i 0
                       // return to the caller through b0
    152  1.1  cherry   br.ret.sptk b0;;
    153  1.1  cherry }
    154  1.1  cherry 
    155  1.1  cherry .endp __umoddi3
    156