4 // Copyright (c) 2000 - 2003, Intel Corporation
5 // All rights reserved.
7 // Contributed 2000 by the Intel Numerics Group, Intel Corporation
9 // Redistribution and use in source and binary forms, with or without
10 // modification, are permitted provided that the following conditions are
13 // * Redistributions of source code must retain the above copyright
14 // notice, this list of conditions and the following disclaimer.
16 // * Redistributions in binary form must reproduce the above copyright
17 // notice, this list of conditions and the following disclaimer in the
18 // documentation and/or other materials provided with the distribution.
20 // * The name of Intel Corporation may not be used to endorse or promote
21 // products derived from this software without specific prior written
24 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
25 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
26 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
27 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL INTEL OR ITS
28 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
29 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
30 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
31 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
32 // OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY OR TORT (INCLUDING
33 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
34 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 // Intel Corporation is the author of this code, and requests that all
37 // problem reports or change requests be submitted to it directly at
38 // http://www.intel.com/software/products/opensource/libraries/num.htm.
41 //==============================================================
42 // 02/02/00 Initial version
43 // 04/04/00 Improved speed, corrected result for NaN input
44 // 05/30/00 Fixed bug for exponent 0x1003e
45 // 12/22/00 Fixed so inexact flag is never set, and invalid is not set for
46 // qnans nor for inputs larger than 2^63.
47 // 05/20/02 Cleaned up namespace and sf0 syntax
48 // 02/10/03 Reordered header: .section, .global, .proc, .align
51 //==============================================================
52 // long double modfl(long double x, long double *iptr)
53 // break a floating point x number into fraction and an exponent
55 // input floating point f8, address in r34
56 // output floating point f8 (x fraction), and *iptr (x integral part)
59 //==============================================================
61 // NO FRACTIONAL PART: HUGE
63 // for double-extended
64 // If the true exponent is >= 63
65 // 1003e ==> 1003e -ffff = 3f = 63(dec)
67 // we are already an integer (p9 true)
69 // NO INTEGER PART: SMALL
70 // Is f8 exponent less than register bias (that is, is it
71 // less than 1). If it is, get the right sign of
72 // zero and store this in iptr.
74 // CALCULATION: NOT HUGE, NOT SMALL
75 // To get the integer part
76 // Take the floating-point input and truncate
77 // then convert this integer to fp Call it MODF_INTEGER_PART
79 // Subtract MODF_INTEGER_PART from MODF_NORM_F8 to get fraction part
80 // Then put fraction part in f8
81 // put integer part MODF_INTEGER_PART into *iptr
84 //==============================================================
86 // predicate registers used:
90 // -----------------------+-----------------+-------------
91 // SMALL | NORMAL | HUGE
92 // p11 --------------->|<----- p12 ----->| <-------------- p9
93 // p10 --------------------------------->|
94 // p13 --------------------------------------------------->|
97 // floating-point registers used:
99 MODF_FRACTION_PART = f10
100 MODF_INTEGER_PART = f11
101 MODF_INT_INTEGER_PART = f12
104 // general registers used
106 modf_GR_no_frac = r15
114 GLOBAL_LIBM_ENTRY(modfl)
116 // Main path is p9, p11, p8 FALSE and p12 TRUE
118 // Assume input is normalized and get signexp
119 // Normalize input just in case
120 // Form exponent bias
122 getf.exp modf_signexp = f8
123 fnorm.s0 MODF_NORM_F8 = f8
124 addl modf_GR_FFFF = 0xffff, r0
126 // Get integer part of input
127 // Form exponent mask
130 fcvt.fx.trunc.s1 MODF_INT_INTEGER_PART = f8
131 mov modf_17_ones = 0x1ffff ;;
135 // qnan snan inf norm unorm 0 -+
136 // 1 1 1 0 0 0 11 = 0xe3 NAN_INF
137 // Form biased exponent where input only has an integer part
140 fclass.m.unc p6,p13 = f8, 0xe3
141 addl modf_GR_no_frac = 0x1003e, r0 ;;
144 // Mask to get exponent
146 // qnan snan inf norm unorm 0 -+
147 // 0 0 0 0 1 0 11 = 0x0b UNORM
148 // Set p13 to indicate calculation path, else p6 if nan or inf
150 and modf_exp = modf_17_ones, modf_signexp
151 fclass.m.unc p8,p0 = f8, 0x0b
155 // p11 <== SMALL, no integer part, fraction is everyting
156 // p9 <== HUGE, no fraction part, integer is everything
157 // p12 <== NORMAL, fraction part and integer part
159 (p13) cmp.lt.unc p11,p10 = modf_exp, modf_GR_FFFF
164 // Is x inf? p6 if inf, p7 if nan
166 (p10) cmp.ge.unc p9,p12 = modf_exp, modf_GR_no_frac
167 (p6) fclass.m.unc p6,p7 = f8, 0x23
168 (p8) br.cond.spnt MODF_DENORM ;;
172 // For HUGE set fraction to signed 0
175 (p9) fmerge.s f8 = f8,f0
178 // For HUGE set integer part to normalized input
181 (p9) fnorm.s0 MODF_INTEGER_PART = MODF_NORM_F8
185 // For SMALL set fraction to normalized input, integer part to signed 0
188 (p11) fmerge.s MODF_INTEGER_PART = f8,f0
193 (p11) fnorm.s0 f8 = MODF_NORM_F8
197 // For NORMAL float the integer part
200 (p12) fcvt.xf MODF_INTEGER_PART = MODF_INT_INTEGER_PART
204 // If x inf set integer part to INF, fraction to signed 0
206 (p6) stfe [r34] = MODF_NORM_F8
207 (p6) fmerge.s f8 = f8,f0
211 // If x nan set integer and fraction parts to NaN (quietized)
213 (p7) stfe [r34] = MODF_NORM_F8
214 (p7) fmerge.s f8 = MODF_NORM_F8, MODF_NORM_F8
219 (p9) stfe [r34] = MODF_INTEGER_PART
224 // For NORMAL compute fraction part
226 (p11) stfe [r34] = MODF_INTEGER_PART
227 (p12) fms.s0 f8 = MODF_NORM_F8,f1, MODF_INTEGER_PART
231 // For NORMAL test if fraction part is zero; if so append correct sign
234 (p12) fcmp.eq.unc.s0 p7,p0 = MODF_NORM_F8, MODF_INTEGER_PART
239 (p12) stfe [r34] = MODF_INTEGER_PART
244 // For NORMAL if fraction part is zero append sign of input
247 (p7) fmerge.s f8 = MODF_NORM_F8, f0
252 // If x unorm get signexp from normalized input
253 // If x unorm get integer part from normalized input
255 getf.exp modf_signexp = MODF_NORM_F8
256 fcvt.fx.trunc.s1 MODF_INT_INTEGER_PART = MODF_NORM_F8
260 // If x unorm mask to get exponent
262 and modf_exp = modf_17_ones, modf_signexp ;;
263 cmp.lt.unc p11,p10 = modf_exp, modf_GR_FFFF
268 (p10) cmp.ge.unc p9,p12 = modf_exp, modf_GR_no_frac
270 br.cond.spnt MODF_COMMON ;;
273 GLOBAL_LIBM_END(modfl)