2 * Copyright (c) 2005 Josef Cejka
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
9 * - Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * - Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
14 * - The name of the author may not be used to endorse or promote products
15 * derived from this software without specific prior written permission.
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 /** @addtogroup softfloat
38 /* Table for fast leading zeroes counting */
39 char zeroTable
[256] = {
40 8, 7, 7, 6, 6, 6, 6, 4, 4, 4, 4, 4, 4, 4, 4, \
41 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, \
42 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, \
43 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, \
44 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, \
45 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, \
46 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, \
47 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, \
48 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, \
49 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, \
50 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, \
51 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, \
52 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, \
53 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, \
54 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, \
55 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
60 /** Take fraction shifted by 10 bits to left, round it, normalize it and detect exceptions
61 * @param cexp exponent with bias
62 * @param cfrac fraction shifted 10 places left with added hidden bit
64 * @return valied float64
66 float64
finishFloat64(int32_t cexp
, uint64_t cfrac
, char sign
)
70 result
.parts
.sign
= sign
;
72 /* find first nonzero digit and shift result and detect possibly underflow */
73 while ((cexp
> 0) && (cfrac
) && (!(cfrac
& (FLOAT64_HIDDEN_BIT_MASK
<< (64 - FLOAT64_FRACTION_SIZE
- 1 ) )))) {
76 /* TODO: fix underflow */
79 if ((cexp
< 0) || ( cexp
== 0 && (!(cfrac
& (FLOAT64_HIDDEN_BIT_MASK
<< (64 - FLOAT64_FRACTION_SIZE
- 1)))))) {
80 /* FIXME: underflow */
82 if ((cexp
+ FLOAT64_FRACTION_SIZE
+ 1) < 0) { /* +1 is place for rounding */
83 result
.parts
.fraction
= 0;
92 cfrac
+= (0x1 << (64 - FLOAT64_FRACTION_SIZE
- 3));
94 if (!(cfrac
& (FLOAT64_HIDDEN_BIT_MASK
<< (64 - FLOAT64_FRACTION_SIZE
- 1)))) {
96 result
.parts
.fraction
= ((cfrac
>>(64 - FLOAT64_FRACTION_SIZE
- 2) ) & (~FLOAT64_HIDDEN_BIT_MASK
));
100 cfrac
+= (0x1 << (64 - FLOAT64_FRACTION_SIZE
- 3));
105 if (cfrac
& (FLOAT64_HIDDEN_BIT_MASK
<< (64 - FLOAT64_FRACTION_SIZE
- 1 ))) {
111 if (cexp
>= FLOAT64_MAX_EXPONENT
) {
112 /* FIXME: overflow, return infinity */
113 result
.parts
.exp
= FLOAT64_MAX_EXPONENT
;
114 result
.parts
.fraction
= 0;
118 result
.parts
.exp
= (uint32_t)cexp
;
120 result
.parts
.fraction
= ((cfrac
>>(64 - FLOAT64_FRACTION_SIZE
- 2 ) ) & (~FLOAT64_HIDDEN_BIT_MASK
));
125 /** Counts leading zeroes in 64bit unsigned integer
128 int countZeroes64(uint64_t i
)
131 for (j
=0; j
< 64; j
+= 8) {
132 if ( i
& (0xFFll
<< (56 - j
))) {
133 return (j
+ countZeroes8(i
>> (56 - j
)));
140 /** Counts leading zeroes in 32bit unsigned integer
143 int countZeroes32(uint32_t i
)
146 for (j
=0; j
< 32; j
+= 8) {
147 if ( i
& (0xFF << (24 - j
))) {
148 return (j
+ countZeroes8(i
>> (24 - j
)));
155 /** Counts leading zeroes in byte
158 int countZeroes8(uint8_t i
)
163 /** Round and normalize number expressed by exponent and fraction with first bit (equal to hidden bit) at 30. bit
164 * @param exp exponent
165 * @param fraction part with hidden bit shifted to 30. bit
167 void roundFloat32(int32_t *exp
, uint32_t *fraction
)
169 /* rounding - if first bit after fraction is set then round up */
170 (*fraction
) += (0x1 << 6);
172 if ((*fraction
) & (FLOAT32_HIDDEN_BIT_MASK
<< 8)) {
173 /* rounding overflow */
178 if (((*exp
) >= FLOAT32_MAX_EXPONENT
) || ((*exp
) < 0)) {
179 /* overflow - set infinity as result */
180 (*exp
) = FLOAT32_MAX_EXPONENT
;
188 /** Round and normalize number expressed by exponent and fraction with first bit (equal to hidden bit) at 62. bit
189 * @param exp exponent
190 * @param fraction part with hidden bit shifted to 62. bit
192 void roundFloat64(int32_t *exp
, uint64_t *fraction
)
194 /* rounding - if first bit after fraction is set then round up */
195 (*fraction
) += (0x1 << 9);
197 if ((*fraction
) & (FLOAT64_HIDDEN_BIT_MASK
<< 11)) {
198 /* rounding overflow */
203 if (((*exp
) >= FLOAT64_MAX_EXPONENT
) || ((*exp
) < 0)) {
204 /* overflow - set infinity as result */
205 (*exp
) = FLOAT64_MAX_EXPONENT
;