2 * Linux/PA-RISC Project (http://www.parisc-linux.org/)
4 * Floating-point emulation code
5 * Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org>
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2, or (at your option)
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
25 * @(#) pa/spmath/dfmpy.c $Revision: 1.1 $
28 * Double Precision Floating-point Multiply
30 * External Interfaces:
31 * dbl_fmpy(srcptr1,srcptr2,dstptr,status)
33 * Internal Interfaces:
36 * <<please update with a overview of the operation of this file>>
43 #include "dbl_float.h"
46 * Double Precision Floating-point Multiply
51 dbl_floating_point
*srcptr1
,
52 dbl_floating_point
*srcptr2
,
53 dbl_floating_point
*dstptr
,
56 register unsigned int opnd1p1
, opnd1p2
, opnd2p1
, opnd2p2
;
57 register unsigned int opnd3p1
, opnd3p2
, resultp1
, resultp2
;
58 register int dest_exponent
, count
;
59 register boolean inexact
= FALSE
, guardbit
= FALSE
, stickybit
= FALSE
;
62 Dbl_copyfromptr(srcptr1
,opnd1p1
,opnd1p2
);
63 Dbl_copyfromptr(srcptr2
,opnd2p1
,opnd2p2
);
66 * set sign bit of result
68 if (Dbl_sign(opnd1p1
) ^ Dbl_sign(opnd2p1
))
69 Dbl_setnegativezerop1(resultp1
);
70 else Dbl_setzerop1(resultp1
);
72 * check first operand for NaN's or infinity
74 if (Dbl_isinfinity_exponent(opnd1p1
)) {
75 if (Dbl_iszero_mantissa(opnd1p1
,opnd1p2
)) {
76 if (Dbl_isnotnan(opnd2p1
,opnd2p2
)) {
77 if (Dbl_iszero_exponentmantissa(opnd2p1
,opnd2p2
)) {
79 * invalid since operands are infinity
82 if (Is_invalidtrap_enabled())
83 return(INVALIDEXCEPTION
);
85 Dbl_makequietnan(resultp1
,resultp2
);
86 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
92 Dbl_setinfinity_exponentmantissa(resultp1
,resultp2
);
93 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
99 * is NaN; signaling or quiet?
101 if (Dbl_isone_signaling(opnd1p1
)) {
102 /* trap if INVALIDTRAP enabled */
103 if (Is_invalidtrap_enabled())
104 return(INVALIDEXCEPTION
);
107 Dbl_set_quiet(opnd1p1
);
110 * is second operand a signaling NaN?
112 else if (Dbl_is_signalingnan(opnd2p1
)) {
113 /* trap if INVALIDTRAP enabled */
114 if (Is_invalidtrap_enabled())
115 return(INVALIDEXCEPTION
);
118 Dbl_set_quiet(opnd2p1
);
119 Dbl_copytoptr(opnd2p1
,opnd2p2
,dstptr
);
125 Dbl_copytoptr(opnd1p1
,opnd1p2
,dstptr
);
130 * check second operand for NaN's or infinity
132 if (Dbl_isinfinity_exponent(opnd2p1
)) {
133 if (Dbl_iszero_mantissa(opnd2p1
,opnd2p2
)) {
134 if (Dbl_iszero_exponentmantissa(opnd1p1
,opnd1p2
)) {
135 /* invalid since operands are zero & infinity */
136 if (Is_invalidtrap_enabled())
137 return(INVALIDEXCEPTION
);
139 Dbl_makequietnan(opnd2p1
,opnd2p2
);
140 Dbl_copytoptr(opnd2p1
,opnd2p2
,dstptr
);
146 Dbl_setinfinity_exponentmantissa(resultp1
,resultp2
);
147 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
151 * is NaN; signaling or quiet?
153 if (Dbl_isone_signaling(opnd2p1
)) {
154 /* trap if INVALIDTRAP enabled */
155 if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION
);
158 Dbl_set_quiet(opnd2p1
);
163 Dbl_copytoptr(opnd2p1
,opnd2p2
,dstptr
);
169 dest_exponent
= Dbl_exponent(opnd1p1
) + Dbl_exponent(opnd2p1
) -DBL_BIAS
;
174 if (Dbl_isnotzero_exponent(opnd1p1
)) {
176 Dbl_clear_signexponent_set_hidden(opnd1p1
);
180 if (Dbl_iszero_mantissa(opnd1p1
,opnd1p2
)) {
181 Dbl_setzero_exponentmantissa(resultp1
,resultp2
);
182 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
185 /* is denormalized, adjust exponent */
186 Dbl_clear_signexponent(opnd1p1
);
187 Dbl_leftshiftby1(opnd1p1
,opnd1p2
);
188 Dbl_normalize(opnd1p1
,opnd1p2
,dest_exponent
);
190 /* opnd2 needs to have hidden bit set with msb in hidden bit */
191 if (Dbl_isnotzero_exponent(opnd2p1
)) {
192 Dbl_clear_signexponent_set_hidden(opnd2p1
);
196 if (Dbl_iszero_mantissa(opnd2p1
,opnd2p2
)) {
197 Dbl_setzero_exponentmantissa(resultp1
,resultp2
);
198 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
201 /* is denormalized; want to normalize */
202 Dbl_clear_signexponent(opnd2p1
);
203 Dbl_leftshiftby1(opnd2p1
,opnd2p2
);
204 Dbl_normalize(opnd2p1
,opnd2p2
,dest_exponent
);
207 /* Multiply two source mantissas together */
209 /* make room for guard bits */
210 Dbl_leftshiftby7(opnd2p1
,opnd2p2
);
211 Dbl_setzero(opnd3p1
,opnd3p2
);
213 * Four bits at a time are inspected in each loop, and a
214 * simple shift and add multiply algorithm is used.
216 for (count
=1;count
<=DBL_P
;count
+=4) {
217 stickybit
|= Dlow4p2(opnd3p2
);
218 Dbl_rightshiftby4(opnd3p1
,opnd3p2
);
219 if (Dbit28p2(opnd1p2
)) {
220 /* Twoword_add should be an ADDC followed by an ADD. */
221 Twoword_add(opnd3p1
, opnd3p2
, opnd2p1
<<3 | opnd2p2
>>29,
224 if (Dbit29p2(opnd1p2
)) {
225 Twoword_add(opnd3p1
, opnd3p2
, opnd2p1
<<2 | opnd2p2
>>30,
228 if (Dbit30p2(opnd1p2
)) {
229 Twoword_add(opnd3p1
, opnd3p2
, opnd2p1
<<1 | opnd2p2
>>31,
232 if (Dbit31p2(opnd1p2
)) {
233 Twoword_add(opnd3p1
, opnd3p2
, opnd2p1
, opnd2p2
);
235 Dbl_rightshiftby4(opnd1p1
,opnd1p2
);
237 if (Dbit3p1(opnd3p1
)==0) {
238 Dbl_leftshiftby1(opnd3p1
,opnd3p2
);
241 /* result mantissa >= 2. */
244 /* check for denormalized result */
245 while (Dbit3p1(opnd3p1
)==0) {
246 Dbl_leftshiftby1(opnd3p1
,opnd3p2
);
250 * check for guard, sticky and inexact bits
252 stickybit
|= Dallp2(opnd3p2
) << 25;
253 guardbit
= (Dallp2(opnd3p2
) << 24) >> 31;
254 inexact
= guardbit
| stickybit
;
256 /* align result mantissa */
257 Dbl_rightshiftby8(opnd3p1
,opnd3p2
);
262 if (inexact
&& (dest_exponent
>0 || Is_underflowtrap_enabled())) {
263 Dbl_clear_signexponent(opnd3p1
);
264 switch (Rounding_mode()) {
266 if (Dbl_iszero_sign(resultp1
))
267 Dbl_increment(opnd3p1
,opnd3p2
);
270 if (Dbl_isone_sign(resultp1
))
271 Dbl_increment(opnd3p1
,opnd3p2
);
275 if (stickybit
|| Dbl_isone_lowmantissap2(opnd3p2
))
276 Dbl_increment(opnd3p1
,opnd3p2
);
279 if (Dbl_isone_hidden(opnd3p1
)) dest_exponent
++;
281 Dbl_set_mantissa(resultp1
,resultp2
,opnd3p1
,opnd3p2
);
286 if (dest_exponent
>= DBL_INFINITY_EXPONENT
) {
287 /* trap if OVERFLOWTRAP enabled */
288 if (Is_overflowtrap_enabled()) {
290 * Adjust bias of result
292 Dbl_setwrapped_exponent(resultp1
,dest_exponent
,ovfl
);
293 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
295 if (Is_inexacttrap_enabled())
296 return (OVERFLOWEXCEPTION
| INEXACTEXCEPTION
);
297 else Set_inexactflag();
298 return (OVERFLOWEXCEPTION
);
302 /* set result to infinity or largest number */
303 Dbl_setoverflow(resultp1
,resultp2
);
308 else if (dest_exponent
<= 0) {
309 /* trap if UNDERFLOWTRAP enabled */
310 if (Is_underflowtrap_enabled()) {
312 * Adjust bias of result
314 Dbl_setwrapped_exponent(resultp1
,dest_exponent
,unfl
);
315 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
317 if (Is_inexacttrap_enabled())
318 return (UNDERFLOWEXCEPTION
| INEXACTEXCEPTION
);
319 else Set_inexactflag();
320 return (UNDERFLOWEXCEPTION
);
323 /* Determine if should set underflow flag */
325 if (dest_exponent
== 0 && inexact
) {
326 switch (Rounding_mode()) {
328 if (Dbl_iszero_sign(resultp1
)) {
329 Dbl_increment(opnd3p1
,opnd3p2
);
330 if (Dbl_isone_hiddenoverflow(opnd3p1
))
332 Dbl_decrement(opnd3p1
,opnd3p2
);
336 if (Dbl_isone_sign(resultp1
)) {
337 Dbl_increment(opnd3p1
,opnd3p2
);
338 if (Dbl_isone_hiddenoverflow(opnd3p1
))
340 Dbl_decrement(opnd3p1
,opnd3p2
);
344 if (guardbit
&& (stickybit
||
345 Dbl_isone_lowmantissap2(opnd3p2
))) {
346 Dbl_increment(opnd3p1
,opnd3p2
);
347 if (Dbl_isone_hiddenoverflow(opnd3p1
))
349 Dbl_decrement(opnd3p1
,opnd3p2
);
356 * denormalize result or set to signed zero
359 Dbl_denormalize(opnd3p1
,opnd3p2
,dest_exponent
,guardbit
,
362 /* return zero or smallest number */
364 switch (Rounding_mode()) {
366 if (Dbl_iszero_sign(resultp1
)) {
367 Dbl_increment(opnd3p1
,opnd3p2
);
371 if (Dbl_isone_sign(resultp1
)) {
372 Dbl_increment(opnd3p1
,opnd3p2
);
376 if (guardbit
&& (stickybit
||
377 Dbl_isone_lowmantissap2(opnd3p2
))) {
378 Dbl_increment(opnd3p1
,opnd3p2
);
382 if (is_tiny
) Set_underflowflag();
384 Dbl_set_exponentmantissa(resultp1
,resultp2
,opnd3p1
,opnd3p2
);
386 else Dbl_set_exponent(resultp1
,dest_exponent
);
387 /* check for inexact */
388 Dbl_copytoptr(resultp1
,resultp2
,dstptr
);
390 if (Is_inexacttrap_enabled()) return(INEXACTEXCEPTION
);
391 else Set_inexactflag();