target/ppc: implement xs[n]maddqp[o]/xs[n]msubqp[o]
[qemu.git] / target / ppc / fpu_helper.c
blob98e9576608f6c69f308c648551f4e7a281020656
1 /*
2 * PowerPC floating point and SPE emulation helpers for QEMU.
4 * Copyright (c) 2003-2007 Jocelyn Mayer
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
19 #include "qemu/osdep.h"
20 #include "cpu.h"
21 #include "exec/helper-proto.h"
22 #include "exec/exec-all.h"
23 #include "internal.h"
24 #include "fpu/softfloat.h"
26 static inline float128 float128_snan_to_qnan(float128 x)
28 float128 r;
30 r.high = x.high | 0x0000800000000000;
31 r.low = x.low;
32 return r;
35 #define float64_snan_to_qnan(x) ((x) | 0x0008000000000000ULL)
36 #define float32_snan_to_qnan(x) ((x) | 0x00400000)
37 #define float16_snan_to_qnan(x) ((x) | 0x0200)
39 static inline bool fp_exceptions_enabled(CPUPPCState *env)
41 #ifdef CONFIG_USER_ONLY
42 return true;
43 #else
44 return (env->msr & ((1U << MSR_FE0) | (1U << MSR_FE1))) != 0;
45 #endif
48 /*****************************************************************************/
49 /* Floating point operations helpers */
52 * This is the non-arithmatic conversion that happens e.g. on loads.
53 * In the Power ISA pseudocode, this is called DOUBLE.
55 uint64_t helper_todouble(uint32_t arg)
57 uint32_t abs_arg = arg & 0x7fffffff;
58 uint64_t ret;
60 if (likely(abs_arg >= 0x00800000)) {
61 if (unlikely(extract32(arg, 23, 8) == 0xff)) {
62 /* Inf or NAN. */
63 ret = (uint64_t)extract32(arg, 31, 1) << 63;
64 ret |= (uint64_t)0x7ff << 52;
65 ret |= (uint64_t)extract32(arg, 0, 23) << 29;
66 } else {
67 /* Normalized operand. */
68 ret = (uint64_t)extract32(arg, 30, 2) << 62;
69 ret |= ((extract32(arg, 30, 1) ^ 1) * (uint64_t)7) << 59;
70 ret |= (uint64_t)extract32(arg, 0, 30) << 29;
72 } else {
73 /* Zero or Denormalized operand. */
74 ret = (uint64_t)extract32(arg, 31, 1) << 63;
75 if (unlikely(abs_arg != 0)) {
77 * Denormalized operand.
78 * Shift fraction so that the msb is in the implicit bit position.
79 * Thus, shift is in the range [1:23].
81 int shift = clz32(abs_arg) - 8;
83 * The first 3 terms compute the float64 exponent. We then bias
84 * this result by -1 so that we can swallow the implicit bit below.
86 int exp = -126 - shift + 1023 - 1;
88 ret |= (uint64_t)exp << 52;
89 ret += (uint64_t)abs_arg << (52 - 23 + shift);
92 return ret;
96 * This is the non-arithmatic conversion that happens e.g. on stores.
97 * In the Power ISA pseudocode, this is called SINGLE.
99 uint32_t helper_tosingle(uint64_t arg)
101 int exp = extract64(arg, 52, 11);
102 uint32_t ret;
104 if (likely(exp > 896)) {
105 /* No denormalization required (includes Inf, NaN). */
106 ret = extract64(arg, 62, 2) << 30;
107 ret |= extract64(arg, 29, 30);
108 } else {
110 * Zero or Denormal result. If the exponent is in bounds for
111 * a single-precision denormal result, extract the proper
112 * bits. If the input is not zero, and the exponent is out of
113 * bounds, then the result is undefined; this underflows to
114 * zero.
116 ret = extract64(arg, 63, 1) << 31;
117 if (unlikely(exp >= 874)) {
118 /* Denormal result. */
119 ret |= ((1ULL << 52) | extract64(arg, 0, 52)) >> (896 + 30 - exp);
122 return ret;
125 static inline int ppc_float32_get_unbiased_exp(float32 f)
127 return ((f >> 23) & 0xFF) - 127;
130 static inline int ppc_float64_get_unbiased_exp(float64 f)
132 return ((f >> 52) & 0x7FF) - 1023;
135 /* Classify a floating-point number. */
136 enum {
137 is_normal = 1,
138 is_zero = 2,
139 is_denormal = 4,
140 is_inf = 8,
141 is_qnan = 16,
142 is_snan = 32,
143 is_neg = 64,
146 #define COMPUTE_CLASS(tp) \
147 static int tp##_classify(tp arg) \
149 int ret = tp##_is_neg(arg) * is_neg; \
150 if (unlikely(tp##_is_any_nan(arg))) { \
151 float_status dummy = { }; /* snan_bit_is_one = 0 */ \
152 ret |= (tp##_is_signaling_nan(arg, &dummy) \
153 ? is_snan : is_qnan); \
154 } else if (unlikely(tp##_is_infinity(arg))) { \
155 ret |= is_inf; \
156 } else if (tp##_is_zero(arg)) { \
157 ret |= is_zero; \
158 } else if (tp##_is_zero_or_denormal(arg)) { \
159 ret |= is_denormal; \
160 } else { \
161 ret |= is_normal; \
163 return ret; \
166 COMPUTE_CLASS(float16)
167 COMPUTE_CLASS(float32)
168 COMPUTE_CLASS(float64)
169 COMPUTE_CLASS(float128)
171 static void set_fprf_from_class(CPUPPCState *env, int class)
173 static const uint8_t fprf[6][2] = {
174 { 0x04, 0x08 }, /* normalized */
175 { 0x02, 0x12 }, /* zero */
176 { 0x14, 0x18 }, /* denormalized */
177 { 0x05, 0x09 }, /* infinity */
178 { 0x11, 0x11 }, /* qnan */
179 { 0x00, 0x00 }, /* snan -- flags are undefined */
181 bool isneg = class & is_neg;
183 env->fpscr &= ~FP_FPRF;
184 env->fpscr |= fprf[ctz32(class)][isneg] << FPSCR_FPRF;
187 #define COMPUTE_FPRF(tp) \
188 void helper_compute_fprf_##tp(CPUPPCState *env, tp arg) \
190 set_fprf_from_class(env, tp##_classify(arg)); \
193 COMPUTE_FPRF(float16)
194 COMPUTE_FPRF(float32)
195 COMPUTE_FPRF(float64)
196 COMPUTE_FPRF(float128)
198 /* Floating-point invalid operations exception */
199 static void finish_invalid_op_excp(CPUPPCState *env, int op, uintptr_t retaddr)
201 /* Update the floating-point invalid operation summary */
202 env->fpscr |= FP_VX;
203 /* Update the floating-point exception summary */
204 env->fpscr |= FP_FX;
205 if (fpscr_ve != 0) {
206 /* Update the floating-point enabled exception summary */
207 env->fpscr |= FP_FEX;
208 if (fp_exceptions_enabled(env)) {
209 raise_exception_err_ra(env, POWERPC_EXCP_PROGRAM,
210 POWERPC_EXCP_FP | op, retaddr);
215 static void finish_invalid_op_arith(CPUPPCState *env, int op,
216 bool set_fpcc, uintptr_t retaddr)
218 env->fpscr &= ~(FP_FR | FP_FI);
219 if (fpscr_ve == 0) {
220 if (set_fpcc) {
221 env->fpscr &= ~FP_FPCC;
222 env->fpscr |= (FP_C | FP_FU);
225 finish_invalid_op_excp(env, op, retaddr);
228 /* Signalling NaN */
229 static void float_invalid_op_vxsnan(CPUPPCState *env, uintptr_t retaddr)
231 env->fpscr |= FP_VXSNAN;
232 finish_invalid_op_excp(env, POWERPC_EXCP_FP_VXSNAN, retaddr);
235 /* Magnitude subtraction of infinities */
236 static void float_invalid_op_vxisi(CPUPPCState *env, bool set_fpcc,
237 uintptr_t retaddr)
239 env->fpscr |= FP_VXISI;
240 finish_invalid_op_arith(env, POWERPC_EXCP_FP_VXISI, set_fpcc, retaddr);
243 /* Division of infinity by infinity */
244 static void float_invalid_op_vxidi(CPUPPCState *env, bool set_fpcc,
245 uintptr_t retaddr)
247 env->fpscr |= FP_VXIDI;
248 finish_invalid_op_arith(env, POWERPC_EXCP_FP_VXIDI, set_fpcc, retaddr);
251 /* Division of zero by zero */
252 static void float_invalid_op_vxzdz(CPUPPCState *env, bool set_fpcc,
253 uintptr_t retaddr)
255 env->fpscr |= FP_VXZDZ;
256 finish_invalid_op_arith(env, POWERPC_EXCP_FP_VXZDZ, set_fpcc, retaddr);
259 /* Multiplication of zero by infinity */
260 static void float_invalid_op_vximz(CPUPPCState *env, bool set_fpcc,
261 uintptr_t retaddr)
263 env->fpscr |= FP_VXIMZ;
264 finish_invalid_op_arith(env, POWERPC_EXCP_FP_VXIMZ, set_fpcc, retaddr);
267 /* Square root of a negative number */
268 static void float_invalid_op_vxsqrt(CPUPPCState *env, bool set_fpcc,
269 uintptr_t retaddr)
271 env->fpscr |= FP_VXSQRT;
272 finish_invalid_op_arith(env, POWERPC_EXCP_FP_VXSQRT, set_fpcc, retaddr);
275 /* Ordered comparison of NaN */
276 static void float_invalid_op_vxvc(CPUPPCState *env, bool set_fpcc,
277 uintptr_t retaddr)
279 env->fpscr |= FP_VXVC;
280 if (set_fpcc) {
281 env->fpscr &= ~FP_FPCC;
282 env->fpscr |= (FP_C | FP_FU);
284 /* Update the floating-point invalid operation summary */
285 env->fpscr |= FP_VX;
286 /* Update the floating-point exception summary */
287 env->fpscr |= FP_FX;
288 /* We must update the target FPR before raising the exception */
289 if (fpscr_ve != 0) {
290 CPUState *cs = env_cpu(env);
292 cs->exception_index = POWERPC_EXCP_PROGRAM;
293 env->error_code = POWERPC_EXCP_FP | POWERPC_EXCP_FP_VXVC;
294 /* Update the floating-point enabled exception summary */
295 env->fpscr |= FP_FEX;
296 /* Exception is deferred */
300 /* Invalid conversion */
301 static void float_invalid_op_vxcvi(CPUPPCState *env, bool set_fpcc,
302 uintptr_t retaddr)
304 env->fpscr |= FP_VXCVI;
305 env->fpscr &= ~(FP_FR | FP_FI);
306 if (fpscr_ve == 0) {
307 if (set_fpcc) {
308 env->fpscr &= ~FP_FPCC;
309 env->fpscr |= (FP_C | FP_FU);
312 finish_invalid_op_excp(env, POWERPC_EXCP_FP_VXCVI, retaddr);
315 static inline void float_zero_divide_excp(CPUPPCState *env, uintptr_t raddr)
317 env->fpscr |= FP_ZX;
318 env->fpscr &= ~(FP_FR | FP_FI);
319 /* Update the floating-point exception summary */
320 env->fpscr |= FP_FX;
321 if (fpscr_ze != 0) {
322 /* Update the floating-point enabled exception summary */
323 env->fpscr |= FP_FEX;
324 if (fp_exceptions_enabled(env)) {
325 raise_exception_err_ra(env, POWERPC_EXCP_PROGRAM,
326 POWERPC_EXCP_FP | POWERPC_EXCP_FP_ZX,
327 raddr);
332 static inline void float_overflow_excp(CPUPPCState *env)
334 CPUState *cs = env_cpu(env);
336 env->fpscr |= FP_OX;
337 /* Update the floating-point exception summary */
338 env->fpscr |= FP_FX;
339 if (fpscr_oe != 0) {
340 /* XXX: should adjust the result */
341 /* Update the floating-point enabled exception summary */
342 env->fpscr |= FP_FEX;
343 /* We must update the target FPR before raising the exception */
344 cs->exception_index = POWERPC_EXCP_PROGRAM;
345 env->error_code = POWERPC_EXCP_FP | POWERPC_EXCP_FP_OX;
346 } else {
347 env->fpscr |= FP_XX;
348 env->fpscr |= FP_FI;
352 static inline void float_underflow_excp(CPUPPCState *env)
354 CPUState *cs = env_cpu(env);
356 env->fpscr |= FP_UX;
357 /* Update the floating-point exception summary */
358 env->fpscr |= FP_FX;
359 if (fpscr_ue != 0) {
360 /* XXX: should adjust the result */
361 /* Update the floating-point enabled exception summary */
362 env->fpscr |= FP_FEX;
363 /* We must update the target FPR before raising the exception */
364 cs->exception_index = POWERPC_EXCP_PROGRAM;
365 env->error_code = POWERPC_EXCP_FP | POWERPC_EXCP_FP_UX;
369 static inline void float_inexact_excp(CPUPPCState *env)
371 CPUState *cs = env_cpu(env);
373 env->fpscr |= FP_FI;
374 env->fpscr |= FP_XX;
375 /* Update the floating-point exception summary */
376 env->fpscr |= FP_FX;
377 if (fpscr_xe != 0) {
378 /* Update the floating-point enabled exception summary */
379 env->fpscr |= FP_FEX;
380 /* We must update the target FPR before raising the exception */
381 cs->exception_index = POWERPC_EXCP_PROGRAM;
382 env->error_code = POWERPC_EXCP_FP | POWERPC_EXCP_FP_XX;
386 void helper_fpscr_clrbit(CPUPPCState *env, uint32_t bit)
388 uint32_t mask = 1u << bit;
389 if (env->fpscr & mask) {
390 ppc_store_fpscr(env, env->fpscr & ~(target_ulong)mask);
394 void helper_fpscr_setbit(CPUPPCState *env, uint32_t bit)
396 uint32_t mask = 1u << bit;
397 if (!(env->fpscr & mask)) {
398 ppc_store_fpscr(env, env->fpscr | mask);
402 void helper_store_fpscr(CPUPPCState *env, uint64_t val, uint32_t nibbles)
404 target_ulong mask = 0;
405 int i;
407 /* TODO: push this extension back to translation time */
408 for (i = 0; i < sizeof(target_ulong) * 2; i++) {
409 if (nibbles & (1 << i)) {
410 mask |= (target_ulong) 0xf << (4 * i);
413 val = (val & mask) | (env->fpscr & ~mask);
414 ppc_store_fpscr(env, val);
417 void helper_fpscr_check_status(CPUPPCState *env)
419 CPUState *cs = env_cpu(env);
420 target_ulong fpscr = env->fpscr;
421 int error = 0;
423 if ((fpscr & FP_OX) && (fpscr & FP_OE)) {
424 error = POWERPC_EXCP_FP_OX;
425 } else if ((fpscr & FP_UX) && (fpscr & FP_UE)) {
426 error = POWERPC_EXCP_FP_UX;
427 } else if ((fpscr & FP_XX) && (fpscr & FP_XE)) {
428 error = POWERPC_EXCP_FP_XX;
429 } else if ((fpscr & FP_ZX) && (fpscr & FP_ZE)) {
430 error = POWERPC_EXCP_FP_ZX;
431 } else if (fpscr & FP_VE) {
432 if (fpscr & FP_VXSOFT) {
433 error = POWERPC_EXCP_FP_VXSOFT;
434 } else if (fpscr & FP_VXSNAN) {
435 error = POWERPC_EXCP_FP_VXSNAN;
436 } else if (fpscr & FP_VXISI) {
437 error = POWERPC_EXCP_FP_VXISI;
438 } else if (fpscr & FP_VXIDI) {
439 error = POWERPC_EXCP_FP_VXIDI;
440 } else if (fpscr & FP_VXZDZ) {
441 error = POWERPC_EXCP_FP_VXZDZ;
442 } else if (fpscr & FP_VXIMZ) {
443 error = POWERPC_EXCP_FP_VXIMZ;
444 } else if (fpscr & FP_VXVC) {
445 error = POWERPC_EXCP_FP_VXVC;
446 } else if (fpscr & FP_VXSQRT) {
447 error = POWERPC_EXCP_FP_VXSQRT;
448 } else if (fpscr & FP_VXCVI) {
449 error = POWERPC_EXCP_FP_VXCVI;
450 } else {
451 return;
453 } else {
454 return;
456 cs->exception_index = POWERPC_EXCP_PROGRAM;
457 env->error_code = error | POWERPC_EXCP_FP;
458 /* Deferred floating-point exception after target FPSCR update */
459 if (fp_exceptions_enabled(env)) {
460 raise_exception_err_ra(env, cs->exception_index,
461 env->error_code, GETPC());
465 static void do_float_check_status(CPUPPCState *env, uintptr_t raddr)
467 CPUState *cs = env_cpu(env);
468 int status = get_float_exception_flags(&env->fp_status);
470 if (status & float_flag_overflow) {
471 float_overflow_excp(env);
472 } else if (status & float_flag_underflow) {
473 float_underflow_excp(env);
475 if (status & float_flag_inexact) {
476 float_inexact_excp(env);
477 } else {
478 env->fpscr &= ~FP_FI; /* clear the FPSCR[FI] bit */
481 if (cs->exception_index == POWERPC_EXCP_PROGRAM &&
482 (env->error_code & POWERPC_EXCP_FP)) {
483 /* Deferred floating-point exception after target FPR update */
484 if (fp_exceptions_enabled(env)) {
485 raise_exception_err_ra(env, cs->exception_index,
486 env->error_code, raddr);
491 void helper_float_check_status(CPUPPCState *env)
493 do_float_check_status(env, GETPC());
496 void helper_reset_fpstatus(CPUPPCState *env)
498 set_float_exception_flags(0, &env->fp_status);
501 static void float_invalid_op_addsub(CPUPPCState *env, int flags,
502 bool set_fpcc, uintptr_t retaddr)
504 if (flags & float_flag_invalid_isi) {
505 float_invalid_op_vxisi(env, set_fpcc, retaddr);
506 } else if (flags & float_flag_invalid_snan) {
507 float_invalid_op_vxsnan(env, retaddr);
511 /* fadd - fadd. */
512 float64 helper_fadd(CPUPPCState *env, float64 arg1, float64 arg2)
514 float64 ret = float64_add(arg1, arg2, &env->fp_status);
515 int flags = get_float_exception_flags(&env->fp_status);
517 if (unlikely(flags & float_flag_invalid)) {
518 float_invalid_op_addsub(env, flags, 1, GETPC());
521 return ret;
524 /* fadds - fadds. */
525 float64 helper_fadds(CPUPPCState *env, float64 arg1, float64 arg2)
527 float64 ret = float64r32_add(arg1, arg2, &env->fp_status);
528 int flags = get_float_exception_flags(&env->fp_status);
530 if (unlikely(flags & float_flag_invalid)) {
531 float_invalid_op_addsub(env, flags, 1, GETPC());
533 return ret;
536 /* fsub - fsub. */
537 float64 helper_fsub(CPUPPCState *env, float64 arg1, float64 arg2)
539 float64 ret = float64_sub(arg1, arg2, &env->fp_status);
540 int flags = get_float_exception_flags(&env->fp_status);
542 if (unlikely(flags & float_flag_invalid)) {
543 float_invalid_op_addsub(env, flags, 1, GETPC());
546 return ret;
549 /* fsubs - fsubs. */
550 float64 helper_fsubs(CPUPPCState *env, float64 arg1, float64 arg2)
552 float64 ret = float64r32_sub(arg1, arg2, &env->fp_status);
553 int flags = get_float_exception_flags(&env->fp_status);
555 if (unlikely(flags & float_flag_invalid)) {
556 float_invalid_op_addsub(env, flags, 1, GETPC());
558 return ret;
561 static void float_invalid_op_mul(CPUPPCState *env, int flags,
562 bool set_fprc, uintptr_t retaddr)
564 if (flags & float_flag_invalid_imz) {
565 float_invalid_op_vximz(env, set_fprc, retaddr);
566 } else if (flags & float_flag_invalid_snan) {
567 float_invalid_op_vxsnan(env, retaddr);
571 /* fmul - fmul. */
572 float64 helper_fmul(CPUPPCState *env, float64 arg1, float64 arg2)
574 float64 ret = float64_mul(arg1, arg2, &env->fp_status);
575 int flags = get_float_exception_flags(&env->fp_status);
577 if (unlikely(flags & float_flag_invalid)) {
578 float_invalid_op_mul(env, flags, 1, GETPC());
581 return ret;
584 /* fmuls - fmuls. */
585 float64 helper_fmuls(CPUPPCState *env, float64 arg1, float64 arg2)
587 float64 ret = float64r32_mul(arg1, arg2, &env->fp_status);
588 int flags = get_float_exception_flags(&env->fp_status);
590 if (unlikely(flags & float_flag_invalid)) {
591 float_invalid_op_mul(env, flags, 1, GETPC());
593 return ret;
596 static void float_invalid_op_div(CPUPPCState *env, int flags,
597 bool set_fprc, uintptr_t retaddr)
599 if (flags & float_flag_invalid_idi) {
600 float_invalid_op_vxidi(env, set_fprc, retaddr);
601 } else if (flags & float_flag_invalid_zdz) {
602 float_invalid_op_vxzdz(env, set_fprc, retaddr);
603 } else if (flags & float_flag_invalid_snan) {
604 float_invalid_op_vxsnan(env, retaddr);
608 /* fdiv - fdiv. */
609 float64 helper_fdiv(CPUPPCState *env, float64 arg1, float64 arg2)
611 float64 ret = float64_div(arg1, arg2, &env->fp_status);
612 int flags = get_float_exception_flags(&env->fp_status);
614 if (unlikely(flags & float_flag_invalid)) {
615 float_invalid_op_div(env, flags, 1, GETPC());
617 if (unlikely(flags & float_flag_divbyzero)) {
618 float_zero_divide_excp(env, GETPC());
621 return ret;
624 /* fdivs - fdivs. */
625 float64 helper_fdivs(CPUPPCState *env, float64 arg1, float64 arg2)
627 float64 ret = float64r32_div(arg1, arg2, &env->fp_status);
628 int flags = get_float_exception_flags(&env->fp_status);
630 if (unlikely(flags & float_flag_invalid)) {
631 float_invalid_op_div(env, flags, 1, GETPC());
633 if (unlikely(flags & float_flag_divbyzero)) {
634 float_zero_divide_excp(env, GETPC());
637 return ret;
640 static uint64_t float_invalid_cvt(CPUPPCState *env, int flags,
641 uint64_t ret, uint64_t ret_nan,
642 bool set_fprc, uintptr_t retaddr)
645 * VXCVI is different from most in that it sets two exception bits,
646 * VXCVI and VXSNAN for an SNaN input.
648 if (flags & float_flag_invalid_snan) {
649 env->fpscr |= FP_VXSNAN;
651 float_invalid_op_vxcvi(env, set_fprc, retaddr);
653 return flags & float_flag_invalid_cvti ? ret : ret_nan;
656 #define FPU_FCTI(op, cvt, nanval) \
657 uint64_t helper_##op(CPUPPCState *env, float64 arg) \
659 uint64_t ret = float64_to_##cvt(arg, &env->fp_status); \
660 int flags = get_float_exception_flags(&env->fp_status); \
661 if (unlikely(flags & float_flag_invalid)) { \
662 ret = float_invalid_cvt(env, flags, ret, nanval, 1, GETPC()); \
664 return ret; \
667 FPU_FCTI(fctiw, int32, 0x80000000U)
668 FPU_FCTI(fctiwz, int32_round_to_zero, 0x80000000U)
669 FPU_FCTI(fctiwu, uint32, 0x00000000U)
670 FPU_FCTI(fctiwuz, uint32_round_to_zero, 0x00000000U)
671 FPU_FCTI(fctid, int64, 0x8000000000000000ULL)
672 FPU_FCTI(fctidz, int64_round_to_zero, 0x8000000000000000ULL)
673 FPU_FCTI(fctidu, uint64, 0x0000000000000000ULL)
674 FPU_FCTI(fctiduz, uint64_round_to_zero, 0x0000000000000000ULL)
676 #define FPU_FCFI(op, cvtr, is_single) \
677 uint64_t helper_##op(CPUPPCState *env, uint64_t arg) \
679 CPU_DoubleU farg; \
681 if (is_single) { \
682 float32 tmp = cvtr(arg, &env->fp_status); \
683 farg.d = float32_to_float64(tmp, &env->fp_status); \
684 } else { \
685 farg.d = cvtr(arg, &env->fp_status); \
687 do_float_check_status(env, GETPC()); \
688 return farg.ll; \
691 FPU_FCFI(fcfid, int64_to_float64, 0)
692 FPU_FCFI(fcfids, int64_to_float32, 1)
693 FPU_FCFI(fcfidu, uint64_to_float64, 0)
694 FPU_FCFI(fcfidus, uint64_to_float32, 1)
696 static uint64_t do_fri(CPUPPCState *env, uint64_t arg,
697 FloatRoundMode rounding_mode)
699 FloatRoundMode old_rounding_mode = get_float_rounding_mode(&env->fp_status);
700 int flags;
702 set_float_rounding_mode(rounding_mode, &env->fp_status);
703 arg = float64_round_to_int(arg, &env->fp_status);
704 set_float_rounding_mode(old_rounding_mode, &env->fp_status);
706 flags = get_float_exception_flags(&env->fp_status);
707 if (flags & float_flag_invalid_snan) {
708 float_invalid_op_vxsnan(env, GETPC());
711 /* fri* does not set FPSCR[XX] */
712 set_float_exception_flags(flags & ~float_flag_inexact, &env->fp_status);
713 do_float_check_status(env, GETPC());
715 return arg;
718 uint64_t helper_frin(CPUPPCState *env, uint64_t arg)
720 return do_fri(env, arg, float_round_ties_away);
723 uint64_t helper_friz(CPUPPCState *env, uint64_t arg)
725 return do_fri(env, arg, float_round_to_zero);
728 uint64_t helper_frip(CPUPPCState *env, uint64_t arg)
730 return do_fri(env, arg, float_round_up);
733 uint64_t helper_frim(CPUPPCState *env, uint64_t arg)
735 return do_fri(env, arg, float_round_down);
738 static void float_invalid_op_madd(CPUPPCState *env, int flags,
739 bool set_fpcc, uintptr_t retaddr)
741 if (flags & float_flag_invalid_imz) {
742 float_invalid_op_vximz(env, set_fpcc, retaddr);
743 } else {
744 float_invalid_op_addsub(env, flags, set_fpcc, retaddr);
748 static float64 do_fmadd(CPUPPCState *env, float64 a, float64 b,
749 float64 c, int madd_flags, uintptr_t retaddr)
751 float64 ret = float64_muladd(a, b, c, madd_flags, &env->fp_status);
752 int flags = get_float_exception_flags(&env->fp_status);
754 if (unlikely(flags & float_flag_invalid)) {
755 float_invalid_op_madd(env, flags, 1, retaddr);
757 return ret;
760 static uint64_t do_fmadds(CPUPPCState *env, float64 a, float64 b,
761 float64 c, int madd_flags, uintptr_t retaddr)
763 float64 ret = float64r32_muladd(a, b, c, madd_flags, &env->fp_status);
764 int flags = get_float_exception_flags(&env->fp_status);
766 if (unlikely(flags & float_flag_invalid)) {
767 float_invalid_op_madd(env, flags, 1, retaddr);
769 return ret;
772 #define FPU_FMADD(op, madd_flags) \
773 uint64_t helper_##op(CPUPPCState *env, uint64_t arg1, \
774 uint64_t arg2, uint64_t arg3) \
775 { return do_fmadd(env, arg1, arg2, arg3, madd_flags, GETPC()); } \
776 uint64_t helper_##op##s(CPUPPCState *env, uint64_t arg1, \
777 uint64_t arg2, uint64_t arg3) \
778 { return do_fmadds(env, arg1, arg2, arg3, madd_flags, GETPC()); }
780 #define MADD_FLGS 0
781 #define MSUB_FLGS float_muladd_negate_c
782 #define NMADD_FLGS float_muladd_negate_result
783 #define NMSUB_FLGS (float_muladd_negate_c | float_muladd_negate_result)
785 FPU_FMADD(fmadd, MADD_FLGS)
786 FPU_FMADD(fnmadd, NMADD_FLGS)
787 FPU_FMADD(fmsub, MSUB_FLGS)
788 FPU_FMADD(fnmsub, NMSUB_FLGS)
790 /* frsp - frsp. */
791 static uint64_t do_frsp(CPUPPCState *env, uint64_t arg, uintptr_t retaddr)
793 float32 f32 = float64_to_float32(arg, &env->fp_status);
794 int flags = get_float_exception_flags(&env->fp_status);
796 if (unlikely(flags & float_flag_invalid_snan)) {
797 float_invalid_op_vxsnan(env, retaddr);
799 return helper_todouble(f32);
802 uint64_t helper_frsp(CPUPPCState *env, uint64_t arg)
804 return do_frsp(env, arg, GETPC());
807 static void float_invalid_op_sqrt(CPUPPCState *env, int flags,
808 bool set_fpcc, uintptr_t retaddr)
810 if (unlikely(flags & float_flag_invalid_sqrt)) {
811 float_invalid_op_vxsqrt(env, set_fpcc, retaddr);
812 } else if (unlikely(flags & float_flag_invalid_snan)) {
813 float_invalid_op_vxsnan(env, retaddr);
817 /* fsqrt - fsqrt. */
818 float64 helper_fsqrt(CPUPPCState *env, float64 arg)
820 float64 ret = float64_sqrt(arg, &env->fp_status);
821 int flags = get_float_exception_flags(&env->fp_status);
823 if (unlikely(flags & float_flag_invalid)) {
824 float_invalid_op_sqrt(env, flags, 1, GETPC());
827 return ret;
830 /* fsqrts - fsqrts. */
831 float64 helper_fsqrts(CPUPPCState *env, float64 arg)
833 float64 ret = float64r32_sqrt(arg, &env->fp_status);
834 int flags = get_float_exception_flags(&env->fp_status);
836 if (unlikely(flags & float_flag_invalid)) {
837 float_invalid_op_sqrt(env, flags, 1, GETPC());
839 return ret;
842 /* fre - fre. */
843 float64 helper_fre(CPUPPCState *env, float64 arg)
845 /* "Estimate" the reciprocal with actual division. */
846 float64 ret = float64_div(float64_one, arg, &env->fp_status);
847 int flags = get_float_exception_flags(&env->fp_status);
849 if (unlikely(flags & float_flag_invalid_snan)) {
850 float_invalid_op_vxsnan(env, GETPC());
852 if (unlikely(flags & float_flag_divbyzero)) {
853 float_zero_divide_excp(env, GETPC());
854 /* For FPSCR.ZE == 0, the result is 1/2. */
855 ret = float64_set_sign(float64_half, float64_is_neg(arg));
858 return ret;
861 /* fres - fres. */
862 uint64_t helper_fres(CPUPPCState *env, uint64_t arg)
864 /* "Estimate" the reciprocal with actual division. */
865 float64 ret = float64r32_div(float64_one, arg, &env->fp_status);
866 int flags = get_float_exception_flags(&env->fp_status);
868 if (unlikely(flags & float_flag_invalid_snan)) {
869 float_invalid_op_vxsnan(env, GETPC());
871 if (unlikely(flags & float_flag_divbyzero)) {
872 float_zero_divide_excp(env, GETPC());
873 /* For FPSCR.ZE == 0, the result is 1/2. */
874 ret = float64_set_sign(float64_half, float64_is_neg(arg));
877 return ret;
880 /* frsqrte - frsqrte. */
881 float64 helper_frsqrte(CPUPPCState *env, float64 arg)
883 /* "Estimate" the reciprocal with actual division. */
884 float64 rets = float64_sqrt(arg, &env->fp_status);
885 float64 retd = float64_div(float64_one, rets, &env->fp_status);
886 int flags = get_float_exception_flags(&env->fp_status);
888 if (unlikely(flags & float_flag_invalid)) {
889 float_invalid_op_sqrt(env, flags, 1, GETPC());
891 if (unlikely(flags & float_flag_divbyzero)) {
892 /* Reciprocal of (square root of) zero. */
893 float_zero_divide_excp(env, GETPC());
896 return retd;
899 /* frsqrtes - frsqrtes. */
900 float64 helper_frsqrtes(CPUPPCState *env, float64 arg)
902 /* "Estimate" the reciprocal with actual division. */
903 float64 rets = float64_sqrt(arg, &env->fp_status);
904 float64 retd = float64r32_div(float64_one, rets, &env->fp_status);
905 int flags = get_float_exception_flags(&env->fp_status);
907 if (unlikely(flags & float_flag_invalid)) {
908 float_invalid_op_sqrt(env, flags, 1, GETPC());
910 if (unlikely(flags & float_flag_divbyzero)) {
911 /* Reciprocal of (square root of) zero. */
912 float_zero_divide_excp(env, GETPC());
915 return retd;
918 /* fsel - fsel. */
919 uint64_t helper_fsel(CPUPPCState *env, uint64_t arg1, uint64_t arg2,
920 uint64_t arg3)
922 CPU_DoubleU farg1;
924 farg1.ll = arg1;
926 if ((!float64_is_neg(farg1.d) || float64_is_zero(farg1.d)) &&
927 !float64_is_any_nan(farg1.d)) {
928 return arg2;
929 } else {
930 return arg3;
934 uint32_t helper_ftdiv(uint64_t fra, uint64_t frb)
936 int fe_flag = 0;
937 int fg_flag = 0;
939 if (unlikely(float64_is_infinity(fra) ||
940 float64_is_infinity(frb) ||
941 float64_is_zero(frb))) {
942 fe_flag = 1;
943 fg_flag = 1;
944 } else {
945 int e_a = ppc_float64_get_unbiased_exp(fra);
946 int e_b = ppc_float64_get_unbiased_exp(frb);
948 if (unlikely(float64_is_any_nan(fra) ||
949 float64_is_any_nan(frb))) {
950 fe_flag = 1;
951 } else if ((e_b <= -1022) || (e_b >= 1021)) {
952 fe_flag = 1;
953 } else if (!float64_is_zero(fra) &&
954 (((e_a - e_b) >= 1023) ||
955 ((e_a - e_b) <= -1021) ||
956 (e_a <= -970))) {
957 fe_flag = 1;
960 if (unlikely(float64_is_zero_or_denormal(frb))) {
961 /* XB is not zero because of the above check and */
962 /* so must be denormalized. */
963 fg_flag = 1;
967 return 0x8 | (fg_flag ? 4 : 0) | (fe_flag ? 2 : 0);
970 uint32_t helper_ftsqrt(uint64_t frb)
972 int fe_flag = 0;
973 int fg_flag = 0;
975 if (unlikely(float64_is_infinity(frb) || float64_is_zero(frb))) {
976 fe_flag = 1;
977 fg_flag = 1;
978 } else {
979 int e_b = ppc_float64_get_unbiased_exp(frb);
981 if (unlikely(float64_is_any_nan(frb))) {
982 fe_flag = 1;
983 } else if (unlikely(float64_is_zero(frb))) {
984 fe_flag = 1;
985 } else if (unlikely(float64_is_neg(frb))) {
986 fe_flag = 1;
987 } else if (!float64_is_zero(frb) && (e_b <= (-1022 + 52))) {
988 fe_flag = 1;
991 if (unlikely(float64_is_zero_or_denormal(frb))) {
992 /* XB is not zero because of the above check and */
993 /* therefore must be denormalized. */
994 fg_flag = 1;
998 return 0x8 | (fg_flag ? 4 : 0) | (fe_flag ? 2 : 0);
1001 void helper_fcmpu(CPUPPCState *env, uint64_t arg1, uint64_t arg2,
1002 uint32_t crfD)
1004 CPU_DoubleU farg1, farg2;
1005 uint32_t ret = 0;
1007 farg1.ll = arg1;
1008 farg2.ll = arg2;
1010 if (unlikely(float64_is_any_nan(farg1.d) ||
1011 float64_is_any_nan(farg2.d))) {
1012 ret = 0x01UL;
1013 } else if (float64_lt(farg1.d, farg2.d, &env->fp_status)) {
1014 ret = 0x08UL;
1015 } else if (!float64_le(farg1.d, farg2.d, &env->fp_status)) {
1016 ret = 0x04UL;
1017 } else {
1018 ret = 0x02UL;
1021 env->fpscr &= ~FP_FPCC;
1022 env->fpscr |= ret << FPSCR_FPCC;
1023 env->crf[crfD] = ret;
1024 if (unlikely(ret == 0x01UL
1025 && (float64_is_signaling_nan(farg1.d, &env->fp_status) ||
1026 float64_is_signaling_nan(farg2.d, &env->fp_status)))) {
1027 /* sNaN comparison */
1028 float_invalid_op_vxsnan(env, GETPC());
1032 void helper_fcmpo(CPUPPCState *env, uint64_t arg1, uint64_t arg2,
1033 uint32_t crfD)
1035 CPU_DoubleU farg1, farg2;
1036 uint32_t ret = 0;
1038 farg1.ll = arg1;
1039 farg2.ll = arg2;
1041 if (unlikely(float64_is_any_nan(farg1.d) ||
1042 float64_is_any_nan(farg2.d))) {
1043 ret = 0x01UL;
1044 } else if (float64_lt(farg1.d, farg2.d, &env->fp_status)) {
1045 ret = 0x08UL;
1046 } else if (!float64_le(farg1.d, farg2.d, &env->fp_status)) {
1047 ret = 0x04UL;
1048 } else {
1049 ret = 0x02UL;
1052 env->fpscr &= ~FP_FPCC;
1053 env->fpscr |= ret << FPSCR_FPCC;
1054 env->crf[crfD] = (uint32_t) ret;
1055 if (unlikely(ret == 0x01UL)) {
1056 float_invalid_op_vxvc(env, 1, GETPC());
1057 if (float64_is_signaling_nan(farg1.d, &env->fp_status) ||
1058 float64_is_signaling_nan(farg2.d, &env->fp_status)) {
1059 /* sNaN comparison */
1060 float_invalid_op_vxsnan(env, GETPC());
1065 /* Single-precision floating-point conversions */
1066 static inline uint32_t efscfsi(CPUPPCState *env, uint32_t val)
1068 CPU_FloatU u;
1070 u.f = int32_to_float32(val, &env->vec_status);
1072 return u.l;
1075 static inline uint32_t efscfui(CPUPPCState *env, uint32_t val)
1077 CPU_FloatU u;
1079 u.f = uint32_to_float32(val, &env->vec_status);
1081 return u.l;
1084 static inline int32_t efsctsi(CPUPPCState *env, uint32_t val)
1086 CPU_FloatU u;
1088 u.l = val;
1089 /* NaN are not treated the same way IEEE 754 does */
1090 if (unlikely(float32_is_quiet_nan(u.f, &env->vec_status))) {
1091 return 0;
1094 return float32_to_int32(u.f, &env->vec_status);
1097 static inline uint32_t efsctui(CPUPPCState *env, uint32_t val)
1099 CPU_FloatU u;
1101 u.l = val;
1102 /* NaN are not treated the same way IEEE 754 does */
1103 if (unlikely(float32_is_quiet_nan(u.f, &env->vec_status))) {
1104 return 0;
1107 return float32_to_uint32(u.f, &env->vec_status);
1110 static inline uint32_t efsctsiz(CPUPPCState *env, uint32_t val)
1112 CPU_FloatU u;
1114 u.l = val;
1115 /* NaN are not treated the same way IEEE 754 does */
1116 if (unlikely(float32_is_quiet_nan(u.f, &env->vec_status))) {
1117 return 0;
1120 return float32_to_int32_round_to_zero(u.f, &env->vec_status);
1123 static inline uint32_t efsctuiz(CPUPPCState *env, uint32_t val)
1125 CPU_FloatU u;
1127 u.l = val;
1128 /* NaN are not treated the same way IEEE 754 does */
1129 if (unlikely(float32_is_quiet_nan(u.f, &env->vec_status))) {
1130 return 0;
1133 return float32_to_uint32_round_to_zero(u.f, &env->vec_status);
1136 static inline uint32_t efscfsf(CPUPPCState *env, uint32_t val)
1138 CPU_FloatU u;
1139 float32 tmp;
1141 u.f = int32_to_float32(val, &env->vec_status);
1142 tmp = int64_to_float32(1ULL << 32, &env->vec_status);
1143 u.f = float32_div(u.f, tmp, &env->vec_status);
1145 return u.l;
1148 static inline uint32_t efscfuf(CPUPPCState *env, uint32_t val)
1150 CPU_FloatU u;
1151 float32 tmp;
1153 u.f = uint32_to_float32(val, &env->vec_status);
1154 tmp = uint64_to_float32(1ULL << 32, &env->vec_status);
1155 u.f = float32_div(u.f, tmp, &env->vec_status);
1157 return u.l;
1160 static inline uint32_t efsctsf(CPUPPCState *env, uint32_t val)
1162 CPU_FloatU u;
1163 float32 tmp;
1165 u.l = val;
1166 /* NaN are not treated the same way IEEE 754 does */
1167 if (unlikely(float32_is_quiet_nan(u.f, &env->vec_status))) {
1168 return 0;
1170 tmp = uint64_to_float32(1ULL << 32, &env->vec_status);
1171 u.f = float32_mul(u.f, tmp, &env->vec_status);
1173 return float32_to_int32(u.f, &env->vec_status);
1176 static inline uint32_t efsctuf(CPUPPCState *env, uint32_t val)
1178 CPU_FloatU u;
1179 float32 tmp;
1181 u.l = val;
1182 /* NaN are not treated the same way IEEE 754 does */
1183 if (unlikely(float32_is_quiet_nan(u.f, &env->vec_status))) {
1184 return 0;
1186 tmp = uint64_to_float32(1ULL << 32, &env->vec_status);
1187 u.f = float32_mul(u.f, tmp, &env->vec_status);
1189 return float32_to_uint32(u.f, &env->vec_status);
1192 #define HELPER_SPE_SINGLE_CONV(name) \
1193 uint32_t helper_e##name(CPUPPCState *env, uint32_t val) \
1195 return e##name(env, val); \
1197 /* efscfsi */
1198 HELPER_SPE_SINGLE_CONV(fscfsi);
1199 /* efscfui */
1200 HELPER_SPE_SINGLE_CONV(fscfui);
1201 /* efscfuf */
1202 HELPER_SPE_SINGLE_CONV(fscfuf);
1203 /* efscfsf */
1204 HELPER_SPE_SINGLE_CONV(fscfsf);
1205 /* efsctsi */
1206 HELPER_SPE_SINGLE_CONV(fsctsi);
1207 /* efsctui */
1208 HELPER_SPE_SINGLE_CONV(fsctui);
1209 /* efsctsiz */
1210 HELPER_SPE_SINGLE_CONV(fsctsiz);
1211 /* efsctuiz */
1212 HELPER_SPE_SINGLE_CONV(fsctuiz);
1213 /* efsctsf */
1214 HELPER_SPE_SINGLE_CONV(fsctsf);
1215 /* efsctuf */
1216 HELPER_SPE_SINGLE_CONV(fsctuf);
1218 #define HELPER_SPE_VECTOR_CONV(name) \
1219 uint64_t helper_ev##name(CPUPPCState *env, uint64_t val) \
1221 return ((uint64_t)e##name(env, val >> 32) << 32) | \
1222 (uint64_t)e##name(env, val); \
1224 /* evfscfsi */
1225 HELPER_SPE_VECTOR_CONV(fscfsi);
1226 /* evfscfui */
1227 HELPER_SPE_VECTOR_CONV(fscfui);
1228 /* evfscfuf */
1229 HELPER_SPE_VECTOR_CONV(fscfuf);
1230 /* evfscfsf */
1231 HELPER_SPE_VECTOR_CONV(fscfsf);
1232 /* evfsctsi */
1233 HELPER_SPE_VECTOR_CONV(fsctsi);
1234 /* evfsctui */
1235 HELPER_SPE_VECTOR_CONV(fsctui);
1236 /* evfsctsiz */
1237 HELPER_SPE_VECTOR_CONV(fsctsiz);
1238 /* evfsctuiz */
1239 HELPER_SPE_VECTOR_CONV(fsctuiz);
1240 /* evfsctsf */
1241 HELPER_SPE_VECTOR_CONV(fsctsf);
1242 /* evfsctuf */
1243 HELPER_SPE_VECTOR_CONV(fsctuf);
1245 /* Single-precision floating-point arithmetic */
1246 static inline uint32_t efsadd(CPUPPCState *env, uint32_t op1, uint32_t op2)
1248 CPU_FloatU u1, u2;
1250 u1.l = op1;
1251 u2.l = op2;
1252 u1.f = float32_add(u1.f, u2.f, &env->vec_status);
1253 return u1.l;
1256 static inline uint32_t efssub(CPUPPCState *env, uint32_t op1, uint32_t op2)
1258 CPU_FloatU u1, u2;
1260 u1.l = op1;
1261 u2.l = op2;
1262 u1.f = float32_sub(u1.f, u2.f, &env->vec_status);
1263 return u1.l;
1266 static inline uint32_t efsmul(CPUPPCState *env, uint32_t op1, uint32_t op2)
1268 CPU_FloatU u1, u2;
1270 u1.l = op1;
1271 u2.l = op2;
1272 u1.f = float32_mul(u1.f, u2.f, &env->vec_status);
1273 return u1.l;
1276 static inline uint32_t efsdiv(CPUPPCState *env, uint32_t op1, uint32_t op2)
1278 CPU_FloatU u1, u2;
1280 u1.l = op1;
1281 u2.l = op2;
1282 u1.f = float32_div(u1.f, u2.f, &env->vec_status);
1283 return u1.l;
1286 #define HELPER_SPE_SINGLE_ARITH(name) \
1287 uint32_t helper_e##name(CPUPPCState *env, uint32_t op1, uint32_t op2) \
1289 return e##name(env, op1, op2); \
1291 /* efsadd */
1292 HELPER_SPE_SINGLE_ARITH(fsadd);
1293 /* efssub */
1294 HELPER_SPE_SINGLE_ARITH(fssub);
1295 /* efsmul */
1296 HELPER_SPE_SINGLE_ARITH(fsmul);
1297 /* efsdiv */
1298 HELPER_SPE_SINGLE_ARITH(fsdiv);
1300 #define HELPER_SPE_VECTOR_ARITH(name) \
1301 uint64_t helper_ev##name(CPUPPCState *env, uint64_t op1, uint64_t op2) \
1303 return ((uint64_t)e##name(env, op1 >> 32, op2 >> 32) << 32) | \
1304 (uint64_t)e##name(env, op1, op2); \
1306 /* evfsadd */
1307 HELPER_SPE_VECTOR_ARITH(fsadd);
1308 /* evfssub */
1309 HELPER_SPE_VECTOR_ARITH(fssub);
1310 /* evfsmul */
1311 HELPER_SPE_VECTOR_ARITH(fsmul);
1312 /* evfsdiv */
1313 HELPER_SPE_VECTOR_ARITH(fsdiv);
1315 /* Single-precision floating-point comparisons */
1316 static inline uint32_t efscmplt(CPUPPCState *env, uint32_t op1, uint32_t op2)
1318 CPU_FloatU u1, u2;
1320 u1.l = op1;
1321 u2.l = op2;
1322 return float32_lt(u1.f, u2.f, &env->vec_status) ? 4 : 0;
1325 static inline uint32_t efscmpgt(CPUPPCState *env, uint32_t op1, uint32_t op2)
1327 CPU_FloatU u1, u2;
1329 u1.l = op1;
1330 u2.l = op2;
1331 return float32_le(u1.f, u2.f, &env->vec_status) ? 0 : 4;
1334 static inline uint32_t efscmpeq(CPUPPCState *env, uint32_t op1, uint32_t op2)
1336 CPU_FloatU u1, u2;
1338 u1.l = op1;
1339 u2.l = op2;
1340 return float32_eq(u1.f, u2.f, &env->vec_status) ? 4 : 0;
1343 static inline uint32_t efststlt(CPUPPCState *env, uint32_t op1, uint32_t op2)
1345 /* XXX: TODO: ignore special values (NaN, infinites, ...) */
1346 return efscmplt(env, op1, op2);
1349 static inline uint32_t efststgt(CPUPPCState *env, uint32_t op1, uint32_t op2)
1351 /* XXX: TODO: ignore special values (NaN, infinites, ...) */
1352 return efscmpgt(env, op1, op2);
1355 static inline uint32_t efststeq(CPUPPCState *env, uint32_t op1, uint32_t op2)
1357 /* XXX: TODO: ignore special values (NaN, infinites, ...) */
1358 return efscmpeq(env, op1, op2);
1361 #define HELPER_SINGLE_SPE_CMP(name) \
1362 uint32_t helper_e##name(CPUPPCState *env, uint32_t op1, uint32_t op2) \
1364 return e##name(env, op1, op2); \
1366 /* efststlt */
1367 HELPER_SINGLE_SPE_CMP(fststlt);
1368 /* efststgt */
1369 HELPER_SINGLE_SPE_CMP(fststgt);
1370 /* efststeq */
1371 HELPER_SINGLE_SPE_CMP(fststeq);
1372 /* efscmplt */
1373 HELPER_SINGLE_SPE_CMP(fscmplt);
1374 /* efscmpgt */
1375 HELPER_SINGLE_SPE_CMP(fscmpgt);
1376 /* efscmpeq */
1377 HELPER_SINGLE_SPE_CMP(fscmpeq);
1379 static inline uint32_t evcmp_merge(int t0, int t1)
1381 return (t0 << 3) | (t1 << 2) | ((t0 | t1) << 1) | (t0 & t1);
1384 #define HELPER_VECTOR_SPE_CMP(name) \
1385 uint32_t helper_ev##name(CPUPPCState *env, uint64_t op1, uint64_t op2) \
1387 return evcmp_merge(e##name(env, op1 >> 32, op2 >> 32), \
1388 e##name(env, op1, op2)); \
1390 /* evfststlt */
1391 HELPER_VECTOR_SPE_CMP(fststlt);
1392 /* evfststgt */
1393 HELPER_VECTOR_SPE_CMP(fststgt);
1394 /* evfststeq */
1395 HELPER_VECTOR_SPE_CMP(fststeq);
1396 /* evfscmplt */
1397 HELPER_VECTOR_SPE_CMP(fscmplt);
1398 /* evfscmpgt */
1399 HELPER_VECTOR_SPE_CMP(fscmpgt);
1400 /* evfscmpeq */
1401 HELPER_VECTOR_SPE_CMP(fscmpeq);
1403 /* Double-precision floating-point conversion */
1404 uint64_t helper_efdcfsi(CPUPPCState *env, uint32_t val)
1406 CPU_DoubleU u;
1408 u.d = int32_to_float64(val, &env->vec_status);
1410 return u.ll;
1413 uint64_t helper_efdcfsid(CPUPPCState *env, uint64_t val)
1415 CPU_DoubleU u;
1417 u.d = int64_to_float64(val, &env->vec_status);
1419 return u.ll;
1422 uint64_t helper_efdcfui(CPUPPCState *env, uint32_t val)
1424 CPU_DoubleU u;
1426 u.d = uint32_to_float64(val, &env->vec_status);
1428 return u.ll;
1431 uint64_t helper_efdcfuid(CPUPPCState *env, uint64_t val)
1433 CPU_DoubleU u;
1435 u.d = uint64_to_float64(val, &env->vec_status);
1437 return u.ll;
1440 uint32_t helper_efdctsi(CPUPPCState *env, uint64_t val)
1442 CPU_DoubleU u;
1444 u.ll = val;
1445 /* NaN are not treated the same way IEEE 754 does */
1446 if (unlikely(float64_is_any_nan(u.d))) {
1447 return 0;
1450 return float64_to_int32(u.d, &env->vec_status);
1453 uint32_t helper_efdctui(CPUPPCState *env, uint64_t val)
1455 CPU_DoubleU u;
1457 u.ll = val;
1458 /* NaN are not treated the same way IEEE 754 does */
1459 if (unlikely(float64_is_any_nan(u.d))) {
1460 return 0;
1463 return float64_to_uint32(u.d, &env->vec_status);
1466 uint32_t helper_efdctsiz(CPUPPCState *env, uint64_t val)
1468 CPU_DoubleU u;
1470 u.ll = val;
1471 /* NaN are not treated the same way IEEE 754 does */
1472 if (unlikely(float64_is_any_nan(u.d))) {
1473 return 0;
1476 return float64_to_int32_round_to_zero(u.d, &env->vec_status);
1479 uint64_t helper_efdctsidz(CPUPPCState *env, uint64_t val)
1481 CPU_DoubleU u;
1483 u.ll = val;
1484 /* NaN are not treated the same way IEEE 754 does */
1485 if (unlikely(float64_is_any_nan(u.d))) {
1486 return 0;
1489 return float64_to_int64_round_to_zero(u.d, &env->vec_status);
1492 uint32_t helper_efdctuiz(CPUPPCState *env, uint64_t val)
1494 CPU_DoubleU u;
1496 u.ll = val;
1497 /* NaN are not treated the same way IEEE 754 does */
1498 if (unlikely(float64_is_any_nan(u.d))) {
1499 return 0;
1502 return float64_to_uint32_round_to_zero(u.d, &env->vec_status);
1505 uint64_t helper_efdctuidz(CPUPPCState *env, uint64_t val)
1507 CPU_DoubleU u;
1509 u.ll = val;
1510 /* NaN are not treated the same way IEEE 754 does */
1511 if (unlikely(float64_is_any_nan(u.d))) {
1512 return 0;
1515 return float64_to_uint64_round_to_zero(u.d, &env->vec_status);
1518 uint64_t helper_efdcfsf(CPUPPCState *env, uint32_t val)
1520 CPU_DoubleU u;
1521 float64 tmp;
1523 u.d = int32_to_float64(val, &env->vec_status);
1524 tmp = int64_to_float64(1ULL << 32, &env->vec_status);
1525 u.d = float64_div(u.d, tmp, &env->vec_status);
1527 return u.ll;
1530 uint64_t helper_efdcfuf(CPUPPCState *env, uint32_t val)
1532 CPU_DoubleU u;
1533 float64 tmp;
1535 u.d = uint32_to_float64(val, &env->vec_status);
1536 tmp = int64_to_float64(1ULL << 32, &env->vec_status);
1537 u.d = float64_div(u.d, tmp, &env->vec_status);
1539 return u.ll;
1542 uint32_t helper_efdctsf(CPUPPCState *env, uint64_t val)
1544 CPU_DoubleU u;
1545 float64 tmp;
1547 u.ll = val;
1548 /* NaN are not treated the same way IEEE 754 does */
1549 if (unlikely(float64_is_any_nan(u.d))) {
1550 return 0;
1552 tmp = uint64_to_float64(1ULL << 32, &env->vec_status);
1553 u.d = float64_mul(u.d, tmp, &env->vec_status);
1555 return float64_to_int32(u.d, &env->vec_status);
1558 uint32_t helper_efdctuf(CPUPPCState *env, uint64_t val)
1560 CPU_DoubleU u;
1561 float64 tmp;
1563 u.ll = val;
1564 /* NaN are not treated the same way IEEE 754 does */
1565 if (unlikely(float64_is_any_nan(u.d))) {
1566 return 0;
1568 tmp = uint64_to_float64(1ULL << 32, &env->vec_status);
1569 u.d = float64_mul(u.d, tmp, &env->vec_status);
1571 return float64_to_uint32(u.d, &env->vec_status);
1574 uint32_t helper_efscfd(CPUPPCState *env, uint64_t val)
1576 CPU_DoubleU u1;
1577 CPU_FloatU u2;
1579 u1.ll = val;
1580 u2.f = float64_to_float32(u1.d, &env->vec_status);
1582 return u2.l;
1585 uint64_t helper_efdcfs(CPUPPCState *env, uint32_t val)
1587 CPU_DoubleU u2;
1588 CPU_FloatU u1;
1590 u1.l = val;
1591 u2.d = float32_to_float64(u1.f, &env->vec_status);
1593 return u2.ll;
1596 /* Double precision fixed-point arithmetic */
1597 uint64_t helper_efdadd(CPUPPCState *env, uint64_t op1, uint64_t op2)
1599 CPU_DoubleU u1, u2;
1601 u1.ll = op1;
1602 u2.ll = op2;
1603 u1.d = float64_add(u1.d, u2.d, &env->vec_status);
1604 return u1.ll;
1607 uint64_t helper_efdsub(CPUPPCState *env, uint64_t op1, uint64_t op2)
1609 CPU_DoubleU u1, u2;
1611 u1.ll = op1;
1612 u2.ll = op2;
1613 u1.d = float64_sub(u1.d, u2.d, &env->vec_status);
1614 return u1.ll;
1617 uint64_t helper_efdmul(CPUPPCState *env, uint64_t op1, uint64_t op2)
1619 CPU_DoubleU u1, u2;
1621 u1.ll = op1;
1622 u2.ll = op2;
1623 u1.d = float64_mul(u1.d, u2.d, &env->vec_status);
1624 return u1.ll;
1627 uint64_t helper_efddiv(CPUPPCState *env, uint64_t op1, uint64_t op2)
1629 CPU_DoubleU u1, u2;
1631 u1.ll = op1;
1632 u2.ll = op2;
1633 u1.d = float64_div(u1.d, u2.d, &env->vec_status);
1634 return u1.ll;
1637 /* Double precision floating point helpers */
1638 uint32_t helper_efdtstlt(CPUPPCState *env, uint64_t op1, uint64_t op2)
1640 CPU_DoubleU u1, u2;
1642 u1.ll = op1;
1643 u2.ll = op2;
1644 return float64_lt(u1.d, u2.d, &env->vec_status) ? 4 : 0;
1647 uint32_t helper_efdtstgt(CPUPPCState *env, uint64_t op1, uint64_t op2)
1649 CPU_DoubleU u1, u2;
1651 u1.ll = op1;
1652 u2.ll = op2;
1653 return float64_le(u1.d, u2.d, &env->vec_status) ? 0 : 4;
1656 uint32_t helper_efdtsteq(CPUPPCState *env, uint64_t op1, uint64_t op2)
1658 CPU_DoubleU u1, u2;
1660 u1.ll = op1;
1661 u2.ll = op2;
1662 return float64_eq_quiet(u1.d, u2.d, &env->vec_status) ? 4 : 0;
1665 uint32_t helper_efdcmplt(CPUPPCState *env, uint64_t op1, uint64_t op2)
1667 /* XXX: TODO: test special values (NaN, infinites, ...) */
1668 return helper_efdtstlt(env, op1, op2);
1671 uint32_t helper_efdcmpgt(CPUPPCState *env, uint64_t op1, uint64_t op2)
1673 /* XXX: TODO: test special values (NaN, infinites, ...) */
1674 return helper_efdtstgt(env, op1, op2);
1677 uint32_t helper_efdcmpeq(CPUPPCState *env, uint64_t op1, uint64_t op2)
1679 /* XXX: TODO: test special values (NaN, infinites, ...) */
1680 return helper_efdtsteq(env, op1, op2);
1683 #define float64_to_float64(x, env) x
1687 * VSX_ADD_SUB - VSX floating point add/subtract
1688 * name - instruction mnemonic
1689 * op - operation (add or sub)
1690 * nels - number of elements (1, 2 or 4)
1691 * tp - type (float32 or float64)
1692 * fld - vsr_t field (VsrD(*) or VsrW(*))
1693 * sfprf - set FPRF
1695 #define VSX_ADD_SUB(name, op, nels, tp, fld, sfprf, r2sp) \
1696 void helper_##name(CPUPPCState *env, ppc_vsr_t *xt, \
1697 ppc_vsr_t *xa, ppc_vsr_t *xb) \
1699 ppc_vsr_t t = { }; \
1700 int i; \
1702 helper_reset_fpstatus(env); \
1704 for (i = 0; i < nels; i++) { \
1705 float_status tstat = env->fp_status; \
1706 set_float_exception_flags(0, &tstat); \
1707 t.fld = tp##_##op(xa->fld, xb->fld, &tstat); \
1708 env->fp_status.float_exception_flags |= tstat.float_exception_flags; \
1710 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) { \
1711 float_invalid_op_addsub(env, tstat.float_exception_flags, \
1712 sfprf, GETPC()); \
1715 if (r2sp) { \
1716 t.fld = do_frsp(env, t.fld, GETPC()); \
1719 if (sfprf) { \
1720 helper_compute_fprf_float64(env, t.fld); \
1723 *xt = t; \
1724 do_float_check_status(env, GETPC()); \
1727 VSX_ADD_SUB(xsadddp, add, 1, float64, VsrD(0), 1, 0)
1728 VSX_ADD_SUB(xsaddsp, add, 1, float64, VsrD(0), 1, 1)
1729 VSX_ADD_SUB(xvadddp, add, 2, float64, VsrD(i), 0, 0)
1730 VSX_ADD_SUB(xvaddsp, add, 4, float32, VsrW(i), 0, 0)
1731 VSX_ADD_SUB(xssubdp, sub, 1, float64, VsrD(0), 1, 0)
1732 VSX_ADD_SUB(xssubsp, sub, 1, float64, VsrD(0), 1, 1)
1733 VSX_ADD_SUB(xvsubdp, sub, 2, float64, VsrD(i), 0, 0)
1734 VSX_ADD_SUB(xvsubsp, sub, 4, float32, VsrW(i), 0, 0)
1736 void helper_xsaddqp(CPUPPCState *env, uint32_t opcode,
1737 ppc_vsr_t *xt, ppc_vsr_t *xa, ppc_vsr_t *xb)
1739 ppc_vsr_t t = *xt;
1740 float_status tstat;
1742 helper_reset_fpstatus(env);
1744 tstat = env->fp_status;
1745 if (unlikely(Rc(opcode) != 0)) {
1746 tstat.float_rounding_mode = float_round_to_odd;
1749 set_float_exception_flags(0, &tstat);
1750 t.f128 = float128_add(xa->f128, xb->f128, &tstat);
1751 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
1753 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) {
1754 float_invalid_op_addsub(env, tstat.float_exception_flags, 1, GETPC());
1757 helper_compute_fprf_float128(env, t.f128);
1759 *xt = t;
1760 do_float_check_status(env, GETPC());
1764 * VSX_MUL - VSX floating point multiply
1765 * op - instruction mnemonic
1766 * nels - number of elements (1, 2 or 4)
1767 * tp - type (float32 or float64)
1768 * fld - vsr_t field (VsrD(*) or VsrW(*))
1769 * sfprf - set FPRF
1771 #define VSX_MUL(op, nels, tp, fld, sfprf, r2sp) \
1772 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, \
1773 ppc_vsr_t *xa, ppc_vsr_t *xb) \
1775 ppc_vsr_t t = { }; \
1776 int i; \
1778 helper_reset_fpstatus(env); \
1780 for (i = 0; i < nels; i++) { \
1781 float_status tstat = env->fp_status; \
1782 set_float_exception_flags(0, &tstat); \
1783 t.fld = tp##_mul(xa->fld, xb->fld, &tstat); \
1784 env->fp_status.float_exception_flags |= tstat.float_exception_flags; \
1786 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) { \
1787 float_invalid_op_mul(env, tstat.float_exception_flags, \
1788 sfprf, GETPC()); \
1791 if (r2sp) { \
1792 t.fld = do_frsp(env, t.fld, GETPC()); \
1795 if (sfprf) { \
1796 helper_compute_fprf_float64(env, t.fld); \
1800 *xt = t; \
1801 do_float_check_status(env, GETPC()); \
1804 VSX_MUL(xsmuldp, 1, float64, VsrD(0), 1, 0)
1805 VSX_MUL(xsmulsp, 1, float64, VsrD(0), 1, 1)
1806 VSX_MUL(xvmuldp, 2, float64, VsrD(i), 0, 0)
1807 VSX_MUL(xvmulsp, 4, float32, VsrW(i), 0, 0)
1809 void helper_xsmulqp(CPUPPCState *env, uint32_t opcode,
1810 ppc_vsr_t *xt, ppc_vsr_t *xa, ppc_vsr_t *xb)
1812 ppc_vsr_t t = *xt;
1813 float_status tstat;
1815 helper_reset_fpstatus(env);
1816 tstat = env->fp_status;
1817 if (unlikely(Rc(opcode) != 0)) {
1818 tstat.float_rounding_mode = float_round_to_odd;
1821 set_float_exception_flags(0, &tstat);
1822 t.f128 = float128_mul(xa->f128, xb->f128, &tstat);
1823 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
1825 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) {
1826 float_invalid_op_mul(env, tstat.float_exception_flags, 1, GETPC());
1828 helper_compute_fprf_float128(env, t.f128);
1830 *xt = t;
1831 do_float_check_status(env, GETPC());
1835 * VSX_DIV - VSX floating point divide
1836 * op - instruction mnemonic
1837 * nels - number of elements (1, 2 or 4)
1838 * tp - type (float32 or float64)
1839 * fld - vsr_t field (VsrD(*) or VsrW(*))
1840 * sfprf - set FPRF
1842 #define VSX_DIV(op, nels, tp, fld, sfprf, r2sp) \
1843 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, \
1844 ppc_vsr_t *xa, ppc_vsr_t *xb) \
1846 ppc_vsr_t t = { }; \
1847 int i; \
1849 helper_reset_fpstatus(env); \
1851 for (i = 0; i < nels; i++) { \
1852 float_status tstat = env->fp_status; \
1853 set_float_exception_flags(0, &tstat); \
1854 t.fld = tp##_div(xa->fld, xb->fld, &tstat); \
1855 env->fp_status.float_exception_flags |= tstat.float_exception_flags; \
1857 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) { \
1858 float_invalid_op_div(env, tstat.float_exception_flags, \
1859 sfprf, GETPC()); \
1861 if (unlikely(tstat.float_exception_flags & float_flag_divbyzero)) { \
1862 float_zero_divide_excp(env, GETPC()); \
1865 if (r2sp) { \
1866 t.fld = do_frsp(env, t.fld, GETPC()); \
1869 if (sfprf) { \
1870 helper_compute_fprf_float64(env, t.fld); \
1874 *xt = t; \
1875 do_float_check_status(env, GETPC()); \
1878 VSX_DIV(xsdivdp, 1, float64, VsrD(0), 1, 0)
1879 VSX_DIV(xsdivsp, 1, float64, VsrD(0), 1, 1)
1880 VSX_DIV(xvdivdp, 2, float64, VsrD(i), 0, 0)
1881 VSX_DIV(xvdivsp, 4, float32, VsrW(i), 0, 0)
1883 void helper_xsdivqp(CPUPPCState *env, uint32_t opcode,
1884 ppc_vsr_t *xt, ppc_vsr_t *xa, ppc_vsr_t *xb)
1886 ppc_vsr_t t = *xt;
1887 float_status tstat;
1889 helper_reset_fpstatus(env);
1890 tstat = env->fp_status;
1891 if (unlikely(Rc(opcode) != 0)) {
1892 tstat.float_rounding_mode = float_round_to_odd;
1895 set_float_exception_flags(0, &tstat);
1896 t.f128 = float128_div(xa->f128, xb->f128, &tstat);
1897 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
1899 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) {
1900 float_invalid_op_div(env, tstat.float_exception_flags, 1, GETPC());
1902 if (unlikely(tstat.float_exception_flags & float_flag_divbyzero)) {
1903 float_zero_divide_excp(env, GETPC());
1906 helper_compute_fprf_float128(env, t.f128);
1907 *xt = t;
1908 do_float_check_status(env, GETPC());
1912 * VSX_RE - VSX floating point reciprocal estimate
1913 * op - instruction mnemonic
1914 * nels - number of elements (1, 2 or 4)
1915 * tp - type (float32 or float64)
1916 * fld - vsr_t field (VsrD(*) or VsrW(*))
1917 * sfprf - set FPRF
1919 #define VSX_RE(op, nels, tp, fld, sfprf, r2sp) \
1920 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
1922 ppc_vsr_t t = { }; \
1923 int i; \
1925 helper_reset_fpstatus(env); \
1927 for (i = 0; i < nels; i++) { \
1928 if (unlikely(tp##_is_signaling_nan(xb->fld, &env->fp_status))) { \
1929 float_invalid_op_vxsnan(env, GETPC()); \
1931 t.fld = tp##_div(tp##_one, xb->fld, &env->fp_status); \
1933 if (r2sp) { \
1934 t.fld = do_frsp(env, t.fld, GETPC()); \
1937 if (sfprf) { \
1938 helper_compute_fprf_float64(env, t.fld); \
1942 *xt = t; \
1943 do_float_check_status(env, GETPC()); \
1946 VSX_RE(xsredp, 1, float64, VsrD(0), 1, 0)
1947 VSX_RE(xsresp, 1, float64, VsrD(0), 1, 1)
1948 VSX_RE(xvredp, 2, float64, VsrD(i), 0, 0)
1949 VSX_RE(xvresp, 4, float32, VsrW(i), 0, 0)
1952 * VSX_SQRT - VSX floating point square root
1953 * op - instruction mnemonic
1954 * nels - number of elements (1, 2 or 4)
1955 * tp - type (float32 or float64)
1956 * fld - vsr_t field (VsrD(*) or VsrW(*))
1957 * sfprf - set FPRF
1959 #define VSX_SQRT(op, nels, tp, fld, sfprf, r2sp) \
1960 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
1962 ppc_vsr_t t = { }; \
1963 int i; \
1965 helper_reset_fpstatus(env); \
1967 for (i = 0; i < nels; i++) { \
1968 float_status tstat = env->fp_status; \
1969 set_float_exception_flags(0, &tstat); \
1970 t.fld = tp##_sqrt(xb->fld, &tstat); \
1971 env->fp_status.float_exception_flags |= tstat.float_exception_flags; \
1973 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) { \
1974 float_invalid_op_sqrt(env, tstat.float_exception_flags, \
1975 sfprf, GETPC()); \
1978 if (r2sp) { \
1979 t.fld = do_frsp(env, t.fld, GETPC()); \
1982 if (sfprf) { \
1983 helper_compute_fprf_float64(env, t.fld); \
1987 *xt = t; \
1988 do_float_check_status(env, GETPC()); \
1991 VSX_SQRT(xssqrtdp, 1, float64, VsrD(0), 1, 0)
1992 VSX_SQRT(xssqrtsp, 1, float64, VsrD(0), 1, 1)
1993 VSX_SQRT(xvsqrtdp, 2, float64, VsrD(i), 0, 0)
1994 VSX_SQRT(xvsqrtsp, 4, float32, VsrW(i), 0, 0)
1997 *VSX_RSQRTE - VSX floating point reciprocal square root estimate
1998 * op - instruction mnemonic
1999 * nels - number of elements (1, 2 or 4)
2000 * tp - type (float32 or float64)
2001 * fld - vsr_t field (VsrD(*) or VsrW(*))
2002 * sfprf - set FPRF
2004 #define VSX_RSQRTE(op, nels, tp, fld, sfprf, r2sp) \
2005 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
2007 ppc_vsr_t t = { }; \
2008 int i; \
2010 helper_reset_fpstatus(env); \
2012 for (i = 0; i < nels; i++) { \
2013 float_status tstat = env->fp_status; \
2014 set_float_exception_flags(0, &tstat); \
2015 t.fld = tp##_sqrt(xb->fld, &tstat); \
2016 t.fld = tp##_div(tp##_one, t.fld, &tstat); \
2017 env->fp_status.float_exception_flags |= tstat.float_exception_flags; \
2018 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) { \
2019 float_invalid_op_sqrt(env, tstat.float_exception_flags, \
2020 sfprf, GETPC()); \
2022 if (r2sp) { \
2023 t.fld = do_frsp(env, t.fld, GETPC()); \
2026 if (sfprf) { \
2027 helper_compute_fprf_float64(env, t.fld); \
2031 *xt = t; \
2032 do_float_check_status(env, GETPC()); \
2035 VSX_RSQRTE(xsrsqrtedp, 1, float64, VsrD(0), 1, 0)
2036 VSX_RSQRTE(xsrsqrtesp, 1, float64, VsrD(0), 1, 1)
2037 VSX_RSQRTE(xvrsqrtedp, 2, float64, VsrD(i), 0, 0)
2038 VSX_RSQRTE(xvrsqrtesp, 4, float32, VsrW(i), 0, 0)
2041 * VSX_TDIV - VSX floating point test for divide
2042 * op - instruction mnemonic
2043 * nels - number of elements (1, 2 or 4)
2044 * tp - type (float32 or float64)
2045 * fld - vsr_t field (VsrD(*) or VsrW(*))
2046 * emin - minimum unbiased exponent
2047 * emax - maximum unbiased exponent
2048 * nbits - number of fraction bits
2050 #define VSX_TDIV(op, nels, tp, fld, emin, emax, nbits) \
2051 void helper_##op(CPUPPCState *env, uint32_t opcode, \
2052 ppc_vsr_t *xa, ppc_vsr_t *xb) \
2054 int i; \
2055 int fe_flag = 0; \
2056 int fg_flag = 0; \
2058 for (i = 0; i < nels; i++) { \
2059 if (unlikely(tp##_is_infinity(xa->fld) || \
2060 tp##_is_infinity(xb->fld) || \
2061 tp##_is_zero(xb->fld))) { \
2062 fe_flag = 1; \
2063 fg_flag = 1; \
2064 } else { \
2065 int e_a = ppc_##tp##_get_unbiased_exp(xa->fld); \
2066 int e_b = ppc_##tp##_get_unbiased_exp(xb->fld); \
2068 if (unlikely(tp##_is_any_nan(xa->fld) || \
2069 tp##_is_any_nan(xb->fld))) { \
2070 fe_flag = 1; \
2071 } else if ((e_b <= emin) || (e_b >= (emax - 2))) { \
2072 fe_flag = 1; \
2073 } else if (!tp##_is_zero(xa->fld) && \
2074 (((e_a - e_b) >= emax) || \
2075 ((e_a - e_b) <= (emin + 1)) || \
2076 (e_a <= (emin + nbits)))) { \
2077 fe_flag = 1; \
2080 if (unlikely(tp##_is_zero_or_denormal(xb->fld))) { \
2081 /* \
2082 * XB is not zero because of the above check and so \
2083 * must be denormalized. \
2084 */ \
2085 fg_flag = 1; \
2090 env->crf[BF(opcode)] = 0x8 | (fg_flag ? 4 : 0) | (fe_flag ? 2 : 0); \
2093 VSX_TDIV(xstdivdp, 1, float64, VsrD(0), -1022, 1023, 52)
2094 VSX_TDIV(xvtdivdp, 2, float64, VsrD(i), -1022, 1023, 52)
2095 VSX_TDIV(xvtdivsp, 4, float32, VsrW(i), -126, 127, 23)
2098 * VSX_TSQRT - VSX floating point test for square root
2099 * op - instruction mnemonic
2100 * nels - number of elements (1, 2 or 4)
2101 * tp - type (float32 or float64)
2102 * fld - vsr_t field (VsrD(*) or VsrW(*))
2103 * emin - minimum unbiased exponent
2104 * emax - maximum unbiased exponent
2105 * nbits - number of fraction bits
2107 #define VSX_TSQRT(op, nels, tp, fld, emin, nbits) \
2108 void helper_##op(CPUPPCState *env, uint32_t opcode, ppc_vsr_t *xb) \
2110 int i; \
2111 int fe_flag = 0; \
2112 int fg_flag = 0; \
2114 for (i = 0; i < nels; i++) { \
2115 if (unlikely(tp##_is_infinity(xb->fld) || \
2116 tp##_is_zero(xb->fld))) { \
2117 fe_flag = 1; \
2118 fg_flag = 1; \
2119 } else { \
2120 int e_b = ppc_##tp##_get_unbiased_exp(xb->fld); \
2122 if (unlikely(tp##_is_any_nan(xb->fld))) { \
2123 fe_flag = 1; \
2124 } else if (unlikely(tp##_is_zero(xb->fld))) { \
2125 fe_flag = 1; \
2126 } else if (unlikely(tp##_is_neg(xb->fld))) { \
2127 fe_flag = 1; \
2128 } else if (!tp##_is_zero(xb->fld) && \
2129 (e_b <= (emin + nbits))) { \
2130 fe_flag = 1; \
2133 if (unlikely(tp##_is_zero_or_denormal(xb->fld))) { \
2134 /* \
2135 * XB is not zero because of the above check and \
2136 * therefore must be denormalized. \
2137 */ \
2138 fg_flag = 1; \
2143 env->crf[BF(opcode)] = 0x8 | (fg_flag ? 4 : 0) | (fe_flag ? 2 : 0); \
2146 VSX_TSQRT(xstsqrtdp, 1, float64, VsrD(0), -1022, 52)
2147 VSX_TSQRT(xvtsqrtdp, 2, float64, VsrD(i), -1022, 52)
2148 VSX_TSQRT(xvtsqrtsp, 4, float32, VsrW(i), -126, 23)
2151 * VSX_MADD - VSX floating point muliply/add variations
2152 * op - instruction mnemonic
2153 * nels - number of elements (1, 2 or 4)
2154 * tp - type (float32 or float64)
2155 * fld - vsr_t field (VsrD(*) or VsrW(*))
2156 * maddflgs - flags for the float*muladd routine that control the
2157 * various forms (madd, msub, nmadd, nmsub)
2158 * sfprf - set FPRF
2159 * r2sp - round intermediate double precision result to single precision
2161 #define VSX_MADD(op, nels, tp, fld, maddflgs, sfprf, r2sp) \
2162 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, \
2163 ppc_vsr_t *s1, ppc_vsr_t *s2, ppc_vsr_t *s3) \
2165 ppc_vsr_t t = *xt; \
2166 int i; \
2168 helper_reset_fpstatus(env); \
2170 for (i = 0; i < nels; i++) { \
2171 float_status tstat = env->fp_status; \
2172 set_float_exception_flags(0, &tstat); \
2173 if (r2sp && (tstat.float_rounding_mode == float_round_nearest_even)) {\
2174 /* \
2175 * Avoid double rounding errors by rounding the intermediate \
2176 * result to odd. \
2177 */ \
2178 set_float_rounding_mode(float_round_to_zero, &tstat); \
2179 t.fld = tp##_muladd(s1->fld, s3->fld, s2->fld, \
2180 maddflgs, &tstat); \
2181 t.fld |= (get_float_exception_flags(&tstat) & \
2182 float_flag_inexact) != 0; \
2183 } else { \
2184 t.fld = tp##_muladd(s1->fld, s3->fld, s2->fld, \
2185 maddflgs, &tstat); \
2187 env->fp_status.float_exception_flags |= tstat.float_exception_flags; \
2189 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) { \
2190 float_invalid_op_madd(env, tstat.float_exception_flags, \
2191 sfprf, GETPC()); \
2194 if (r2sp) { \
2195 t.fld = do_frsp(env, t.fld, GETPC()); \
2198 if (sfprf) { \
2199 helper_compute_fprf_float64(env, t.fld); \
2202 *xt = t; \
2203 do_float_check_status(env, GETPC()); \
2206 VSX_MADD(XSMADDDP, 1, float64, VsrD(0), MADD_FLGS, 1, 0)
2207 VSX_MADD(XSMSUBDP, 1, float64, VsrD(0), MSUB_FLGS, 1, 0)
2208 VSX_MADD(XSNMADDDP, 1, float64, VsrD(0), NMADD_FLGS, 1, 0)
2209 VSX_MADD(XSNMSUBDP, 1, float64, VsrD(0), NMSUB_FLGS, 1, 0)
2210 VSX_MADD(XSMADDSP, 1, float64, VsrD(0), MADD_FLGS, 1, 1)
2211 VSX_MADD(XSMSUBSP, 1, float64, VsrD(0), MSUB_FLGS, 1, 1)
2212 VSX_MADD(XSNMADDSP, 1, float64, VsrD(0), NMADD_FLGS, 1, 1)
2213 VSX_MADD(XSNMSUBSP, 1, float64, VsrD(0), NMSUB_FLGS, 1, 1)
2215 VSX_MADD(xvmadddp, 2, float64, VsrD(i), MADD_FLGS, 0, 0)
2216 VSX_MADD(xvmsubdp, 2, float64, VsrD(i), MSUB_FLGS, 0, 0)
2217 VSX_MADD(xvnmadddp, 2, float64, VsrD(i), NMADD_FLGS, 0, 0)
2218 VSX_MADD(xvnmsubdp, 2, float64, VsrD(i), NMSUB_FLGS, 0, 0)
2220 VSX_MADD(xvmaddsp, 4, float32, VsrW(i), MADD_FLGS, 0, 0)
2221 VSX_MADD(xvmsubsp, 4, float32, VsrW(i), MSUB_FLGS, 0, 0)
2222 VSX_MADD(xvnmaddsp, 4, float32, VsrW(i), NMADD_FLGS, 0, 0)
2223 VSX_MADD(xvnmsubsp, 4, float32, VsrW(i), NMSUB_FLGS, 0, 0)
2226 * VSX_MADDQ - VSX floating point quad-precision muliply/add
2227 * op - instruction mnemonic
2228 * maddflgs - flags for the float*muladd routine that control the
2229 * various forms (madd, msub, nmadd, nmsub)
2230 * ro - round to odd
2232 #define VSX_MADDQ(op, maddflgs, ro) \
2233 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *s1, ppc_vsr_t *s2,\
2234 ppc_vsr_t *s3) \
2236 ppc_vsr_t t = *xt; \
2238 helper_reset_fpstatus(env); \
2240 float_status tstat = env->fp_status; \
2241 set_float_exception_flags(0, &tstat); \
2242 if (ro) { \
2243 tstat.float_rounding_mode = float_round_to_odd; \
2245 t.f128 = float128_muladd(s1->f128, s3->f128, s2->f128, maddflgs, &tstat); \
2246 env->fp_status.float_exception_flags |= tstat.float_exception_flags; \
2248 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) { \
2249 float_invalid_op_madd(env, tstat.float_exception_flags, \
2250 false, GETPC()); \
2253 helper_compute_fprf_float128(env, t.f128); \
2254 *xt = t; \
2255 do_float_check_status(env, GETPC()); \
2258 VSX_MADDQ(XSMADDQP, MADD_FLGS, 0)
2259 VSX_MADDQ(XSMADDQPO, MADD_FLGS, 1)
2260 VSX_MADDQ(XSMSUBQP, MSUB_FLGS, 0)
2261 VSX_MADDQ(XSMSUBQPO, MSUB_FLGS, 1)
2262 VSX_MADDQ(XSNMADDQP, NMADD_FLGS, 0)
2263 VSX_MADDQ(XSNMADDQPO, NMADD_FLGS, 1)
2264 VSX_MADDQ(XSNMSUBQP, NMSUB_FLGS, 0)
2265 VSX_MADDQ(XSNMSUBQPO, NMSUB_FLGS, 0)
2268 * VSX_SCALAR_CMP_DP - VSX scalar floating point compare double precision
2269 * op - instruction mnemonic
2270 * cmp - comparison operation
2271 * exp - expected result of comparison
2272 * svxvc - set VXVC bit
2274 #define VSX_SCALAR_CMP_DP(op, cmp, exp, svxvc) \
2275 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, \
2276 ppc_vsr_t *xa, ppc_vsr_t *xb) \
2278 ppc_vsr_t t = *xt; \
2279 bool vxsnan_flag = false, vxvc_flag = false, vex_flag = false; \
2281 if (float64_is_signaling_nan(xa->VsrD(0), &env->fp_status) || \
2282 float64_is_signaling_nan(xb->VsrD(0), &env->fp_status)) { \
2283 vxsnan_flag = true; \
2284 if (fpscr_ve == 0 && svxvc) { \
2285 vxvc_flag = true; \
2287 } else if (svxvc) { \
2288 vxvc_flag = float64_is_quiet_nan(xa->VsrD(0), &env->fp_status) || \
2289 float64_is_quiet_nan(xb->VsrD(0), &env->fp_status); \
2291 if (vxsnan_flag) { \
2292 float_invalid_op_vxsnan(env, GETPC()); \
2294 if (vxvc_flag) { \
2295 float_invalid_op_vxvc(env, 0, GETPC()); \
2297 vex_flag = fpscr_ve && (vxvc_flag || vxsnan_flag); \
2299 if (!vex_flag) { \
2300 if (float64_##cmp(xb->VsrD(0), xa->VsrD(0), \
2301 &env->fp_status) == exp) { \
2302 t.VsrD(0) = -1; \
2303 t.VsrD(1) = 0; \
2304 } else { \
2305 t.VsrD(0) = 0; \
2306 t.VsrD(1) = 0; \
2309 *xt = t; \
2310 do_float_check_status(env, GETPC()); \
2313 VSX_SCALAR_CMP_DP(xscmpeqdp, eq, 1, 0)
2314 VSX_SCALAR_CMP_DP(xscmpgedp, le, 1, 1)
2315 VSX_SCALAR_CMP_DP(xscmpgtdp, lt, 1, 1)
2316 VSX_SCALAR_CMP_DP(xscmpnedp, eq, 0, 0)
2318 void helper_xscmpexpdp(CPUPPCState *env, uint32_t opcode,
2319 ppc_vsr_t *xa, ppc_vsr_t *xb)
2321 int64_t exp_a, exp_b;
2322 uint32_t cc;
2324 exp_a = extract64(xa->VsrD(0), 52, 11);
2325 exp_b = extract64(xb->VsrD(0), 52, 11);
2327 if (unlikely(float64_is_any_nan(xa->VsrD(0)) ||
2328 float64_is_any_nan(xb->VsrD(0)))) {
2329 cc = CRF_SO;
2330 } else {
2331 if (exp_a < exp_b) {
2332 cc = CRF_LT;
2333 } else if (exp_a > exp_b) {
2334 cc = CRF_GT;
2335 } else {
2336 cc = CRF_EQ;
2340 env->fpscr &= ~FP_FPCC;
2341 env->fpscr |= cc << FPSCR_FPCC;
2342 env->crf[BF(opcode)] = cc;
2344 do_float_check_status(env, GETPC());
2347 void helper_xscmpexpqp(CPUPPCState *env, uint32_t opcode,
2348 ppc_vsr_t *xa, ppc_vsr_t *xb)
2350 int64_t exp_a, exp_b;
2351 uint32_t cc;
2353 exp_a = extract64(xa->VsrD(0), 48, 15);
2354 exp_b = extract64(xb->VsrD(0), 48, 15);
2356 if (unlikely(float128_is_any_nan(xa->f128) ||
2357 float128_is_any_nan(xb->f128))) {
2358 cc = CRF_SO;
2359 } else {
2360 if (exp_a < exp_b) {
2361 cc = CRF_LT;
2362 } else if (exp_a > exp_b) {
2363 cc = CRF_GT;
2364 } else {
2365 cc = CRF_EQ;
2369 env->fpscr &= ~FP_FPCC;
2370 env->fpscr |= cc << FPSCR_FPCC;
2371 env->crf[BF(opcode)] = cc;
2373 do_float_check_status(env, GETPC());
2376 static inline void do_scalar_cmp(CPUPPCState *env, ppc_vsr_t *xa, ppc_vsr_t *xb,
2377 int crf_idx, bool ordered)
2379 uint32_t cc;
2380 bool vxsnan_flag = false, vxvc_flag = false;
2382 helper_reset_fpstatus(env);
2384 switch (float64_compare(xa->VsrD(0), xb->VsrD(0), &env->fp_status)) {
2385 case float_relation_less:
2386 cc = CRF_LT;
2387 break;
2388 case float_relation_equal:
2389 cc = CRF_EQ;
2390 break;
2391 case float_relation_greater:
2392 cc = CRF_GT;
2393 break;
2394 case float_relation_unordered:
2395 cc = CRF_SO;
2397 if (float64_is_signaling_nan(xa->VsrD(0), &env->fp_status) ||
2398 float64_is_signaling_nan(xb->VsrD(0), &env->fp_status)) {
2399 vxsnan_flag = true;
2400 if (fpscr_ve == 0 && ordered) {
2401 vxvc_flag = true;
2403 } else if (float64_is_quiet_nan(xa->VsrD(0), &env->fp_status) ||
2404 float64_is_quiet_nan(xb->VsrD(0), &env->fp_status)) {
2405 if (ordered) {
2406 vxvc_flag = true;
2410 break;
2411 default:
2412 g_assert_not_reached();
2415 env->fpscr &= ~FP_FPCC;
2416 env->fpscr |= cc << FPSCR_FPCC;
2417 env->crf[crf_idx] = cc;
2419 if (vxsnan_flag) {
2420 float_invalid_op_vxsnan(env, GETPC());
2422 if (vxvc_flag) {
2423 float_invalid_op_vxvc(env, 0, GETPC());
2426 do_float_check_status(env, GETPC());
2429 void helper_xscmpodp(CPUPPCState *env, uint32_t opcode, ppc_vsr_t *xa,
2430 ppc_vsr_t *xb)
2432 do_scalar_cmp(env, xa, xb, BF(opcode), true);
2435 void helper_xscmpudp(CPUPPCState *env, uint32_t opcode, ppc_vsr_t *xa,
2436 ppc_vsr_t *xb)
2438 do_scalar_cmp(env, xa, xb, BF(opcode), false);
2441 static inline void do_scalar_cmpq(CPUPPCState *env, ppc_vsr_t *xa,
2442 ppc_vsr_t *xb, int crf_idx, bool ordered)
2444 uint32_t cc;
2445 bool vxsnan_flag = false, vxvc_flag = false;
2447 helper_reset_fpstatus(env);
2449 switch (float128_compare(xa->f128, xb->f128, &env->fp_status)) {
2450 case float_relation_less:
2451 cc = CRF_LT;
2452 break;
2453 case float_relation_equal:
2454 cc = CRF_EQ;
2455 break;
2456 case float_relation_greater:
2457 cc = CRF_GT;
2458 break;
2459 case float_relation_unordered:
2460 cc = CRF_SO;
2462 if (float128_is_signaling_nan(xa->f128, &env->fp_status) ||
2463 float128_is_signaling_nan(xb->f128, &env->fp_status)) {
2464 vxsnan_flag = true;
2465 if (fpscr_ve == 0 && ordered) {
2466 vxvc_flag = true;
2468 } else if (float128_is_quiet_nan(xa->f128, &env->fp_status) ||
2469 float128_is_quiet_nan(xb->f128, &env->fp_status)) {
2470 if (ordered) {
2471 vxvc_flag = true;
2475 break;
2476 default:
2477 g_assert_not_reached();
2480 env->fpscr &= ~FP_FPCC;
2481 env->fpscr |= cc << FPSCR_FPCC;
2482 env->crf[crf_idx] = cc;
2484 if (vxsnan_flag) {
2485 float_invalid_op_vxsnan(env, GETPC());
2487 if (vxvc_flag) {
2488 float_invalid_op_vxvc(env, 0, GETPC());
2491 do_float_check_status(env, GETPC());
2494 void helper_xscmpoqp(CPUPPCState *env, uint32_t opcode, ppc_vsr_t *xa,
2495 ppc_vsr_t *xb)
2497 do_scalar_cmpq(env, xa, xb, BF(opcode), true);
2500 void helper_xscmpuqp(CPUPPCState *env, uint32_t opcode, ppc_vsr_t *xa,
2501 ppc_vsr_t *xb)
2503 do_scalar_cmpq(env, xa, xb, BF(opcode), false);
2507 * VSX_MAX_MIN - VSX floating point maximum/minimum
2508 * name - instruction mnemonic
2509 * op - operation (max or min)
2510 * nels - number of elements (1, 2 or 4)
2511 * tp - type (float32 or float64)
2512 * fld - vsr_t field (VsrD(*) or VsrW(*))
2514 #define VSX_MAX_MIN(name, op, nels, tp, fld) \
2515 void helper_##name(CPUPPCState *env, ppc_vsr_t *xt, \
2516 ppc_vsr_t *xa, ppc_vsr_t *xb) \
2518 ppc_vsr_t t = { }; \
2519 int i; \
2521 for (i = 0; i < nels; i++) { \
2522 t.fld = tp##_##op(xa->fld, xb->fld, &env->fp_status); \
2523 if (unlikely(tp##_is_signaling_nan(xa->fld, &env->fp_status) || \
2524 tp##_is_signaling_nan(xb->fld, &env->fp_status))) { \
2525 float_invalid_op_vxsnan(env, GETPC()); \
2529 *xt = t; \
2530 do_float_check_status(env, GETPC()); \
2533 VSX_MAX_MIN(xsmaxdp, maxnum, 1, float64, VsrD(0))
2534 VSX_MAX_MIN(xvmaxdp, maxnum, 2, float64, VsrD(i))
2535 VSX_MAX_MIN(xvmaxsp, maxnum, 4, float32, VsrW(i))
2536 VSX_MAX_MIN(xsmindp, minnum, 1, float64, VsrD(0))
2537 VSX_MAX_MIN(xvmindp, minnum, 2, float64, VsrD(i))
2538 VSX_MAX_MIN(xvminsp, minnum, 4, float32, VsrW(i))
2540 #define VSX_MAX_MINC(name, max) \
2541 void helper_##name(CPUPPCState *env, \
2542 ppc_vsr_t *xt, ppc_vsr_t *xa, ppc_vsr_t *xb) \
2544 ppc_vsr_t t = { }; \
2545 bool vxsnan_flag = false, vex_flag = false; \
2547 if (unlikely(float64_is_any_nan(xa->VsrD(0)) || \
2548 float64_is_any_nan(xb->VsrD(0)))) { \
2549 if (float64_is_signaling_nan(xa->VsrD(0), &env->fp_status) || \
2550 float64_is_signaling_nan(xb->VsrD(0), &env->fp_status)) { \
2551 vxsnan_flag = true; \
2553 t.VsrD(0) = xb->VsrD(0); \
2554 } else if ((max && \
2555 !float64_lt(xa->VsrD(0), xb->VsrD(0), &env->fp_status)) || \
2556 (!max && \
2557 float64_lt(xa->VsrD(0), xb->VsrD(0), &env->fp_status))) { \
2558 t.VsrD(0) = xa->VsrD(0); \
2559 } else { \
2560 t.VsrD(0) = xb->VsrD(0); \
2563 vex_flag = fpscr_ve & vxsnan_flag; \
2564 if (vxsnan_flag) { \
2565 float_invalid_op_vxsnan(env, GETPC()); \
2567 if (!vex_flag) { \
2568 *xt = t; \
2572 VSX_MAX_MINC(xsmaxcdp, 1);
2573 VSX_MAX_MINC(xsmincdp, 0);
2575 #define VSX_MAX_MINJ(name, max) \
2576 void helper_##name(CPUPPCState *env, \
2577 ppc_vsr_t *xt, ppc_vsr_t *xa, ppc_vsr_t *xb) \
2579 ppc_vsr_t t = { }; \
2580 bool vxsnan_flag = false, vex_flag = false; \
2582 if (unlikely(float64_is_any_nan(xa->VsrD(0)))) { \
2583 if (float64_is_signaling_nan(xa->VsrD(0), &env->fp_status)) { \
2584 vxsnan_flag = true; \
2586 t.VsrD(0) = xa->VsrD(0); \
2587 } else if (unlikely(float64_is_any_nan(xb->VsrD(0)))) { \
2588 if (float64_is_signaling_nan(xb->VsrD(0), &env->fp_status)) { \
2589 vxsnan_flag = true; \
2591 t.VsrD(0) = xb->VsrD(0); \
2592 } else if (float64_is_zero(xa->VsrD(0)) && \
2593 float64_is_zero(xb->VsrD(0))) { \
2594 if (max) { \
2595 if (!float64_is_neg(xa->VsrD(0)) || \
2596 !float64_is_neg(xb->VsrD(0))) { \
2597 t.VsrD(0) = 0ULL; \
2598 } else { \
2599 t.VsrD(0) = 0x8000000000000000ULL; \
2601 } else { \
2602 if (float64_is_neg(xa->VsrD(0)) || \
2603 float64_is_neg(xb->VsrD(0))) { \
2604 t.VsrD(0) = 0x8000000000000000ULL; \
2605 } else { \
2606 t.VsrD(0) = 0ULL; \
2609 } else if ((max && \
2610 !float64_lt(xa->VsrD(0), xb->VsrD(0), &env->fp_status)) || \
2611 (!max && \
2612 float64_lt(xa->VsrD(0), xb->VsrD(0), &env->fp_status))) { \
2613 t.VsrD(0) = xa->VsrD(0); \
2614 } else { \
2615 t.VsrD(0) = xb->VsrD(0); \
2618 vex_flag = fpscr_ve & vxsnan_flag; \
2619 if (vxsnan_flag) { \
2620 float_invalid_op_vxsnan(env, GETPC()); \
2622 if (!vex_flag) { \
2623 *xt = t; \
2627 VSX_MAX_MINJ(xsmaxjdp, 1);
2628 VSX_MAX_MINJ(xsminjdp, 0);
2631 * VSX_CMP - VSX floating point compare
2632 * op - instruction mnemonic
2633 * nels - number of elements (1, 2 or 4)
2634 * tp - type (float32 or float64)
2635 * fld - vsr_t field (VsrD(*) or VsrW(*))
2636 * cmp - comparison operation
2637 * svxvc - set VXVC bit
2638 * exp - expected result of comparison
2640 #define VSX_CMP(op, nels, tp, fld, cmp, svxvc, exp) \
2641 uint32_t helper_##op(CPUPPCState *env, ppc_vsr_t *xt, \
2642 ppc_vsr_t *xa, ppc_vsr_t *xb) \
2644 ppc_vsr_t t = *xt; \
2645 uint32_t crf6 = 0; \
2646 int i; \
2647 int all_true = 1; \
2648 int all_false = 1; \
2650 for (i = 0; i < nels; i++) { \
2651 if (unlikely(tp##_is_any_nan(xa->fld) || \
2652 tp##_is_any_nan(xb->fld))) { \
2653 if (tp##_is_signaling_nan(xa->fld, &env->fp_status) || \
2654 tp##_is_signaling_nan(xb->fld, &env->fp_status)) { \
2655 float_invalid_op_vxsnan(env, GETPC()); \
2657 if (svxvc) { \
2658 float_invalid_op_vxvc(env, 0, GETPC()); \
2660 t.fld = 0; \
2661 all_true = 0; \
2662 } else { \
2663 if (tp##_##cmp(xb->fld, xa->fld, &env->fp_status) == exp) { \
2664 t.fld = -1; \
2665 all_false = 0; \
2666 } else { \
2667 t.fld = 0; \
2668 all_true = 0; \
2673 *xt = t; \
2674 crf6 = (all_true ? 0x8 : 0) | (all_false ? 0x2 : 0); \
2675 return crf6; \
2678 VSX_CMP(xvcmpeqdp, 2, float64, VsrD(i), eq, 0, 1)
2679 VSX_CMP(xvcmpgedp, 2, float64, VsrD(i), le, 1, 1)
2680 VSX_CMP(xvcmpgtdp, 2, float64, VsrD(i), lt, 1, 1)
2681 VSX_CMP(xvcmpnedp, 2, float64, VsrD(i), eq, 0, 0)
2682 VSX_CMP(xvcmpeqsp, 4, float32, VsrW(i), eq, 0, 1)
2683 VSX_CMP(xvcmpgesp, 4, float32, VsrW(i), le, 1, 1)
2684 VSX_CMP(xvcmpgtsp, 4, float32, VsrW(i), lt, 1, 1)
2685 VSX_CMP(xvcmpnesp, 4, float32, VsrW(i), eq, 0, 0)
2688 * VSX_CVT_FP_TO_FP - VSX floating point/floating point conversion
2689 * op - instruction mnemonic
2690 * nels - number of elements (1, 2 or 4)
2691 * stp - source type (float32 or float64)
2692 * ttp - target type (float32 or float64)
2693 * sfld - source vsr_t field
2694 * tfld - target vsr_t field (f32 or f64)
2695 * sfprf - set FPRF
2697 #define VSX_CVT_FP_TO_FP(op, nels, stp, ttp, sfld, tfld, sfprf) \
2698 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
2700 ppc_vsr_t t = { }; \
2701 int i; \
2703 for (i = 0; i < nels; i++) { \
2704 t.tfld = stp##_to_##ttp(xb->sfld, &env->fp_status); \
2705 if (unlikely(stp##_is_signaling_nan(xb->sfld, \
2706 &env->fp_status))) { \
2707 float_invalid_op_vxsnan(env, GETPC()); \
2708 t.tfld = ttp##_snan_to_qnan(t.tfld); \
2710 if (sfprf) { \
2711 helper_compute_fprf_##ttp(env, t.tfld); \
2715 *xt = t; \
2716 do_float_check_status(env, GETPC()); \
2719 VSX_CVT_FP_TO_FP(xscvdpsp, 1, float64, float32, VsrD(0), VsrW(0), 1)
2720 VSX_CVT_FP_TO_FP(xscvspdp, 1, float32, float64, VsrW(0), VsrD(0), 1)
2721 VSX_CVT_FP_TO_FP(xvcvdpsp, 2, float64, float32, VsrD(i), VsrW(2 * i), 0)
2722 VSX_CVT_FP_TO_FP(xvcvspdp, 2, float32, float64, VsrW(2 * i), VsrD(i), 0)
2725 * VSX_CVT_FP_TO_FP_VECTOR - VSX floating point/floating point conversion
2726 * op - instruction mnemonic
2727 * nels - number of elements (1, 2 or 4)
2728 * stp - source type (float32 or float64)
2729 * ttp - target type (float32 or float64)
2730 * sfld - source vsr_t field
2731 * tfld - target vsr_t field (f32 or f64)
2732 * sfprf - set FPRF
2734 #define VSX_CVT_FP_TO_FP_VECTOR(op, nels, stp, ttp, sfld, tfld, sfprf) \
2735 void helper_##op(CPUPPCState *env, uint32_t opcode, \
2736 ppc_vsr_t *xt, ppc_vsr_t *xb) \
2738 ppc_vsr_t t = *xt; \
2739 int i; \
2741 for (i = 0; i < nels; i++) { \
2742 t.tfld = stp##_to_##ttp(xb->sfld, &env->fp_status); \
2743 if (unlikely(stp##_is_signaling_nan(xb->sfld, \
2744 &env->fp_status))) { \
2745 float_invalid_op_vxsnan(env, GETPC()); \
2746 t.tfld = ttp##_snan_to_qnan(t.tfld); \
2748 if (sfprf) { \
2749 helper_compute_fprf_##ttp(env, t.tfld); \
2753 *xt = t; \
2754 do_float_check_status(env, GETPC()); \
2757 VSX_CVT_FP_TO_FP_VECTOR(xscvdpqp, 1, float64, float128, VsrD(0), f128, 1)
2760 * VSX_CVT_FP_TO_FP_HP - VSX floating point/floating point conversion
2761 * involving one half precision value
2762 * op - instruction mnemonic
2763 * nels - number of elements (1, 2 or 4)
2764 * stp - source type
2765 * ttp - target type
2766 * sfld - source vsr_t field
2767 * tfld - target vsr_t field
2768 * sfprf - set FPRF
2770 #define VSX_CVT_FP_TO_FP_HP(op, nels, stp, ttp, sfld, tfld, sfprf) \
2771 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
2773 ppc_vsr_t t = { }; \
2774 int i; \
2776 for (i = 0; i < nels; i++) { \
2777 t.tfld = stp##_to_##ttp(xb->sfld, 1, &env->fp_status); \
2778 if (unlikely(stp##_is_signaling_nan(xb->sfld, \
2779 &env->fp_status))) { \
2780 float_invalid_op_vxsnan(env, GETPC()); \
2781 t.tfld = ttp##_snan_to_qnan(t.tfld); \
2783 if (sfprf) { \
2784 helper_compute_fprf_##ttp(env, t.tfld); \
2788 *xt = t; \
2789 do_float_check_status(env, GETPC()); \
2792 VSX_CVT_FP_TO_FP_HP(xscvdphp, 1, float64, float16, VsrD(0), VsrH(3), 1)
2793 VSX_CVT_FP_TO_FP_HP(xscvhpdp, 1, float16, float64, VsrH(3), VsrD(0), 1)
2794 VSX_CVT_FP_TO_FP_HP(xvcvsphp, 4, float32, float16, VsrW(i), VsrH(2 * i + 1), 0)
2795 VSX_CVT_FP_TO_FP_HP(xvcvhpsp, 4, float16, float32, VsrH(2 * i + 1), VsrW(i), 0)
2797 void helper_XSCVQPDP(CPUPPCState *env, uint32_t ro, ppc_vsr_t *xt,
2798 ppc_vsr_t *xb)
2800 ppc_vsr_t t = { };
2801 float_status tstat;
2803 tstat = env->fp_status;
2804 if (ro != 0) {
2805 tstat.float_rounding_mode = float_round_to_odd;
2808 t.VsrD(0) = float128_to_float64(xb->f128, &tstat);
2809 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
2810 if (unlikely(float128_is_signaling_nan(xb->f128, &tstat))) {
2811 float_invalid_op_vxsnan(env, GETPC());
2812 t.VsrD(0) = float64_snan_to_qnan(t.VsrD(0));
2814 helper_compute_fprf_float64(env, t.VsrD(0));
2816 *xt = t;
2817 do_float_check_status(env, GETPC());
2820 uint64_t helper_xscvdpspn(CPUPPCState *env, uint64_t xb)
2822 uint64_t result, sign, exp, frac;
2824 float_status tstat = env->fp_status;
2825 set_float_exception_flags(0, &tstat);
2827 sign = extract64(xb, 63, 1);
2828 exp = extract64(xb, 52, 11);
2829 frac = extract64(xb, 0, 52) | 0x10000000000000ULL;
2831 if (unlikely(exp == 0 && extract64(frac, 0, 52) != 0)) {
2832 /* DP denormal operand. */
2833 /* Exponent override to DP min exp. */
2834 exp = 1;
2835 /* Implicit bit override to 0. */
2836 frac = deposit64(frac, 53, 1, 0);
2839 if (unlikely(exp < 897 && frac != 0)) {
2840 /* SP tiny operand. */
2841 if (897 - exp > 63) {
2842 frac = 0;
2843 } else {
2844 /* Denormalize until exp = SP min exp. */
2845 frac >>= (897 - exp);
2847 /* Exponent override to SP min exp - 1. */
2848 exp = 896;
2851 result = sign << 31;
2852 result |= extract64(exp, 10, 1) << 30;
2853 result |= extract64(exp, 0, 7) << 23;
2854 result |= extract64(frac, 29, 23);
2856 /* hardware replicates result to both words of the doubleword result. */
2857 return (result << 32) | result;
2860 uint64_t helper_xscvspdpn(CPUPPCState *env, uint64_t xb)
2862 return helper_todouble(xb >> 32);
2866 * VSX_CVT_FP_TO_INT - VSX floating point to integer conversion
2867 * op - instruction mnemonic
2868 * nels - number of elements (1, 2 or 4)
2869 * stp - source type (float32 or float64)
2870 * ttp - target type (int32, uint32, int64 or uint64)
2871 * sfld - source vsr_t field
2872 * tfld - target vsr_t field
2873 * rnan - resulting NaN
2875 #define VSX_CVT_FP_TO_INT(op, nels, stp, ttp, sfld, tfld, rnan) \
2876 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
2878 int all_flags = env->fp_status.float_exception_flags, flags; \
2879 ppc_vsr_t t = { }; \
2880 int i; \
2882 for (i = 0; i < nels; i++) { \
2883 env->fp_status.float_exception_flags = 0; \
2884 t.tfld = stp##_to_##ttp##_round_to_zero(xb->sfld, &env->fp_status); \
2885 flags = env->fp_status.float_exception_flags; \
2886 if (unlikely(flags & float_flag_invalid)) { \
2887 t.tfld = float_invalid_cvt(env, flags, t.tfld, rnan, 0, GETPC());\
2889 all_flags |= flags; \
2892 *xt = t; \
2893 env->fp_status.float_exception_flags = all_flags; \
2894 do_float_check_status(env, GETPC()); \
2897 VSX_CVT_FP_TO_INT(xscvdpsxds, 1, float64, int64, VsrD(0), VsrD(0), \
2898 0x8000000000000000ULL)
2899 VSX_CVT_FP_TO_INT(xscvdpsxws, 1, float64, int32, VsrD(0), VsrW(1), \
2900 0x80000000U)
2901 VSX_CVT_FP_TO_INT(xscvdpuxds, 1, float64, uint64, VsrD(0), VsrD(0), 0ULL)
2902 VSX_CVT_FP_TO_INT(xscvdpuxws, 1, float64, uint32, VsrD(0), VsrW(1), 0U)
2903 VSX_CVT_FP_TO_INT(xvcvdpsxds, 2, float64, int64, VsrD(i), VsrD(i), \
2904 0x8000000000000000ULL)
2905 VSX_CVT_FP_TO_INT(xvcvdpsxws, 2, float64, int32, VsrD(i), VsrW(2 * i), \
2906 0x80000000U)
2907 VSX_CVT_FP_TO_INT(xvcvdpuxds, 2, float64, uint64, VsrD(i), VsrD(i), 0ULL)
2908 VSX_CVT_FP_TO_INT(xvcvdpuxws, 2, float64, uint32, VsrD(i), VsrW(2 * i), 0U)
2909 VSX_CVT_FP_TO_INT(xvcvspsxds, 2, float32, int64, VsrW(2 * i), VsrD(i), \
2910 0x8000000000000000ULL)
2911 VSX_CVT_FP_TO_INT(xvcvspsxws, 4, float32, int32, VsrW(i), VsrW(i), 0x80000000U)
2912 VSX_CVT_FP_TO_INT(xvcvspuxds, 2, float32, uint64, VsrW(2 * i), VsrD(i), 0ULL)
2913 VSX_CVT_FP_TO_INT(xvcvspuxws, 4, float32, uint32, VsrW(i), VsrW(i), 0U)
2916 * VSX_CVT_FP_TO_INT_VECTOR - VSX floating point to integer conversion
2917 * op - instruction mnemonic
2918 * stp - source type (float32 or float64)
2919 * ttp - target type (int32, uint32, int64 or uint64)
2920 * sfld - source vsr_t field
2921 * tfld - target vsr_t field
2922 * rnan - resulting NaN
2924 #define VSX_CVT_FP_TO_INT_VECTOR(op, stp, ttp, sfld, tfld, rnan) \
2925 void helper_##op(CPUPPCState *env, uint32_t opcode, \
2926 ppc_vsr_t *xt, ppc_vsr_t *xb) \
2928 ppc_vsr_t t = { }; \
2929 int flags; \
2931 t.tfld = stp##_to_##ttp##_round_to_zero(xb->sfld, &env->fp_status); \
2932 flags = get_float_exception_flags(&env->fp_status); \
2933 if (flags & float_flag_invalid) { \
2934 t.tfld = float_invalid_cvt(env, flags, t.tfld, rnan, 0, GETPC()); \
2937 *xt = t; \
2938 do_float_check_status(env, GETPC()); \
2941 VSX_CVT_FP_TO_INT_VECTOR(xscvqpsdz, float128, int64, f128, VsrD(0), \
2942 0x8000000000000000ULL)
2944 VSX_CVT_FP_TO_INT_VECTOR(xscvqpswz, float128, int32, f128, VsrD(0), \
2945 0xffffffff80000000ULL)
2946 VSX_CVT_FP_TO_INT_VECTOR(xscvqpudz, float128, uint64, f128, VsrD(0), 0x0ULL)
2947 VSX_CVT_FP_TO_INT_VECTOR(xscvqpuwz, float128, uint32, f128, VsrD(0), 0x0ULL)
2950 * VSX_CVT_INT_TO_FP - VSX integer to floating point conversion
2951 * op - instruction mnemonic
2952 * nels - number of elements (1, 2 or 4)
2953 * stp - source type (int32, uint32, int64 or uint64)
2954 * ttp - target type (float32 or float64)
2955 * sfld - source vsr_t field
2956 * tfld - target vsr_t field
2957 * jdef - definition of the j index (i or 2*i)
2958 * sfprf - set FPRF
2960 #define VSX_CVT_INT_TO_FP(op, nels, stp, ttp, sfld, tfld, sfprf, r2sp) \
2961 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
2963 ppc_vsr_t t = { }; \
2964 int i; \
2966 for (i = 0; i < nels; i++) { \
2967 t.tfld = stp##_to_##ttp(xb->sfld, &env->fp_status); \
2968 if (r2sp) { \
2969 t.tfld = do_frsp(env, t.tfld, GETPC()); \
2971 if (sfprf) { \
2972 helper_compute_fprf_float64(env, t.tfld); \
2976 *xt = t; \
2977 do_float_check_status(env, GETPC()); \
2980 VSX_CVT_INT_TO_FP(xscvsxddp, 1, int64, float64, VsrD(0), VsrD(0), 1, 0)
2981 VSX_CVT_INT_TO_FP(xscvuxddp, 1, uint64, float64, VsrD(0), VsrD(0), 1, 0)
2982 VSX_CVT_INT_TO_FP(xscvsxdsp, 1, int64, float64, VsrD(0), VsrD(0), 1, 1)
2983 VSX_CVT_INT_TO_FP(xscvuxdsp, 1, uint64, float64, VsrD(0), VsrD(0), 1, 1)
2984 VSX_CVT_INT_TO_FP(xvcvsxddp, 2, int64, float64, VsrD(i), VsrD(i), 0, 0)
2985 VSX_CVT_INT_TO_FP(xvcvuxddp, 2, uint64, float64, VsrD(i), VsrD(i), 0, 0)
2986 VSX_CVT_INT_TO_FP(xvcvsxwdp, 2, int32, float64, VsrW(2 * i), VsrD(i), 0, 0)
2987 VSX_CVT_INT_TO_FP(xvcvuxwdp, 2, uint64, float64, VsrW(2 * i), VsrD(i), 0, 0)
2988 VSX_CVT_INT_TO_FP(xvcvsxdsp, 2, int64, float32, VsrD(i), VsrW(2 * i), 0, 0)
2989 VSX_CVT_INT_TO_FP(xvcvuxdsp, 2, uint64, float32, VsrD(i), VsrW(2 * i), 0, 0)
2990 VSX_CVT_INT_TO_FP(xvcvsxwsp, 4, int32, float32, VsrW(i), VsrW(i), 0, 0)
2991 VSX_CVT_INT_TO_FP(xvcvuxwsp, 4, uint32, float32, VsrW(i), VsrW(i), 0, 0)
2994 * VSX_CVT_INT_TO_FP_VECTOR - VSX integer to floating point conversion
2995 * op - instruction mnemonic
2996 * stp - source type (int32, uint32, int64 or uint64)
2997 * ttp - target type (float32 or float64)
2998 * sfld - source vsr_t field
2999 * tfld - target vsr_t field
3001 #define VSX_CVT_INT_TO_FP_VECTOR(op, stp, ttp, sfld, tfld) \
3002 void helper_##op(CPUPPCState *env, uint32_t opcode, \
3003 ppc_vsr_t *xt, ppc_vsr_t *xb) \
3005 ppc_vsr_t t = *xt; \
3007 t.tfld = stp##_to_##ttp(xb->sfld, &env->fp_status); \
3008 helper_compute_fprf_##ttp(env, t.tfld); \
3010 *xt = t; \
3011 do_float_check_status(env, GETPC()); \
3014 VSX_CVT_INT_TO_FP_VECTOR(xscvsdqp, int64, float128, VsrD(0), f128)
3015 VSX_CVT_INT_TO_FP_VECTOR(xscvudqp, uint64, float128, VsrD(0), f128)
3018 * For "use current rounding mode", define a value that will not be
3019 * one of the existing rounding model enums.
3021 #define FLOAT_ROUND_CURRENT (float_round_nearest_even + float_round_down + \
3022 float_round_up + float_round_to_zero)
3025 * VSX_ROUND - VSX floating point round
3026 * op - instruction mnemonic
3027 * nels - number of elements (1, 2 or 4)
3028 * tp - type (float32 or float64)
3029 * fld - vsr_t field (VsrD(*) or VsrW(*))
3030 * rmode - rounding mode
3031 * sfprf - set FPRF
3033 #define VSX_ROUND(op, nels, tp, fld, rmode, sfprf) \
3034 void helper_##op(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb) \
3036 ppc_vsr_t t = { }; \
3037 int i; \
3038 FloatRoundMode curr_rounding_mode; \
3040 if (rmode != FLOAT_ROUND_CURRENT) { \
3041 curr_rounding_mode = get_float_rounding_mode(&env->fp_status); \
3042 set_float_rounding_mode(rmode, &env->fp_status); \
3045 for (i = 0; i < nels; i++) { \
3046 if (unlikely(tp##_is_signaling_nan(xb->fld, \
3047 &env->fp_status))) { \
3048 float_invalid_op_vxsnan(env, GETPC()); \
3049 t.fld = tp##_snan_to_qnan(xb->fld); \
3050 } else { \
3051 t.fld = tp##_round_to_int(xb->fld, &env->fp_status); \
3053 if (sfprf) { \
3054 helper_compute_fprf_float64(env, t.fld); \
3058 /* \
3059 * If this is not a "use current rounding mode" instruction, \
3060 * then inhibit setting of the XX bit and restore rounding \
3061 * mode from FPSCR \
3062 */ \
3063 if (rmode != FLOAT_ROUND_CURRENT) { \
3064 set_float_rounding_mode(curr_rounding_mode, &env->fp_status); \
3065 env->fp_status.float_exception_flags &= ~float_flag_inexact; \
3068 *xt = t; \
3069 do_float_check_status(env, GETPC()); \
3072 VSX_ROUND(xsrdpi, 1, float64, VsrD(0), float_round_ties_away, 1)
3073 VSX_ROUND(xsrdpic, 1, float64, VsrD(0), FLOAT_ROUND_CURRENT, 1)
3074 VSX_ROUND(xsrdpim, 1, float64, VsrD(0), float_round_down, 1)
3075 VSX_ROUND(xsrdpip, 1, float64, VsrD(0), float_round_up, 1)
3076 VSX_ROUND(xsrdpiz, 1, float64, VsrD(0), float_round_to_zero, 1)
3078 VSX_ROUND(xvrdpi, 2, float64, VsrD(i), float_round_ties_away, 0)
3079 VSX_ROUND(xvrdpic, 2, float64, VsrD(i), FLOAT_ROUND_CURRENT, 0)
3080 VSX_ROUND(xvrdpim, 2, float64, VsrD(i), float_round_down, 0)
3081 VSX_ROUND(xvrdpip, 2, float64, VsrD(i), float_round_up, 0)
3082 VSX_ROUND(xvrdpiz, 2, float64, VsrD(i), float_round_to_zero, 0)
3084 VSX_ROUND(xvrspi, 4, float32, VsrW(i), float_round_ties_away, 0)
3085 VSX_ROUND(xvrspic, 4, float32, VsrW(i), FLOAT_ROUND_CURRENT, 0)
3086 VSX_ROUND(xvrspim, 4, float32, VsrW(i), float_round_down, 0)
3087 VSX_ROUND(xvrspip, 4, float32, VsrW(i), float_round_up, 0)
3088 VSX_ROUND(xvrspiz, 4, float32, VsrW(i), float_round_to_zero, 0)
3090 uint64_t helper_xsrsp(CPUPPCState *env, uint64_t xb)
3092 helper_reset_fpstatus(env);
3094 uint64_t xt = do_frsp(env, xb, GETPC());
3096 helper_compute_fprf_float64(env, xt);
3097 do_float_check_status(env, GETPC());
3098 return xt;
3101 void helper_xvxsigsp(CPUPPCState *env, ppc_vsr_t *xt, ppc_vsr_t *xb)
3103 ppc_vsr_t t = { };
3104 uint32_t exp, i, fraction;
3106 for (i = 0; i < 4; i++) {
3107 exp = (xb->VsrW(i) >> 23) & 0xFF;
3108 fraction = xb->VsrW(i) & 0x7FFFFF;
3109 if (exp != 0 && exp != 255) {
3110 t.VsrW(i) = fraction | 0x00800000;
3111 } else {
3112 t.VsrW(i) = fraction;
3115 *xt = t;
3119 * VSX_TEST_DC - VSX floating point test data class
3120 * op - instruction mnemonic
3121 * nels - number of elements (1, 2 or 4)
3122 * xbn - VSR register number
3123 * tp - type (float32 or float64)
3124 * fld - vsr_t field (VsrD(*) or VsrW(*))
3125 * tfld - target vsr_t field (VsrD(*) or VsrW(*))
3126 * fld_max - target field max
3127 * scrf - set result in CR and FPCC
3129 #define VSX_TEST_DC(op, nels, xbn, tp, fld, tfld, fld_max, scrf) \
3130 void helper_##op(CPUPPCState *env, uint32_t opcode) \
3132 ppc_vsr_t *xt = &env->vsr[xT(opcode)]; \
3133 ppc_vsr_t *xb = &env->vsr[xbn]; \
3134 ppc_vsr_t t = { }; \
3135 uint32_t i, sign, dcmx; \
3136 uint32_t cc, match = 0; \
3138 if (!scrf) { \
3139 dcmx = DCMX_XV(opcode); \
3140 } else { \
3141 t = *xt; \
3142 dcmx = DCMX(opcode); \
3145 for (i = 0; i < nels; i++) { \
3146 sign = tp##_is_neg(xb->fld); \
3147 if (tp##_is_any_nan(xb->fld)) { \
3148 match = extract32(dcmx, 6, 1); \
3149 } else if (tp##_is_infinity(xb->fld)) { \
3150 match = extract32(dcmx, 4 + !sign, 1); \
3151 } else if (tp##_is_zero(xb->fld)) { \
3152 match = extract32(dcmx, 2 + !sign, 1); \
3153 } else if (tp##_is_zero_or_denormal(xb->fld)) { \
3154 match = extract32(dcmx, 0 + !sign, 1); \
3157 if (scrf) { \
3158 cc = sign << CRF_LT_BIT | match << CRF_EQ_BIT; \
3159 env->fpscr &= ~FP_FPCC; \
3160 env->fpscr |= cc << FPSCR_FPCC; \
3161 env->crf[BF(opcode)] = cc; \
3162 } else { \
3163 t.tfld = match ? fld_max : 0; \
3165 match = 0; \
3167 if (!scrf) { \
3168 *xt = t; \
3172 VSX_TEST_DC(xvtstdcdp, 2, xB(opcode), float64, VsrD(i), VsrD(i), UINT64_MAX, 0)
3173 VSX_TEST_DC(xvtstdcsp, 4, xB(opcode), float32, VsrW(i), VsrW(i), UINT32_MAX, 0)
3174 VSX_TEST_DC(xststdcdp, 1, xB(opcode), float64, VsrD(0), VsrD(0), 0, 1)
3175 VSX_TEST_DC(xststdcqp, 1, (rB(opcode) + 32), float128, f128, VsrD(0), 0, 1)
3177 void helper_xststdcsp(CPUPPCState *env, uint32_t opcode, ppc_vsr_t *xb)
3179 uint32_t dcmx, sign, exp;
3180 uint32_t cc, match = 0, not_sp = 0;
3181 float64 arg = xb->VsrD(0);
3182 float64 arg_sp;
3184 dcmx = DCMX(opcode);
3185 exp = (arg >> 52) & 0x7FF;
3186 sign = float64_is_neg(arg);
3188 if (float64_is_any_nan(arg)) {
3189 match = extract32(dcmx, 6, 1);
3190 } else if (float64_is_infinity(arg)) {
3191 match = extract32(dcmx, 4 + !sign, 1);
3192 } else if (float64_is_zero(arg)) {
3193 match = extract32(dcmx, 2 + !sign, 1);
3194 } else if (float64_is_zero_or_denormal(arg) || (exp > 0 && exp < 0x381)) {
3195 match = extract32(dcmx, 0 + !sign, 1);
3198 arg_sp = helper_todouble(helper_tosingle(arg));
3199 not_sp = arg != arg_sp;
3201 cc = sign << CRF_LT_BIT | match << CRF_EQ_BIT | not_sp << CRF_SO_BIT;
3202 env->fpscr &= ~FP_FPCC;
3203 env->fpscr |= cc << FPSCR_FPCC;
3204 env->crf[BF(opcode)] = cc;
3207 void helper_xsrqpi(CPUPPCState *env, uint32_t opcode,
3208 ppc_vsr_t *xt, ppc_vsr_t *xb)
3210 ppc_vsr_t t = { };
3211 uint8_t r = Rrm(opcode);
3212 uint8_t ex = Rc(opcode);
3213 uint8_t rmc = RMC(opcode);
3214 uint8_t rmode = 0;
3215 float_status tstat;
3217 helper_reset_fpstatus(env);
3219 if (r == 0 && rmc == 0) {
3220 rmode = float_round_ties_away;
3221 } else if (r == 0 && rmc == 0x3) {
3222 rmode = fpscr_rn;
3223 } else if (r == 1) {
3224 switch (rmc) {
3225 case 0:
3226 rmode = float_round_nearest_even;
3227 break;
3228 case 1:
3229 rmode = float_round_to_zero;
3230 break;
3231 case 2:
3232 rmode = float_round_up;
3233 break;
3234 case 3:
3235 rmode = float_round_down;
3236 break;
3237 default:
3238 abort();
3242 tstat = env->fp_status;
3243 set_float_exception_flags(0, &tstat);
3244 set_float_rounding_mode(rmode, &tstat);
3245 t.f128 = float128_round_to_int(xb->f128, &tstat);
3246 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
3248 if (unlikely(tstat.float_exception_flags & float_flag_invalid_snan)) {
3249 float_invalid_op_vxsnan(env, GETPC());
3252 if (ex == 0 && (tstat.float_exception_flags & float_flag_inexact)) {
3253 env->fp_status.float_exception_flags &= ~float_flag_inexact;
3256 helper_compute_fprf_float128(env, t.f128);
3257 do_float_check_status(env, GETPC());
3258 *xt = t;
3261 void helper_xsrqpxp(CPUPPCState *env, uint32_t opcode,
3262 ppc_vsr_t *xt, ppc_vsr_t *xb)
3264 ppc_vsr_t t = { };
3265 uint8_t r = Rrm(opcode);
3266 uint8_t rmc = RMC(opcode);
3267 uint8_t rmode = 0;
3268 floatx80 round_res;
3269 float_status tstat;
3271 helper_reset_fpstatus(env);
3273 if (r == 0 && rmc == 0) {
3274 rmode = float_round_ties_away;
3275 } else if (r == 0 && rmc == 0x3) {
3276 rmode = fpscr_rn;
3277 } else if (r == 1) {
3278 switch (rmc) {
3279 case 0:
3280 rmode = float_round_nearest_even;
3281 break;
3282 case 1:
3283 rmode = float_round_to_zero;
3284 break;
3285 case 2:
3286 rmode = float_round_up;
3287 break;
3288 case 3:
3289 rmode = float_round_down;
3290 break;
3291 default:
3292 abort();
3296 tstat = env->fp_status;
3297 set_float_exception_flags(0, &tstat);
3298 set_float_rounding_mode(rmode, &tstat);
3299 round_res = float128_to_floatx80(xb->f128, &tstat);
3300 t.f128 = floatx80_to_float128(round_res, &tstat);
3301 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
3303 if (unlikely(tstat.float_exception_flags & float_flag_invalid_snan)) {
3304 float_invalid_op_vxsnan(env, GETPC());
3305 t.f128 = float128_snan_to_qnan(t.f128);
3308 helper_compute_fprf_float128(env, t.f128);
3309 *xt = t;
3310 do_float_check_status(env, GETPC());
3313 void helper_xssqrtqp(CPUPPCState *env, uint32_t opcode,
3314 ppc_vsr_t *xt, ppc_vsr_t *xb)
3316 ppc_vsr_t t = { };
3317 float_status tstat;
3319 helper_reset_fpstatus(env);
3321 tstat = env->fp_status;
3322 if (unlikely(Rc(opcode) != 0)) {
3323 tstat.float_rounding_mode = float_round_to_odd;
3326 set_float_exception_flags(0, &tstat);
3327 t.f128 = float128_sqrt(xb->f128, &tstat);
3328 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
3330 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) {
3331 float_invalid_op_sqrt(env, tstat.float_exception_flags, 1, GETPC());
3334 helper_compute_fprf_float128(env, t.f128);
3335 *xt = t;
3336 do_float_check_status(env, GETPC());
3339 void helper_xssubqp(CPUPPCState *env, uint32_t opcode,
3340 ppc_vsr_t *xt, ppc_vsr_t *xa, ppc_vsr_t *xb)
3342 ppc_vsr_t t = *xt;
3343 float_status tstat;
3345 helper_reset_fpstatus(env);
3347 tstat = env->fp_status;
3348 if (unlikely(Rc(opcode) != 0)) {
3349 tstat.float_rounding_mode = float_round_to_odd;
3352 set_float_exception_flags(0, &tstat);
3353 t.f128 = float128_sub(xa->f128, xb->f128, &tstat);
3354 env->fp_status.float_exception_flags |= tstat.float_exception_flags;
3356 if (unlikely(tstat.float_exception_flags & float_flag_invalid)) {
3357 float_invalid_op_addsub(env, tstat.float_exception_flags, 1, GETPC());
3360 helper_compute_fprf_float128(env, t.f128);
3361 *xt = t;
3362 do_float_check_status(env, GETPC());