2 * MIPS SIMD Architecture Module Instruction emulation helpers for QEMU.
4 * Copyright (c) 2014 Imagination Technologies
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
20 #include "qemu/osdep.h"
23 #include "exec/exec-all.h"
24 #include "exec/helper-proto.h"
26 /* Data format min and max values */
27 #define DF_BITS(df) (1 << ((df) + 3))
29 #define DF_MAX_INT(df) (int64_t)((1LL << (DF_BITS(df) - 1)) - 1)
30 #define M_MAX_INT(m) (int64_t)((1LL << ((m) - 1)) - 1)
32 #define DF_MIN_INT(df) (int64_t)(-(1LL << (DF_BITS(df) - 1)))
33 #define M_MIN_INT(m) (int64_t)(-(1LL << ((m) - 1)))
35 #define DF_MAX_UINT(df) (uint64_t)(-1ULL >> (64 - DF_BITS(df)))
36 #define M_MAX_UINT(m) (uint64_t)(-1ULL >> (64 - (m)))
38 #define UNSIGNED(x, df) ((x) & DF_MAX_UINT(df))
39 #define SIGNED(x, df) \
40 ((((int64_t)x) << (64 - DF_BITS(df))) >> (64 - DF_BITS(df)))
42 /* Element-by-element access macros */
43 #define DF_ELEMENTS(df) (MSA_WRLEN / DF_BITS(df))
51 * +---------------+----------------------------------------------------------+
52 * | NLOC.B | Vector Leading Ones Count (byte) |
53 * | NLOC.H | Vector Leading Ones Count (halfword) |
54 * | NLOC.W | Vector Leading Ones Count (word) |
55 * | NLOC.D | Vector Leading Ones Count (doubleword) |
56 * | NLZC.B | Vector Leading Zeros Count (byte) |
57 * | NLZC.H | Vector Leading Zeros Count (halfword) |
58 * | NLZC.W | Vector Leading Zeros Count (word) |
59 * | NLZC.D | Vector Leading Zeros Count (doubleword) |
60 * | PCNT.B | Vector Population Count (byte) |
61 * | PCNT.H | Vector Population Count (halfword) |
62 * | PCNT.W | Vector Population Count (word) |
63 * | PCNT.D | Vector Population Count (doubleword) |
64 * +---------------+----------------------------------------------------------+
67 /* TODO: insert Bit Count group helpers here */
74 * +---------------+----------------------------------------------------------+
75 * | BINSL.B | Vector Bit Insert Left (byte) |
76 * | BINSL.H | Vector Bit Insert Left (halfword) |
77 * | BINSL.W | Vector Bit Insert Left (word) |
78 * | BINSL.D | Vector Bit Insert Left (doubleword) |
79 * | BINSR.B | Vector Bit Insert Right (byte) |
80 * | BINSR.H | Vector Bit Insert Right (halfword) |
81 * | BINSR.W | Vector Bit Insert Right (word) |
82 * | BINSR.D | Vector Bit Insert Right (doubleword) |
83 * | BMNZ.V | Vector Bit Move If Not Zero |
84 * | BMZ.V | Vector Bit Move If Zero |
85 * | BSEL.V | Vector Bit Select |
86 * +---------------+----------------------------------------------------------+
89 /* TODO: insert Bit Move group helpers here */
96 * +---------------+----------------------------------------------------------+
97 * | BCLR.B | Vector Bit Clear (byte) |
98 * | BCLR.H | Vector Bit Clear (halfword) |
99 * | BCLR.W | Vector Bit Clear (word) |
100 * | BCLR.D | Vector Bit Clear (doubleword) |
101 * | BNEG.B | Vector Bit Negate (byte) |
102 * | BNEG.H | Vector Bit Negate (halfword) |
103 * | BNEG.W | Vector Bit Negate (word) |
104 * | BNEG.D | Vector Bit Negate (doubleword) |
105 * | BSET.B | Vector Bit Set (byte) |
106 * | BSET.H | Vector Bit Set (halfword) |
107 * | BSET.W | Vector Bit Set (word) |
108 * | BSET.D | Vector Bit Set (doubleword) |
109 * +---------------+----------------------------------------------------------+
112 /* TODO: insert Bit Set group helpers here */
119 * +---------------+----------------------------------------------------------+
120 * | MADD_Q.H | Vector Fixed-Point Multiply and Add (halfword) |
121 * | MADD_Q.W | Vector Fixed-Point Multiply and Add (word) |
122 * | MADDR_Q.H | Vector Fixed-Point Multiply and Add Rounded (halfword) |
123 * | MADDR_Q.W | Vector Fixed-Point Multiply and Add Rounded (word) |
124 * | MSUB_Q.H | Vector Fixed-Point Multiply and Subtr. (halfword) |
125 * | MSUB_Q.W | Vector Fixed-Point Multiply and Subtr. (word) |
126 * | MSUBR_Q.H | Vector Fixed-Point Multiply and Subtr. Rounded (halfword)|
127 * | MSUBR_Q.W | Vector Fixed-Point Multiply and Subtr. Rounded (word) |
128 * | MUL_Q.H | Vector Fixed-Point Multiply (halfword) |
129 * | MUL_Q.W | Vector Fixed-Point Multiply (word) |
130 * | MULR_Q.H | Vector Fixed-Point Multiply Rounded (halfword) |
131 * | MULR_Q.W | Vector Fixed-Point Multiply Rounded (word) |
132 * +---------------+----------------------------------------------------------+
135 /* TODO: insert Fixed Multiply group helpers here */
142 * +---------------+----------------------------------------------------------+
143 * | FMAX_A.W | Vector Floating-Point Maximum (Absolute) (word) |
144 * | FMAX_A.D | Vector Floating-Point Maximum (Absolute) (doubleword) |
145 * | FMAX.W | Vector Floating-Point Maximum (word) |
146 * | FMAX.D | Vector Floating-Point Maximum (doubleword) |
147 * | FMIN_A.W | Vector Floating-Point Minimum (Absolute) (word) |
148 * | FMIN_A.D | Vector Floating-Point Minimum (Absolute) (doubleword) |
149 * | FMIN.W | Vector Floating-Point Minimum (word) |
150 * | FMIN.D | Vector Floating-Point Minimum (doubleword) |
151 * +---------------+----------------------------------------------------------+
154 /* TODO: insert Float Max Min group helpers here */
161 * +---------------+----------------------------------------------------------+
162 * | ADD_A.B | Vector Add Absolute Values (byte) |
163 * | ADD_A.H | Vector Add Absolute Values (halfword) |
164 * | ADD_A.W | Vector Add Absolute Values (word) |
165 * | ADD_A.D | Vector Add Absolute Values (doubleword) |
166 * | ADDS_A.B | Vector Signed Saturated Add (of Absolute) (byte) |
167 * | ADDS_A.H | Vector Signed Saturated Add (of Absolute) (halfword) |
168 * | ADDS_A.W | Vector Signed Saturated Add (of Absolute) (word) |
169 * | ADDS_A.D | Vector Signed Saturated Add (of Absolute) (doubleword) |
170 * | ADDS_S.B | Vector Signed Saturated Add (of Signed) (byte) |
171 * | ADDS_S.H | Vector Signed Saturated Add (of Signed) (halfword) |
172 * | ADDS_S.W | Vector Signed Saturated Add (of Signed) (word) |
173 * | ADDS_S.D | Vector Signed Saturated Add (of Signed) (doubleword) |
174 * | ADDS_U.B | Vector Unsigned Saturated Add (of Unsigned) (byte) |
175 * | ADDS_U.H | Vector Unsigned Saturated Add (of Unsigned) (halfword) |
176 * | ADDS_U.W | Vector Unsigned Saturated Add (of Unsigned) (word) |
177 * | ADDS_U.D | Vector Unsigned Saturated Add (of Unsigned) (doubleword) |
178 * | ADDV.B | Vector Add (byte) |
179 * | ADDV.H | Vector Add (halfword) |
180 * | ADDV.W | Vector Add (word) |
181 * | ADDV.D | Vector Add (doubleword) |
182 * | HADD_S.H | Vector Signed Horizontal Add (halfword) |
183 * | HADD_S.W | Vector Signed Horizontal Add (word) |
184 * | HADD_S.D | Vector Signed Horizontal Add (doubleword) |
185 * | HADD_U.H | Vector Unigned Horizontal Add (halfword) |
186 * | HADD_U.W | Vector Unigned Horizontal Add (word) |
187 * | HADD_U.D | Vector Unigned Horizontal Add (doubleword) |
188 * +---------------+----------------------------------------------------------+
191 /* TODO: insert Int Add group helpers here */
198 * +---------------+----------------------------------------------------------+
199 * | AVE_S.B | Vector Signed Average (byte) |
200 * | AVE_S.H | Vector Signed Average (halfword) |
201 * | AVE_S.W | Vector Signed Average (word) |
202 * | AVE_S.D | Vector Signed Average (doubleword) |
203 * | AVE_U.B | Vector Unsigned Average (byte) |
204 * | AVE_U.H | Vector Unsigned Average (halfword) |
205 * | AVE_U.W | Vector Unsigned Average (word) |
206 * | AVE_U.D | Vector Unsigned Average (doubleword) |
207 * | AVER_S.B | Vector Signed Average Rounded (byte) |
208 * | AVER_S.H | Vector Signed Average Rounded (halfword) |
209 * | AVER_S.W | Vector Signed Average Rounded (word) |
210 * | AVER_S.D | Vector Signed Average Rounded (doubleword) |
211 * | AVER_U.B | Vector Unsigned Average Rounded (byte) |
212 * | AVER_U.H | Vector Unsigned Average Rounded (halfword) |
213 * | AVER_U.W | Vector Unsigned Average Rounded (word) |
214 * | AVER_U.D | Vector Unsigned Average Rounded (doubleword) |
215 * +---------------+----------------------------------------------------------+
218 /* TODO: insert Int Average group helpers here */
225 * +---------------+----------------------------------------------------------+
226 * | CEQ.B | Vector Compare Equal (byte) |
227 * | CEQ.H | Vector Compare Equal (halfword) |
228 * | CEQ.W | Vector Compare Equal (word) |
229 * | CEQ.D | Vector Compare Equal (doubleword) |
230 * | CLE_S.B | Vector Compare Signed Less Than or Equal (byte) |
231 * | CLE_S.H | Vector Compare Signed Less Than or Equal (halfword) |
232 * | CLE_S.W | Vector Compare Signed Less Than or Equal (word) |
233 * | CLE_S.D | Vector Compare Signed Less Than or Equal (doubleword) |
234 * | CLE_U.B | Vector Compare Unsigned Less Than or Equal (byte) |
235 * | CLE_U.H | Vector Compare Unsigned Less Than or Equal (halfword) |
236 * | CLE_U.W | Vector Compare Unsigned Less Than or Equal (word) |
237 * | CLE_U.D | Vector Compare Unsigned Less Than or Equal (doubleword) |
238 * | CLT_S.B | Vector Compare Signed Less Than (byte) |
239 * | CLT_S.H | Vector Compare Signed Less Than (halfword) |
240 * | CLT_S.W | Vector Compare Signed Less Than (word) |
241 * | CLT_S.D | Vector Compare Signed Less Than (doubleword) |
242 * | CLT_U.B | Vector Compare Unsigned Less Than (byte) |
243 * | CLT_U.H | Vector Compare Unsigned Less Than (halfword) |
244 * | CLT_U.W | Vector Compare Unsigned Less Than (word) |
245 * | CLT_U.D | Vector Compare Unsigned Less Than (doubleword) |
246 * +---------------+----------------------------------------------------------+
249 /* TODO: insert Int Compare group helpers here */
256 * +---------------+----------------------------------------------------------+
257 * | DIV_S.B | Vector Signed Divide (byte) |
258 * | DIV_S.H | Vector Signed Divide (halfword) |
259 * | DIV_S.W | Vector Signed Divide (word) |
260 * | DIV_S.D | Vector Signed Divide (doubleword) |
261 * | DIV_U.B | Vector Unsigned Divide (byte) |
262 * | DIV_U.H | Vector Unsigned Divide (halfword) |
263 * | DIV_U.W | Vector Unsigned Divide (word) |
264 * | DIV_U.D | Vector Unsigned Divide (doubleword) |
265 * +---------------+----------------------------------------------------------+
268 /* TODO: insert Int Divide group helpers here */
275 * +---------------+----------------------------------------------------------+
276 * | DOTP_S.H | Vector Signed Dot Product (halfword) |
277 * | DOTP_S.W | Vector Signed Dot Product (word) |
278 * | DOTP_S.D | Vector Signed Dot Product (doubleword) |
279 * | DOTP_U.H | Vector Unsigned Dot Product (halfword) |
280 * | DOTP_U.W | Vector Unsigned Dot Product (word) |
281 * | DOTP_U.D | Vector Unsigned Dot Product (doubleword) |
282 * | DPADD_S.H | Vector Signed Dot Product (halfword) |
283 * | DPADD_S.W | Vector Signed Dot Product (word) |
284 * | DPADD_S.D | Vector Signed Dot Product (doubleword) |
285 * | DPADD_U.H | Vector Unsigned Dot Product (halfword) |
286 * | DPADD_U.W | Vector Unsigned Dot Product (word) |
287 * | DPADD_U.D | Vector Unsigned Dot Product (doubleword) |
288 * | DPSUB_S.H | Vector Signed Dot Product (halfword) |
289 * | DPSUB_S.W | Vector Signed Dot Product (word) |
290 * | DPSUB_S.D | Vector Signed Dot Product (doubleword) |
291 * | DPSUB_U.H | Vector Unsigned Dot Product (halfword) |
292 * | DPSUB_U.W | Vector Unsigned Dot Product (word) |
293 * | DPSUB_U.D | Vector Unsigned Dot Product (doubleword) |
294 * +---------------+----------------------------------------------------------+
297 /* TODO: insert Int Dot Product group helpers here */
304 * +---------------+----------------------------------------------------------+
305 * | MAX_A.B | Vector Maximum Based on Absolute Value (byte) |
306 * | MAX_A.H | Vector Maximum Based on Absolute Value (halfword) |
307 * | MAX_A.W | Vector Maximum Based on Absolute Value (word) |
308 * | MAX_A.D | Vector Maximum Based on Absolute Value (doubleword) |
309 * | MAX_S.B | Vector Signed Maximum (byte) |
310 * | MAX_S.H | Vector Signed Maximum (halfword) |
311 * | MAX_S.W | Vector Signed Maximum (word) |
312 * | MAX_S.D | Vector Signed Maximum (doubleword) |
313 * | MAX_U.B | Vector Unsigned Maximum (byte) |
314 * | MAX_U.H | Vector Unsigned Maximum (halfword) |
315 * | MAX_U.W | Vector Unsigned Maximum (word) |
316 * | MAX_U.D | Vector Unsigned Maximum (doubleword) |
317 * | MIN_A.B | Vector Minimum Based on Absolute Value (byte) |
318 * | MIN_A.H | Vector Minimum Based on Absolute Value (halfword) |
319 * | MIN_A.W | Vector Minimum Based on Absolute Value (word) |
320 * | MIN_A.D | Vector Minimum Based on Absolute Value (doubleword) |
321 * | MIN_S.B | Vector Signed Minimum (byte) |
322 * | MIN_S.H | Vector Signed Minimum (halfword) |
323 * | MIN_S.W | Vector Signed Minimum (word) |
324 * | MIN_S.D | Vector Signed Minimum (doubleword) |
325 * | MIN_U.B | Vector Unsigned Minimum (byte) |
326 * | MIN_U.H | Vector Unsigned Minimum (halfword) |
327 * | MIN_U.W | Vector Unsigned Minimum (word) |
328 * | MIN_U.D | Vector Unsigned Minimum (doubleword) |
329 * +---------------+----------------------------------------------------------+
332 /* TODO: insert Int Max Min group helpers here */
339 * +---------------+----------------------------------------------------------+
340 * | MOD_S.B | Vector Signed Modulo (byte) |
341 * | MOD_S.H | Vector Signed Modulo (halfword) |
342 * | MOD_S.W | Vector Signed Modulo (word) |
343 * | MOD_S.D | Vector Signed Modulo (doubleword) |
344 * | MOD_U.B | Vector Unsigned Modulo (byte) |
345 * | MOD_U.H | Vector Unsigned Modulo (halfword) |
346 * | MOD_U.W | Vector Unsigned Modulo (word) |
347 * | MOD_U.D | Vector Unsigned Modulo (doubleword) |
348 * +---------------+----------------------------------------------------------+
351 /* TODO: insert Int Modulo group helpers here */
358 * +---------------+----------------------------------------------------------+
359 * | MADDV.B | Vector Multiply and Add (byte) |
360 * | MADDV.H | Vector Multiply and Add (halfword) |
361 * | MADDV.W | Vector Multiply and Add (word) |
362 * | MADDV.D | Vector Multiply and Add (doubleword) |
363 * | MSUBV.B | Vector Multiply and Subtract (byte) |
364 * | MSUBV.H | Vector Multiply and Subtract (halfword) |
365 * | MSUBV.W | Vector Multiply and Subtract (word) |
366 * | MSUBV.D | Vector Multiply and Subtract (doubleword) |
367 * | MULV.B | Vector Multiply (byte) |
368 * | MULV.H | Vector Multiply (halfword) |
369 * | MULV.W | Vector Multiply (word) |
370 * | MULV.D | Vector Multiply (doubleword) |
371 * +---------------+----------------------------------------------------------+
374 /* TODO: insert Int Multiply group helpers here */
381 * +---------------+----------------------------------------------------------+
382 * | ASUB_S.B | Vector Absolute Values of Signed Subtract (byte) |
383 * | ASUB_S.H | Vector Absolute Values of Signed Subtract (halfword) |
384 * | ASUB_S.W | Vector Absolute Values of Signed Subtract (word) |
385 * | ASUB_S.D | Vector Absolute Values of Signed Subtract (doubleword) |
386 * | ASUB_U.B | Vector Absolute Values of Unsigned Subtract (byte) |
387 * | ASUB_U.H | Vector Absolute Values of Unsigned Subtract (halfword) |
388 * | ASUB_U.W | Vector Absolute Values of Unsigned Subtract (word) |
389 * | ASUB_U.D | Vector Absolute Values of Unsigned Subtract (doubleword) |
390 * | HSUB_S.H | Vector Signed Horizontal Subtract (halfword) |
391 * | HSUB_S.W | Vector Signed Horizontal Subtract (word) |
392 * | HSUB_S.D | Vector Signed Horizontal Subtract (doubleword) |
393 * | HSUB_U.H | Vector Unigned Horizontal Subtract (halfword) |
394 * | HSUB_U.W | Vector Unigned Horizontal Subtract (word) |
395 * | HSUB_U.D | Vector Unigned Horizontal Subtract (doubleword) |
396 * | SUBS_S.B | Vector Signed Saturated Subtract (of Signed) (byte) |
397 * | SUBS_S.H | Vector Signed Saturated Subtract (of Signed) (halfword) |
398 * | SUBS_S.W | Vector Signed Saturated Subtract (of Signed) (word) |
399 * | SUBS_S.D | Vector Signed Saturated Subtract (of Signed) (doubleword)|
400 * | SUBS_U.B | Vector Unsigned Saturated Subtract (of Uns.) (byte) |
401 * | SUBS_U.H | Vector Unsigned Saturated Subtract (of Uns.) (halfword) |
402 * | SUBS_U.W | Vector Unsigned Saturated Subtract (of Uns.) (word) |
403 * | SUBS_U.D | Vector Unsigned Saturated Subtract (of Uns.) (doubleword)|
404 * | SUBSUS_U.B | Vector Uns. Sat. Subtract (of S. from Uns.) (byte) |
405 * | SUBSUS_U.H | Vector Uns. Sat. Subtract (of S. from Uns.) (halfword) |
406 * | SUBSUS_U.W | Vector Uns. Sat. Subtract (of S. from Uns.) (word) |
407 * | SUBSUS_U.D | Vector Uns. Sat. Subtract (of S. from Uns.) (doubleword) |
408 * | SUBSUU_S.B | Vector Signed Saturated Subtract (of Uns.) (byte) |
409 * | SUBSUU_S.H | Vector Signed Saturated Subtract (of Uns.) (halfword) |
410 * | SUBSUU_S.W | Vector Signed Saturated Subtract (of Uns.) (word) |
411 * | SUBSUU_S.D | Vector Signed Saturated Subtract (of Uns.) (doubleword) |
412 * | SUBV.B | Vector Subtract (byte) |
413 * | SUBV.H | Vector Subtract (halfword) |
414 * | SUBV.W | Vector Subtract (word) |
415 * | SUBV.D | Vector Subtract (doubleword) |
416 * +---------------+----------------------------------------------------------+
419 /* TODO: insert Int Subtract group helpers here */
426 * +---------------+----------------------------------------------------------+
427 * | ILVEV.B | Vector Interleave Even (byte) |
428 * | ILVEV.H | Vector Interleave Even (halfword) |
429 * | ILVEV.W | Vector Interleave Even (word) |
430 * | ILVEV.D | Vector Interleave Even (doubleword) |
431 * | ILVOD.B | Vector Interleave Odd (byte) |
432 * | ILVOD.H | Vector Interleave Odd (halfword) |
433 * | ILVOD.W | Vector Interleave Odd (word) |
434 * | ILVOD.D | Vector Interleave Odd (doubleword) |
435 * | ILVL.B | Vector Interleave Left (byte) |
436 * | ILVL.H | Vector Interleave Left (halfword) |
437 * | ILVL.W | Vector Interleave Left (word) |
438 * | ILVL.D | Vector Interleave Left (doubleword) |
439 * | ILVR.B | Vector Interleave Right (byte) |
440 * | ILVR.H | Vector Interleave Right (halfword) |
441 * | ILVR.W | Vector Interleave Right (word) |
442 * | ILVR.D | Vector Interleave Right (doubleword) |
443 * +---------------+----------------------------------------------------------+
446 /* TODO: insert Interleave group helpers here */
453 * +---------------+----------------------------------------------------------+
454 * | AND.V | Vector Logical And |
455 * | NOR.V | Vector Logical Negated Or |
456 * | OR.V | Vector Logical Or |
457 * | XOR.V | Vector Logical Exclusive Or |
458 * +---------------+----------------------------------------------------------+
461 /* TODO: insert Logic group helpers here */
468 * +---------------+----------------------------------------------------------+
469 * | MOVE.V | Vector Move |
470 * +---------------+----------------------------------------------------------+
473 /* TODO: insert Move group helpers here */
480 * +---------------+----------------------------------------------------------+
481 * | PCKEV.B | Vector Pack Even (byte) |
482 * | PCKEV.H | Vector Pack Even (halfword) |
483 * | PCKEV.W | Vector Pack Even (word) |
484 * | PCKEV.D | Vector Pack Even (doubleword) |
485 * | PCKOD.B | Vector Pack Odd (byte) |
486 * | PCKOD.H | Vector Pack Odd (halfword) |
487 * | PCKOD.W | Vector Pack Odd (word) |
488 * | PCKOD.D | Vector Pack Odd (doubleword) |
489 * | VSHF.B | Vector Data Preserving Shuffle (byte) |
490 * | VSHF.H | Vector Data Preserving Shuffle (halfword) |
491 * | VSHF.W | Vector Data Preserving Shuffle (word) |
492 * | VSHF.D | Vector Data Preserving Shuffle (doubleword) |
493 * +---------------+----------------------------------------------------------+
496 /* TODO: insert Pack group helpers here */
503 * +---------------+----------------------------------------------------------+
504 * | SLL.B | Vector Shift Left (byte) |
505 * | SLL.H | Vector Shift Left (halfword) |
506 * | SLL.W | Vector Shift Left (word) |
507 * | SLL.D | Vector Shift Left (doubleword) |
508 * | SRA.B | Vector Shift Right Arithmetic (byte) |
509 * | SRA.H | Vector Shift Right Arithmetic (halfword) |
510 * | SRA.W | Vector Shift Right Arithmetic (word) |
511 * | SRA.D | Vector Shift Right Arithmetic (doubleword) |
512 * | SRAR.B | Vector Shift Right Arithmetic Rounded (byte) |
513 * | SRAR.H | Vector Shift Right Arithmetic Rounded (halfword) |
514 * | SRAR.W | Vector Shift Right Arithmetic Rounded (word) |
515 * | SRAR.D | Vector Shift Right Arithmetic Rounded (doubleword) |
516 * | SRL.B | Vector Shift Right Logical (byte) |
517 * | SRL.H | Vector Shift Right Logical (halfword) |
518 * | SRL.W | Vector Shift Right Logical (word) |
519 * | SRL.D | Vector Shift Right Logical (doubleword) |
520 * | SRLR.B | Vector Shift Right Logical Rounded (byte) |
521 * | SRLR.H | Vector Shift Right Logical Rounded (halfword) |
522 * | SRLR.W | Vector Shift Right Logical Rounded (word) |
523 * | SRLR.D | Vector Shift Right Logical Rounded (doubleword) |
524 * +---------------+----------------------------------------------------------+
527 /* TODO: insert Shift group helpers here */
530 static inline void msa_move_v(wr_t
*pwd
, wr_t
*pws
)
534 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
535 pwd
->d
[i
] = pws
->d
[i
];
539 #define MSA_FN_IMM8(FUNC, DEST, OPERATION) \
540 void helper_msa_ ## FUNC(CPUMIPSState *env, uint32_t wd, uint32_t ws, \
543 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
544 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
546 for (i = 0; i < DF_ELEMENTS(DF_BYTE); i++) { \
551 MSA_FN_IMM8(andi_b
, pwd
->b
[i
], pws
->b
[i
] & i8
)
552 MSA_FN_IMM8(ori_b
, pwd
->b
[i
], pws
->b
[i
] | i8
)
553 MSA_FN_IMM8(nori_b
, pwd
->b
[i
], ~(pws
->b
[i
] | i8
))
554 MSA_FN_IMM8(xori_b
, pwd
->b
[i
], pws
->b
[i
] ^ i8
)
556 #define BIT_MOVE_IF_NOT_ZERO(dest, arg1, arg2, df) \
557 UNSIGNED(((dest & (~arg2)) | (arg1 & arg2)), df)
558 MSA_FN_IMM8(bmnzi_b
, pwd
->b
[i
],
559 BIT_MOVE_IF_NOT_ZERO(pwd
->b
[i
], pws
->b
[i
], i8
, DF_BYTE
))
561 #define BIT_MOVE_IF_ZERO(dest, arg1, arg2, df) \
562 UNSIGNED((dest & arg2) | (arg1 & (~arg2)), df)
563 MSA_FN_IMM8(bmzi_b
, pwd
->b
[i
],
564 BIT_MOVE_IF_ZERO(pwd
->b
[i
], pws
->b
[i
], i8
, DF_BYTE
))
566 #define BIT_SELECT(dest, arg1, arg2, df) \
567 UNSIGNED((arg1 & (~dest)) | (arg2 & dest), df)
568 MSA_FN_IMM8(bseli_b
, pwd
->b
[i
],
569 BIT_SELECT(pwd
->b
[i
], pws
->b
[i
], i8
, DF_BYTE
))
573 #define SHF_POS(i, imm) (((i) & 0xfc) + (((imm) >> (2 * ((i) & 0x03))) & 0x03))
575 void helper_msa_shf_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
576 uint32_t ws
, uint32_t imm
)
578 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
579 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
585 for (i
= 0; i
< DF_ELEMENTS(DF_BYTE
); i
++) {
586 pwx
->b
[i
] = pws
->b
[SHF_POS(i
, imm
)];
590 for (i
= 0; i
< DF_ELEMENTS(DF_HALF
); i
++) {
591 pwx
->h
[i
] = pws
->h
[SHF_POS(i
, imm
)];
595 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
596 pwx
->w
[i
] = pws
->w
[SHF_POS(i
, imm
)];
602 msa_move_v(pwd
, pwx
);
605 #define MSA_FN_VECTOR(FUNC, DEST, OPERATION) \
606 void helper_msa_ ## FUNC(CPUMIPSState *env, uint32_t wd, uint32_t ws, \
609 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
610 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
611 wr_t *pwt = &(env->active_fpu.fpr[wt].wr); \
613 for (i = 0; i < DF_ELEMENTS(DF_DOUBLE); i++) { \
618 MSA_FN_VECTOR(bmnz_v
, pwd
->d
[i
],
619 BIT_MOVE_IF_NOT_ZERO(pwd
->d
[i
], pws
->d
[i
], pwt
->d
[i
], DF_DOUBLE
))
620 MSA_FN_VECTOR(bmz_v
, pwd
->d
[i
],
621 BIT_MOVE_IF_ZERO(pwd
->d
[i
], pws
->d
[i
], pwt
->d
[i
], DF_DOUBLE
))
622 MSA_FN_VECTOR(bsel_v
, pwd
->d
[i
],
623 BIT_SELECT(pwd
->d
[i
], pws
->d
[i
], pwt
->d
[i
], DF_DOUBLE
))
624 #undef BIT_MOVE_IF_NOT_ZERO
625 #undef BIT_MOVE_IF_ZERO
629 void helper_msa_and_v(CPUMIPSState
*env
, uint32_t wd
, uint32_t ws
, uint32_t wt
)
631 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
632 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
633 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
635 pwd
->d
[0] = pws
->d
[0] & pwt
->d
[0];
636 pwd
->d
[1] = pws
->d
[1] & pwt
->d
[1];
639 void helper_msa_or_v(CPUMIPSState
*env
, uint32_t wd
, uint32_t ws
, uint32_t wt
)
641 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
642 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
643 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
645 pwd
->d
[0] = pws
->d
[0] | pwt
->d
[0];
646 pwd
->d
[1] = pws
->d
[1] | pwt
->d
[1];
649 void helper_msa_nor_v(CPUMIPSState
*env
, uint32_t wd
, uint32_t ws
, uint32_t wt
)
651 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
652 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
653 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
655 pwd
->d
[0] = ~(pws
->d
[0] | pwt
->d
[0]);
656 pwd
->d
[1] = ~(pws
->d
[1] | pwt
->d
[1]);
659 void helper_msa_xor_v(CPUMIPSState
*env
, uint32_t wd
, uint32_t ws
, uint32_t wt
)
661 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
662 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
663 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
665 pwd
->d
[0] = pws
->d
[0] ^ pwt
->d
[0];
666 pwd
->d
[1] = pws
->d
[1] ^ pwt
->d
[1];
669 static inline int64_t msa_addv_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
674 static inline int64_t msa_subv_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
679 static inline int64_t msa_ceq_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
681 return arg1
== arg2
? -1 : 0;
684 static inline int64_t msa_cle_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
686 return arg1
<= arg2
? -1 : 0;
689 static inline int64_t msa_cle_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
691 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
692 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
693 return u_arg1
<= u_arg2
? -1 : 0;
696 static inline int64_t msa_clt_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
698 return arg1
< arg2
? -1 : 0;
701 static inline int64_t msa_clt_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
703 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
704 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
705 return u_arg1
< u_arg2
? -1 : 0;
708 static inline int64_t msa_max_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
710 return arg1
> arg2
? arg1
: arg2
;
713 static inline int64_t msa_max_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
715 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
716 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
717 return u_arg1
> u_arg2
? arg1
: arg2
;
720 static inline int64_t msa_min_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
722 return arg1
< arg2
? arg1
: arg2
;
725 static inline int64_t msa_min_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
727 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
728 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
729 return u_arg1
< u_arg2
? arg1
: arg2
;
732 #define MSA_BINOP_IMM_DF(helper, func) \
733 void helper_msa_ ## helper ## _df(CPUMIPSState *env, uint32_t df, \
734 uint32_t wd, uint32_t ws, int32_t u5) \
736 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
737 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
742 for (i = 0; i < DF_ELEMENTS(DF_BYTE); i++) { \
743 pwd->b[i] = msa_ ## func ## _df(df, pws->b[i], u5); \
747 for (i = 0; i < DF_ELEMENTS(DF_HALF); i++) { \
748 pwd->h[i] = msa_ ## func ## _df(df, pws->h[i], u5); \
752 for (i = 0; i < DF_ELEMENTS(DF_WORD); i++) { \
753 pwd->w[i] = msa_ ## func ## _df(df, pws->w[i], u5); \
757 for (i = 0; i < DF_ELEMENTS(DF_DOUBLE); i++) { \
758 pwd->d[i] = msa_ ## func ## _df(df, pws->d[i], u5); \
766 MSA_BINOP_IMM_DF(addvi
, addv
)
767 MSA_BINOP_IMM_DF(subvi
, subv
)
768 MSA_BINOP_IMM_DF(ceqi
, ceq
)
769 MSA_BINOP_IMM_DF(clei_s
, cle_s
)
770 MSA_BINOP_IMM_DF(clei_u
, cle_u
)
771 MSA_BINOP_IMM_DF(clti_s
, clt_s
)
772 MSA_BINOP_IMM_DF(clti_u
, clt_u
)
773 MSA_BINOP_IMM_DF(maxi_s
, max_s
)
774 MSA_BINOP_IMM_DF(maxi_u
, max_u
)
775 MSA_BINOP_IMM_DF(mini_s
, min_s
)
776 MSA_BINOP_IMM_DF(mini_u
, min_u
)
777 #undef MSA_BINOP_IMM_DF
779 void helper_msa_ldi_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
782 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
787 for (i
= 0; i
< DF_ELEMENTS(DF_BYTE
); i
++) {
788 pwd
->b
[i
] = (int8_t)s10
;
792 for (i
= 0; i
< DF_ELEMENTS(DF_HALF
); i
++) {
793 pwd
->h
[i
] = (int16_t)s10
;
797 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
798 pwd
->w
[i
] = (int32_t)s10
;
802 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
803 pwd
->d
[i
] = (int64_t)s10
;
811 /* Data format bit position and unsigned values */
812 #define BIT_POSITION(x, df) ((uint64_t)(x) % DF_BITS(df))
814 static inline int64_t msa_sll_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
816 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
817 return arg1
<< b_arg2
;
820 static inline int64_t msa_sra_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
822 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
823 return arg1
>> b_arg2
;
826 static inline int64_t msa_srl_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
828 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
829 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
830 return u_arg1
>> b_arg2
;
833 static inline int64_t msa_bclr_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
835 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
836 return UNSIGNED(arg1
& (~(1LL << b_arg2
)), df
);
839 static inline int64_t msa_bset_df(uint32_t df
, int64_t arg1
,
842 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
843 return UNSIGNED(arg1
| (1LL << b_arg2
), df
);
846 static inline int64_t msa_bneg_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
848 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
849 return UNSIGNED(arg1
^ (1LL << b_arg2
), df
);
852 static inline int64_t msa_binsl_df(uint32_t df
, int64_t dest
, int64_t arg1
,
855 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
856 uint64_t u_dest
= UNSIGNED(dest
, df
);
857 int32_t sh_d
= BIT_POSITION(arg2
, df
) + 1;
858 int32_t sh_a
= DF_BITS(df
) - sh_d
;
859 if (sh_d
== DF_BITS(df
)) {
862 return UNSIGNED(UNSIGNED(u_dest
<< sh_d
, df
) >> sh_d
, df
) |
863 UNSIGNED(UNSIGNED(u_arg1
>> sh_a
, df
) << sh_a
, df
);
867 static inline int64_t msa_binsr_df(uint32_t df
, int64_t dest
, int64_t arg1
,
870 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
871 uint64_t u_dest
= UNSIGNED(dest
, df
);
872 int32_t sh_d
= BIT_POSITION(arg2
, df
) + 1;
873 int32_t sh_a
= DF_BITS(df
) - sh_d
;
874 if (sh_d
== DF_BITS(df
)) {
877 return UNSIGNED(UNSIGNED(u_dest
>> sh_d
, df
) << sh_d
, df
) |
878 UNSIGNED(UNSIGNED(u_arg1
<< sh_a
, df
) >> sh_a
, df
);
882 static inline int64_t msa_sat_s_df(uint32_t df
, int64_t arg
, uint32_t m
)
884 return arg
< M_MIN_INT(m
+ 1) ? M_MIN_INT(m
+ 1) :
885 arg
> M_MAX_INT(m
+ 1) ? M_MAX_INT(m
+ 1) :
889 static inline int64_t msa_sat_u_df(uint32_t df
, int64_t arg
, uint32_t m
)
891 uint64_t u_arg
= UNSIGNED(arg
, df
);
892 return u_arg
< M_MAX_UINT(m
+ 1) ? u_arg
:
896 static inline int64_t msa_srar_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
898 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
902 int64_t r_bit
= (arg1
>> (b_arg2
- 1)) & 1;
903 return (arg1
>> b_arg2
) + r_bit
;
907 static inline int64_t msa_srlr_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
909 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
910 int32_t b_arg2
= BIT_POSITION(arg2
, df
);
914 uint64_t r_bit
= (u_arg1
>> (b_arg2
- 1)) & 1;
915 return (u_arg1
>> b_arg2
) + r_bit
;
919 #define MSA_BINOP_IMMU_DF(helper, func) \
920 void helper_msa_ ## helper ## _df(CPUMIPSState *env, uint32_t df, uint32_t wd, \
921 uint32_t ws, uint32_t u5) \
923 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
924 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
929 for (i = 0; i < DF_ELEMENTS(DF_BYTE); i++) { \
930 pwd->b[i] = msa_ ## func ## _df(df, pws->b[i], u5); \
934 for (i = 0; i < DF_ELEMENTS(DF_HALF); i++) { \
935 pwd->h[i] = msa_ ## func ## _df(df, pws->h[i], u5); \
939 for (i = 0; i < DF_ELEMENTS(DF_WORD); i++) { \
940 pwd->w[i] = msa_ ## func ## _df(df, pws->w[i], u5); \
944 for (i = 0; i < DF_ELEMENTS(DF_DOUBLE); i++) { \
945 pwd->d[i] = msa_ ## func ## _df(df, pws->d[i], u5); \
953 MSA_BINOP_IMMU_DF(slli
, sll
)
954 MSA_BINOP_IMMU_DF(srai
, sra
)
955 MSA_BINOP_IMMU_DF(srli
, srl
)
956 MSA_BINOP_IMMU_DF(bclri
, bclr
)
957 MSA_BINOP_IMMU_DF(bseti
, bset
)
958 MSA_BINOP_IMMU_DF(bnegi
, bneg
)
959 MSA_BINOP_IMMU_DF(sat_s
, sat_s
)
960 MSA_BINOP_IMMU_DF(sat_u
, sat_u
)
961 MSA_BINOP_IMMU_DF(srari
, srar
)
962 MSA_BINOP_IMMU_DF(srlri
, srlr
)
963 #undef MSA_BINOP_IMMU_DF
965 #define MSA_TEROP_IMMU_DF(helper, func) \
966 void helper_msa_ ## helper ## _df(CPUMIPSState *env, uint32_t df, \
967 uint32_t wd, uint32_t ws, uint32_t u5) \
969 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
970 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
975 for (i = 0; i < DF_ELEMENTS(DF_BYTE); i++) { \
976 pwd->b[i] = msa_ ## func ## _df(df, pwd->b[i], pws->b[i], \
981 for (i = 0; i < DF_ELEMENTS(DF_HALF); i++) { \
982 pwd->h[i] = msa_ ## func ## _df(df, pwd->h[i], pws->h[i], \
987 for (i = 0; i < DF_ELEMENTS(DF_WORD); i++) { \
988 pwd->w[i] = msa_ ## func ## _df(df, pwd->w[i], pws->w[i], \
993 for (i = 0; i < DF_ELEMENTS(DF_DOUBLE); i++) { \
994 pwd->d[i] = msa_ ## func ## _df(df, pwd->d[i], pws->d[i], \
1003 MSA_TEROP_IMMU_DF(binsli
, binsl
)
1004 MSA_TEROP_IMMU_DF(binsri
, binsr
)
1005 #undef MSA_TEROP_IMMU_DF
1007 static inline int64_t msa_max_a_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1009 uint64_t abs_arg1
= arg1
>= 0 ? arg1
: -arg1
;
1010 uint64_t abs_arg2
= arg2
>= 0 ? arg2
: -arg2
;
1011 return abs_arg1
> abs_arg2
? arg1
: arg2
;
1014 static inline int64_t msa_min_a_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1016 uint64_t abs_arg1
= arg1
>= 0 ? arg1
: -arg1
;
1017 uint64_t abs_arg2
= arg2
>= 0 ? arg2
: -arg2
;
1018 return abs_arg1
< abs_arg2
? arg1
: arg2
;
1021 static inline int64_t msa_add_a_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1023 uint64_t abs_arg1
= arg1
>= 0 ? arg1
: -arg1
;
1024 uint64_t abs_arg2
= arg2
>= 0 ? arg2
: -arg2
;
1025 return abs_arg1
+ abs_arg2
;
1028 static inline int64_t msa_adds_a_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1030 uint64_t max_int
= (uint64_t)DF_MAX_INT(df
);
1031 uint64_t abs_arg1
= arg1
>= 0 ? arg1
: -arg1
;
1032 uint64_t abs_arg2
= arg2
>= 0 ? arg2
: -arg2
;
1033 if (abs_arg1
> max_int
|| abs_arg2
> max_int
) {
1034 return (int64_t)max_int
;
1036 return (abs_arg1
< max_int
- abs_arg2
) ? abs_arg1
+ abs_arg2
: max_int
;
1040 static inline int64_t msa_adds_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1042 int64_t max_int
= DF_MAX_INT(df
);
1043 int64_t min_int
= DF_MIN_INT(df
);
1045 return (min_int
- arg1
< arg2
) ? arg1
+ arg2
: min_int
;
1047 return (arg2
< max_int
- arg1
) ? arg1
+ arg2
: max_int
;
1051 static inline uint64_t msa_adds_u_df(uint32_t df
, uint64_t arg1
, uint64_t arg2
)
1053 uint64_t max_uint
= DF_MAX_UINT(df
);
1054 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1055 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1056 return (u_arg1
< max_uint
- u_arg2
) ? u_arg1
+ u_arg2
: max_uint
;
1059 static inline int64_t msa_ave_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1062 return (arg1
>> 1) + (arg2
>> 1) + (arg1
& arg2
& 1);
1065 static inline uint64_t msa_ave_u_df(uint32_t df
, uint64_t arg1
, uint64_t arg2
)
1067 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1068 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1069 /* unsigned shift */
1070 return (u_arg1
>> 1) + (u_arg2
>> 1) + (u_arg1
& u_arg2
& 1);
1073 static inline int64_t msa_aver_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1076 return (arg1
>> 1) + (arg2
>> 1) + ((arg1
| arg2
) & 1);
1079 static inline uint64_t msa_aver_u_df(uint32_t df
, uint64_t arg1
, uint64_t arg2
)
1081 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1082 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1083 /* unsigned shift */
1084 return (u_arg1
>> 1) + (u_arg2
>> 1) + ((u_arg1
| u_arg2
) & 1);
1087 static inline int64_t msa_subs_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1089 int64_t max_int
= DF_MAX_INT(df
);
1090 int64_t min_int
= DF_MIN_INT(df
);
1092 return (min_int
+ arg2
< arg1
) ? arg1
- arg2
: min_int
;
1094 return (arg1
< max_int
+ arg2
) ? arg1
- arg2
: max_int
;
1098 static inline int64_t msa_subs_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1100 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1101 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1102 return (u_arg1
> u_arg2
) ? u_arg1
- u_arg2
: 0;
1105 static inline int64_t msa_subsus_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1107 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1108 uint64_t max_uint
= DF_MAX_UINT(df
);
1110 uint64_t u_arg2
= (uint64_t)arg2
;
1111 return (u_arg1
> u_arg2
) ?
1112 (int64_t)(u_arg1
- u_arg2
) :
1115 uint64_t u_arg2
= (uint64_t)(-arg2
);
1116 return (u_arg1
< max_uint
- u_arg2
) ?
1117 (int64_t)(u_arg1
+ u_arg2
) :
1122 static inline int64_t msa_subsuu_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1124 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1125 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1126 int64_t max_int
= DF_MAX_INT(df
);
1127 int64_t min_int
= DF_MIN_INT(df
);
1128 if (u_arg1
> u_arg2
) {
1129 return u_arg1
- u_arg2
< (uint64_t)max_int
?
1130 (int64_t)(u_arg1
- u_arg2
) :
1133 return u_arg2
- u_arg1
< (uint64_t)(-min_int
) ?
1134 (int64_t)(u_arg1
- u_arg2
) :
1139 static inline int64_t msa_asub_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1141 /* signed compare */
1142 return (arg1
< arg2
) ?
1143 (uint64_t)(arg2
- arg1
) : (uint64_t)(arg1
- arg2
);
1146 static inline uint64_t msa_asub_u_df(uint32_t df
, uint64_t arg1
, uint64_t arg2
)
1148 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1149 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1150 /* unsigned compare */
1151 return (u_arg1
< u_arg2
) ?
1152 (uint64_t)(u_arg2
- u_arg1
) : (uint64_t)(u_arg1
- u_arg2
);
1155 static inline int64_t msa_mulv_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1160 static inline int64_t msa_div_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1162 if (arg1
== DF_MIN_INT(df
) && arg2
== -1) {
1163 return DF_MIN_INT(df
);
1165 return arg2
? arg1
/ arg2
1166 : arg1
>= 0 ? -1 : 1;
1169 static inline int64_t msa_div_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1171 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1172 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1173 return arg2
? u_arg1
/ u_arg2
: -1;
1176 static inline int64_t msa_mod_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1178 if (arg1
== DF_MIN_INT(df
) && arg2
== -1) {
1181 return arg2
? arg1
% arg2
: arg1
;
1184 static inline int64_t msa_mod_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1186 uint64_t u_arg1
= UNSIGNED(arg1
, df
);
1187 uint64_t u_arg2
= UNSIGNED(arg2
, df
);
1188 return u_arg2
? u_arg1
% u_arg2
: u_arg1
;
1191 #define SIGNED_EVEN(a, df) \
1192 ((((int64_t)(a)) << (64 - DF_BITS(df) / 2)) >> (64 - DF_BITS(df) / 2))
1194 #define UNSIGNED_EVEN(a, df) \
1195 ((((uint64_t)(a)) << (64 - DF_BITS(df) / 2)) >> (64 - DF_BITS(df) / 2))
1197 #define SIGNED_ODD(a, df) \
1198 ((((int64_t)(a)) << (64 - DF_BITS(df))) >> (64 - DF_BITS(df) / 2))
1200 #define UNSIGNED_ODD(a, df) \
1201 ((((uint64_t)(a)) << (64 - DF_BITS(df))) >> (64 - DF_BITS(df) / 2))
1203 #define SIGNED_EXTRACT(e, o, a, df) \
1205 e = SIGNED_EVEN(a, df); \
1206 o = SIGNED_ODD(a, df); \
1209 #define UNSIGNED_EXTRACT(e, o, a, df) \
1211 e = UNSIGNED_EVEN(a, df); \
1212 o = UNSIGNED_ODD(a, df); \
1215 static inline int64_t msa_dotp_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1221 SIGNED_EXTRACT(even_arg1
, odd_arg1
, arg1
, df
);
1222 SIGNED_EXTRACT(even_arg2
, odd_arg2
, arg2
, df
);
1223 return (even_arg1
* even_arg2
) + (odd_arg1
* odd_arg2
);
1226 static inline int64_t msa_dotp_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1232 UNSIGNED_EXTRACT(even_arg1
, odd_arg1
, arg1
, df
);
1233 UNSIGNED_EXTRACT(even_arg2
, odd_arg2
, arg2
, df
);
1234 return (even_arg1
* even_arg2
) + (odd_arg1
* odd_arg2
);
1237 #define CONCATENATE_AND_SLIDE(s, k) \
1239 for (i = 0; i < s; i++) { \
1240 v[i] = pws->b[s * k + i]; \
1241 v[i + s] = pwd->b[s * k + i]; \
1243 for (i = 0; i < s; i++) { \
1244 pwd->b[s * k + i] = v[i + n]; \
1248 static inline void msa_sld_df(uint32_t df
, wr_t
*pwd
,
1249 wr_t
*pws
, target_ulong rt
)
1251 uint32_t n
= rt
% DF_ELEMENTS(df
);
1257 CONCATENATE_AND_SLIDE(DF_ELEMENTS(DF_BYTE
), 0);
1260 for (k
= 0; k
< 2; k
++) {
1261 CONCATENATE_AND_SLIDE(DF_ELEMENTS(DF_HALF
), k
);
1265 for (k
= 0; k
< 4; k
++) {
1266 CONCATENATE_AND_SLIDE(DF_ELEMENTS(DF_WORD
), k
);
1270 for (k
= 0; k
< 8; k
++) {
1271 CONCATENATE_AND_SLIDE(DF_ELEMENTS(DF_DOUBLE
), k
);
1279 static inline int64_t msa_hadd_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1281 return SIGNED_ODD(arg1
, df
) + SIGNED_EVEN(arg2
, df
);
1284 static inline int64_t msa_hadd_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1286 return UNSIGNED_ODD(arg1
, df
) + UNSIGNED_EVEN(arg2
, df
);
1289 static inline int64_t msa_hsub_s_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1291 return SIGNED_ODD(arg1
, df
) - SIGNED_EVEN(arg2
, df
);
1294 static inline int64_t msa_hsub_u_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1296 return UNSIGNED_ODD(arg1
, df
) - UNSIGNED_EVEN(arg2
, df
);
1299 static inline int64_t msa_mul_q_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1301 int64_t q_min
= DF_MIN_INT(df
);
1302 int64_t q_max
= DF_MAX_INT(df
);
1304 if (arg1
== q_min
&& arg2
== q_min
) {
1307 return (arg1
* arg2
) >> (DF_BITS(df
) - 1);
1310 static inline int64_t msa_mulr_q_df(uint32_t df
, int64_t arg1
, int64_t arg2
)
1312 int64_t q_min
= DF_MIN_INT(df
);
1313 int64_t q_max
= DF_MAX_INT(df
);
1314 int64_t r_bit
= 1 << (DF_BITS(df
) - 2);
1316 if (arg1
== q_min
&& arg2
== q_min
) {
1319 return (arg1
* arg2
+ r_bit
) >> (DF_BITS(df
) - 1);
1322 #define MSA_BINOP_DF(func) \
1323 void helper_msa_ ## func ## _df(CPUMIPSState *env, uint32_t df, \
1324 uint32_t wd, uint32_t ws, uint32_t wt) \
1326 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
1327 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
1328 wr_t *pwt = &(env->active_fpu.fpr[wt].wr); \
1332 pwd->b[0] = msa_ ## func ## _df(df, pws->b[0], pwt->b[0]); \
1333 pwd->b[1] = msa_ ## func ## _df(df, pws->b[1], pwt->b[1]); \
1334 pwd->b[2] = msa_ ## func ## _df(df, pws->b[2], pwt->b[2]); \
1335 pwd->b[3] = msa_ ## func ## _df(df, pws->b[3], pwt->b[3]); \
1336 pwd->b[4] = msa_ ## func ## _df(df, pws->b[4], pwt->b[4]); \
1337 pwd->b[5] = msa_ ## func ## _df(df, pws->b[5], pwt->b[5]); \
1338 pwd->b[6] = msa_ ## func ## _df(df, pws->b[6], pwt->b[6]); \
1339 pwd->b[7] = msa_ ## func ## _df(df, pws->b[7], pwt->b[7]); \
1340 pwd->b[8] = msa_ ## func ## _df(df, pws->b[8], pwt->b[8]); \
1341 pwd->b[9] = msa_ ## func ## _df(df, pws->b[9], pwt->b[9]); \
1342 pwd->b[10] = msa_ ## func ## _df(df, pws->b[10], pwt->b[10]); \
1343 pwd->b[11] = msa_ ## func ## _df(df, pws->b[11], pwt->b[11]); \
1344 pwd->b[12] = msa_ ## func ## _df(df, pws->b[12], pwt->b[12]); \
1345 pwd->b[13] = msa_ ## func ## _df(df, pws->b[13], pwt->b[13]); \
1346 pwd->b[14] = msa_ ## func ## _df(df, pws->b[14], pwt->b[14]); \
1347 pwd->b[15] = msa_ ## func ## _df(df, pws->b[15], pwt->b[15]); \
1350 pwd->h[0] = msa_ ## func ## _df(df, pws->h[0], pwt->h[0]); \
1351 pwd->h[1] = msa_ ## func ## _df(df, pws->h[1], pwt->h[1]); \
1352 pwd->h[2] = msa_ ## func ## _df(df, pws->h[2], pwt->h[2]); \
1353 pwd->h[3] = msa_ ## func ## _df(df, pws->h[3], pwt->h[3]); \
1354 pwd->h[4] = msa_ ## func ## _df(df, pws->h[4], pwt->h[4]); \
1355 pwd->h[5] = msa_ ## func ## _df(df, pws->h[5], pwt->h[5]); \
1356 pwd->h[6] = msa_ ## func ## _df(df, pws->h[6], pwt->h[6]); \
1357 pwd->h[7] = msa_ ## func ## _df(df, pws->h[7], pwt->h[7]); \
1360 pwd->w[0] = msa_ ## func ## _df(df, pws->w[0], pwt->w[0]); \
1361 pwd->w[1] = msa_ ## func ## _df(df, pws->w[1], pwt->w[1]); \
1362 pwd->w[2] = msa_ ## func ## _df(df, pws->w[2], pwt->w[2]); \
1363 pwd->w[3] = msa_ ## func ## _df(df, pws->w[3], pwt->w[3]); \
1366 pwd->d[0] = msa_ ## func ## _df(df, pws->d[0], pwt->d[0]); \
1367 pwd->d[1] = msa_ ## func ## _df(df, pws->d[1], pwt->d[1]); \
1394 MSA_BINOP_DF(adds_a
)
1395 MSA_BINOP_DF(adds_s
)
1396 MSA_BINOP_DF(adds_u
)
1399 MSA_BINOP_DF(aver_s
)
1400 MSA_BINOP_DF(aver_u
)
1401 MSA_BINOP_DF(subs_s
)
1402 MSA_BINOP_DF(subs_u
)
1403 MSA_BINOP_DF(subsus_u
)
1404 MSA_BINOP_DF(subsuu_s
)
1405 MSA_BINOP_DF(asub_s
)
1406 MSA_BINOP_DF(asub_u
)
1412 MSA_BINOP_DF(dotp_s
)
1413 MSA_BINOP_DF(dotp_u
)
1416 MSA_BINOP_DF(hadd_s
)
1417 MSA_BINOP_DF(hadd_u
)
1418 MSA_BINOP_DF(hsub_s
)
1419 MSA_BINOP_DF(hsub_u
)
1422 MSA_BINOP_DF(mulr_q
)
1425 void helper_msa_sld_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
1426 uint32_t ws
, uint32_t rt
)
1428 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
1429 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
1431 msa_sld_df(df
, pwd
, pws
, env
->active_tc
.gpr
[rt
]);
1434 static inline int64_t msa_maddv_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1437 return dest
+ arg1
* arg2
;
1440 static inline int64_t msa_msubv_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1443 return dest
- arg1
* arg2
;
1446 static inline int64_t msa_dpadd_s_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1453 SIGNED_EXTRACT(even_arg1
, odd_arg1
, arg1
, df
);
1454 SIGNED_EXTRACT(even_arg2
, odd_arg2
, arg2
, df
);
1455 return dest
+ (even_arg1
* even_arg2
) + (odd_arg1
* odd_arg2
);
1458 static inline int64_t msa_dpadd_u_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1465 UNSIGNED_EXTRACT(even_arg1
, odd_arg1
, arg1
, df
);
1466 UNSIGNED_EXTRACT(even_arg2
, odd_arg2
, arg2
, df
);
1467 return dest
+ (even_arg1
* even_arg2
) + (odd_arg1
* odd_arg2
);
1470 static inline int64_t msa_dpsub_s_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1477 SIGNED_EXTRACT(even_arg1
, odd_arg1
, arg1
, df
);
1478 SIGNED_EXTRACT(even_arg2
, odd_arg2
, arg2
, df
);
1479 return dest
- ((even_arg1
* even_arg2
) + (odd_arg1
* odd_arg2
));
1482 static inline int64_t msa_dpsub_u_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1489 UNSIGNED_EXTRACT(even_arg1
, odd_arg1
, arg1
, df
);
1490 UNSIGNED_EXTRACT(even_arg2
, odd_arg2
, arg2
, df
);
1491 return dest
- ((even_arg1
* even_arg2
) + (odd_arg1
* odd_arg2
));
1494 static inline int64_t msa_madd_q_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1497 int64_t q_prod
, q_ret
;
1499 int64_t q_max
= DF_MAX_INT(df
);
1500 int64_t q_min
= DF_MIN_INT(df
);
1502 q_prod
= arg1
* arg2
;
1503 q_ret
= ((dest
<< (DF_BITS(df
) - 1)) + q_prod
) >> (DF_BITS(df
) - 1);
1505 return (q_ret
< q_min
) ? q_min
: (q_max
< q_ret
) ? q_max
: q_ret
;
1508 static inline int64_t msa_msub_q_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1511 int64_t q_prod
, q_ret
;
1513 int64_t q_max
= DF_MAX_INT(df
);
1514 int64_t q_min
= DF_MIN_INT(df
);
1516 q_prod
= arg1
* arg2
;
1517 q_ret
= ((dest
<< (DF_BITS(df
) - 1)) - q_prod
) >> (DF_BITS(df
) - 1);
1519 return (q_ret
< q_min
) ? q_min
: (q_max
< q_ret
) ? q_max
: q_ret
;
1522 static inline int64_t msa_maddr_q_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1525 int64_t q_prod
, q_ret
;
1527 int64_t q_max
= DF_MAX_INT(df
);
1528 int64_t q_min
= DF_MIN_INT(df
);
1529 int64_t r_bit
= 1 << (DF_BITS(df
) - 2);
1531 q_prod
= arg1
* arg2
;
1532 q_ret
= ((dest
<< (DF_BITS(df
) - 1)) + q_prod
+ r_bit
) >> (DF_BITS(df
) - 1);
1534 return (q_ret
< q_min
) ? q_min
: (q_max
< q_ret
) ? q_max
: q_ret
;
1537 static inline int64_t msa_msubr_q_df(uint32_t df
, int64_t dest
, int64_t arg1
,
1540 int64_t q_prod
, q_ret
;
1542 int64_t q_max
= DF_MAX_INT(df
);
1543 int64_t q_min
= DF_MIN_INT(df
);
1544 int64_t r_bit
= 1 << (DF_BITS(df
) - 2);
1546 q_prod
= arg1
* arg2
;
1547 q_ret
= ((dest
<< (DF_BITS(df
) - 1)) - q_prod
+ r_bit
) >> (DF_BITS(df
) - 1);
1549 return (q_ret
< q_min
) ? q_min
: (q_max
< q_ret
) ? q_max
: q_ret
;
1552 #define MSA_TEROP_DF(func) \
1553 void helper_msa_ ## func ## _df(CPUMIPSState *env, uint32_t df, uint32_t wd, \
1554 uint32_t ws, uint32_t wt) \
1556 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
1557 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
1558 wr_t *pwt = &(env->active_fpu.fpr[wt].wr); \
1562 pwd->b[0] = msa_ ## func ## _df(df, pwd->b[0], pws->b[0], \
1564 pwd->b[1] = msa_ ## func ## _df(df, pwd->b[1], pws->b[1], \
1566 pwd->b[2] = msa_ ## func ## _df(df, pwd->b[2], pws->b[2], \
1568 pwd->b[3] = msa_ ## func ## _df(df, pwd->b[3], pws->b[3], \
1570 pwd->b[4] = msa_ ## func ## _df(df, pwd->b[4], pws->b[4], \
1572 pwd->b[5] = msa_ ## func ## _df(df, pwd->b[5], pws->b[5], \
1574 pwd->b[6] = msa_ ## func ## _df(df, pwd->b[6], pws->b[6], \
1576 pwd->b[7] = msa_ ## func ## _df(df, pwd->b[7], pws->b[7], \
1578 pwd->b[8] = msa_ ## func ## _df(df, pwd->b[8], pws->b[8], \
1580 pwd->b[9] = msa_ ## func ## _df(df, pwd->b[9], pws->b[9], \
1582 pwd->b[10] = msa_ ## func ## _df(df, pwd->b[10], pws->b[10], \
1584 pwd->b[11] = msa_ ## func ## _df(df, pwd->b[11], pws->b[11], \
1586 pwd->b[12] = msa_ ## func ## _df(df, pwd->b[12], pws->b[12], \
1588 pwd->b[13] = msa_ ## func ## _df(df, pwd->b[13], pws->b[13], \
1590 pwd->b[14] = msa_ ## func ## _df(df, pwd->b[14], pws->b[14], \
1592 pwd->b[15] = msa_ ## func ## _df(df, pwd->b[15], pws->b[15], \
1596 pwd->h[0] = msa_ ## func ## _df(df, pwd->h[0], pws->h[0], pwt->h[0]); \
1597 pwd->h[1] = msa_ ## func ## _df(df, pwd->h[1], pws->h[1], pwt->h[1]); \
1598 pwd->h[2] = msa_ ## func ## _df(df, pwd->h[2], pws->h[2], pwt->h[2]); \
1599 pwd->h[3] = msa_ ## func ## _df(df, pwd->h[3], pws->h[3], pwt->h[3]); \
1600 pwd->h[4] = msa_ ## func ## _df(df, pwd->h[4], pws->h[4], pwt->h[4]); \
1601 pwd->h[5] = msa_ ## func ## _df(df, pwd->h[5], pws->h[5], pwt->h[5]); \
1602 pwd->h[6] = msa_ ## func ## _df(df, pwd->h[6], pws->h[6], pwt->h[6]); \
1603 pwd->h[7] = msa_ ## func ## _df(df, pwd->h[7], pws->h[7], pwt->h[7]); \
1606 pwd->w[0] = msa_ ## func ## _df(df, pwd->w[0], pws->w[0], pwt->w[0]); \
1607 pwd->w[1] = msa_ ## func ## _df(df, pwd->w[1], pws->w[1], pwt->w[1]); \
1608 pwd->w[2] = msa_ ## func ## _df(df, pwd->w[2], pws->w[2], pwt->w[2]); \
1609 pwd->w[3] = msa_ ## func ## _df(df, pwd->w[3], pws->w[3], pwt->w[3]); \
1612 pwd->d[0] = msa_ ## func ## _df(df, pwd->d[0], pws->d[0], pwt->d[0]); \
1613 pwd->d[1] = msa_ ## func ## _df(df, pwd->d[1], pws->d[1], pwt->d[1]); \
1622 MSA_TEROP_DF(dpadd_s
)
1623 MSA_TEROP_DF(dpadd_u
)
1624 MSA_TEROP_DF(dpsub_s
)
1625 MSA_TEROP_DF(dpsub_u
)
1628 MSA_TEROP_DF(madd_q
)
1629 MSA_TEROP_DF(msub_q
)
1630 MSA_TEROP_DF(maddr_q
)
1631 MSA_TEROP_DF(msubr_q
)
1634 static inline void msa_splat_df(uint32_t df
, wr_t
*pwd
,
1635 wr_t
*pws
, target_ulong rt
)
1637 uint32_t n
= rt
% DF_ELEMENTS(df
);
1642 for (i
= 0; i
< DF_ELEMENTS(DF_BYTE
); i
++) {
1643 pwd
->b
[i
] = pws
->b
[n
];
1647 for (i
= 0; i
< DF_ELEMENTS(DF_HALF
); i
++) {
1648 pwd
->h
[i
] = pws
->h
[n
];
1652 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
1653 pwd
->w
[i
] = pws
->w
[n
];
1657 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
1658 pwd
->d
[i
] = pws
->d
[n
];
1666 void helper_msa_splat_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
1667 uint32_t ws
, uint32_t rt
)
1669 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
1670 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
1672 msa_splat_df(df
, pwd
, pws
, env
->active_tc
.gpr
[rt
]);
1675 #define MSA_DO_B MSA_DO(b)
1676 #define MSA_DO_H MSA_DO(h)
1677 #define MSA_DO_W MSA_DO(w)
1678 #define MSA_DO_D MSA_DO(d)
1680 #define MSA_LOOP_B MSA_LOOP(B)
1681 #define MSA_LOOP_H MSA_LOOP(H)
1682 #define MSA_LOOP_W MSA_LOOP(W)
1683 #define MSA_LOOP_D MSA_LOOP(D)
1685 #define MSA_LOOP_COND_B MSA_LOOP_COND(DF_BYTE)
1686 #define MSA_LOOP_COND_H MSA_LOOP_COND(DF_HALF)
1687 #define MSA_LOOP_COND_W MSA_LOOP_COND(DF_WORD)
1688 #define MSA_LOOP_COND_D MSA_LOOP_COND(DF_DOUBLE)
1690 #define MSA_LOOP(DF) \
1692 for (i = 0; i < (MSA_LOOP_COND_ ## DF) ; i++) { \
1697 #define MSA_FN_DF(FUNC) \
1698 void helper_msa_##FUNC(CPUMIPSState *env, uint32_t df, uint32_t wd, \
1699 uint32_t ws, uint32_t wt) \
1701 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
1702 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
1703 wr_t *pwt = &(env->active_fpu.fpr[wt].wr); \
1704 wr_t wx, *pwx = &wx; \
1722 msa_move_v(pwd, pwx); \
1725 #define MSA_LOOP_COND(DF) \
1726 (DF_ELEMENTS(DF) / 2)
1728 #define Rb(pwr, i) (pwr->b[i])
1729 #define Lb(pwr, i) (pwr->b[i + DF_ELEMENTS(DF_BYTE) / 2])
1730 #define Rh(pwr, i) (pwr->h[i])
1731 #define Lh(pwr, i) (pwr->h[i + DF_ELEMENTS(DF_HALF) / 2])
1732 #define Rw(pwr, i) (pwr->w[i])
1733 #define Lw(pwr, i) (pwr->w[i + DF_ELEMENTS(DF_WORD) / 2])
1734 #define Rd(pwr, i) (pwr->d[i])
1735 #define Ld(pwr, i) (pwr->d[i + DF_ELEMENTS(DF_DOUBLE) / 2])
1737 #undef MSA_LOOP_COND
1739 #define MSA_LOOP_COND(DF) \
1742 #define MSA_DO(DF) \
1744 uint32_t n = DF_ELEMENTS(df); \
1745 uint32_t k = (pwd->DF[i] & 0x3f) % (2 * n); \
1747 (pwd->DF[i] & 0xc0) ? 0 : k < n ? pwt->DF[k] : pws->DF[k - n]; \
1751 #undef MSA_LOOP_COND
1755 void helper_msa_ilvev_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
1756 uint32_t ws
, uint32_t wt
)
1758 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
1759 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
1760 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
1764 #if defined(HOST_WORDS_BIGENDIAN)
1765 pwd
->b
[8] = pws
->b
[9];
1766 pwd
->b
[9] = pwt
->b
[9];
1767 pwd
->b
[10] = pws
->b
[11];
1768 pwd
->b
[11] = pwt
->b
[11];
1769 pwd
->b
[12] = pws
->b
[13];
1770 pwd
->b
[13] = pwt
->b
[13];
1771 pwd
->b
[14] = pws
->b
[15];
1772 pwd
->b
[15] = pwt
->b
[15];
1773 pwd
->b
[0] = pws
->b
[1];
1774 pwd
->b
[1] = pwt
->b
[1];
1775 pwd
->b
[2] = pws
->b
[3];
1776 pwd
->b
[3] = pwt
->b
[3];
1777 pwd
->b
[4] = pws
->b
[5];
1778 pwd
->b
[5] = pwt
->b
[5];
1779 pwd
->b
[6] = pws
->b
[7];
1780 pwd
->b
[7] = pwt
->b
[7];
1782 pwd
->b
[15] = pws
->b
[14];
1783 pwd
->b
[14] = pwt
->b
[14];
1784 pwd
->b
[13] = pws
->b
[12];
1785 pwd
->b
[12] = pwt
->b
[12];
1786 pwd
->b
[11] = pws
->b
[10];
1787 pwd
->b
[10] = pwt
->b
[10];
1788 pwd
->b
[9] = pws
->b
[8];
1789 pwd
->b
[8] = pwt
->b
[8];
1790 pwd
->b
[7] = pws
->b
[6];
1791 pwd
->b
[6] = pwt
->b
[6];
1792 pwd
->b
[5] = pws
->b
[4];
1793 pwd
->b
[4] = pwt
->b
[4];
1794 pwd
->b
[3] = pws
->b
[2];
1795 pwd
->b
[2] = pwt
->b
[2];
1796 pwd
->b
[1] = pws
->b
[0];
1797 pwd
->b
[0] = pwt
->b
[0];
1801 #if defined(HOST_WORDS_BIGENDIAN)
1802 pwd
->h
[4] = pws
->h
[5];
1803 pwd
->h
[5] = pwt
->h
[5];
1804 pwd
->h
[6] = pws
->h
[7];
1805 pwd
->h
[7] = pwt
->h
[7];
1806 pwd
->h
[0] = pws
->h
[1];
1807 pwd
->h
[1] = pwt
->h
[1];
1808 pwd
->h
[2] = pws
->h
[3];
1809 pwd
->h
[3] = pwt
->h
[3];
1811 pwd
->h
[7] = pws
->h
[6];
1812 pwd
->h
[6] = pwt
->h
[6];
1813 pwd
->h
[5] = pws
->h
[4];
1814 pwd
->h
[4] = pwt
->h
[4];
1815 pwd
->h
[3] = pws
->h
[2];
1816 pwd
->h
[2] = pwt
->h
[2];
1817 pwd
->h
[1] = pws
->h
[0];
1818 pwd
->h
[0] = pwt
->h
[0];
1822 #if defined(HOST_WORDS_BIGENDIAN)
1823 pwd
->w
[2] = pws
->w
[3];
1824 pwd
->w
[3] = pwt
->w
[3];
1825 pwd
->w
[0] = pws
->w
[1];
1826 pwd
->w
[1] = pwt
->w
[1];
1828 pwd
->w
[3] = pws
->w
[2];
1829 pwd
->w
[2] = pwt
->w
[2];
1830 pwd
->w
[1] = pws
->w
[0];
1831 pwd
->w
[0] = pwt
->w
[0];
1835 pwd
->d
[1] = pws
->d
[0];
1836 pwd
->d
[0] = pwt
->d
[0];
1843 void helper_msa_ilvod_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
1844 uint32_t ws
, uint32_t wt
)
1846 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
1847 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
1848 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
1852 #if defined(HOST_WORDS_BIGENDIAN)
1853 pwd
->b
[7] = pwt
->b
[6];
1854 pwd
->b
[6] = pws
->b
[6];
1855 pwd
->b
[5] = pwt
->b
[4];
1856 pwd
->b
[4] = pws
->b
[4];
1857 pwd
->b
[3] = pwt
->b
[2];
1858 pwd
->b
[2] = pws
->b
[2];
1859 pwd
->b
[1] = pwt
->b
[0];
1860 pwd
->b
[0] = pws
->b
[0];
1861 pwd
->b
[15] = pwt
->b
[14];
1862 pwd
->b
[14] = pws
->b
[14];
1863 pwd
->b
[13] = pwt
->b
[12];
1864 pwd
->b
[12] = pws
->b
[12];
1865 pwd
->b
[11] = pwt
->b
[10];
1866 pwd
->b
[10] = pws
->b
[10];
1867 pwd
->b
[9] = pwt
->b
[8];
1868 pwd
->b
[8] = pws
->b
[8];
1870 pwd
->b
[0] = pwt
->b
[1];
1871 pwd
->b
[1] = pws
->b
[1];
1872 pwd
->b
[2] = pwt
->b
[3];
1873 pwd
->b
[3] = pws
->b
[3];
1874 pwd
->b
[4] = pwt
->b
[5];
1875 pwd
->b
[5] = pws
->b
[5];
1876 pwd
->b
[6] = pwt
->b
[7];
1877 pwd
->b
[7] = pws
->b
[7];
1878 pwd
->b
[8] = pwt
->b
[9];
1879 pwd
->b
[9] = pws
->b
[9];
1880 pwd
->b
[10] = pwt
->b
[11];
1881 pwd
->b
[11] = pws
->b
[11];
1882 pwd
->b
[12] = pwt
->b
[13];
1883 pwd
->b
[13] = pws
->b
[13];
1884 pwd
->b
[14] = pwt
->b
[15];
1885 pwd
->b
[15] = pws
->b
[15];
1889 #if defined(HOST_WORDS_BIGENDIAN)
1890 pwd
->h
[3] = pwt
->h
[2];
1891 pwd
->h
[2] = pws
->h
[2];
1892 pwd
->h
[1] = pwt
->h
[0];
1893 pwd
->h
[0] = pws
->h
[0];
1894 pwd
->h
[7] = pwt
->h
[6];
1895 pwd
->h
[6] = pws
->h
[6];
1896 pwd
->h
[5] = pwt
->h
[4];
1897 pwd
->h
[4] = pws
->h
[4];
1899 pwd
->h
[0] = pwt
->h
[1];
1900 pwd
->h
[1] = pws
->h
[1];
1901 pwd
->h
[2] = pwt
->h
[3];
1902 pwd
->h
[3] = pws
->h
[3];
1903 pwd
->h
[4] = pwt
->h
[5];
1904 pwd
->h
[5] = pws
->h
[5];
1905 pwd
->h
[6] = pwt
->h
[7];
1906 pwd
->h
[7] = pws
->h
[7];
1910 #if defined(HOST_WORDS_BIGENDIAN)
1911 pwd
->w
[1] = pwt
->w
[0];
1912 pwd
->w
[0] = pws
->w
[0];
1913 pwd
->w
[3] = pwt
->w
[2];
1914 pwd
->w
[2] = pws
->w
[2];
1916 pwd
->w
[0] = pwt
->w
[1];
1917 pwd
->w
[1] = pws
->w
[1];
1918 pwd
->w
[2] = pwt
->w
[3];
1919 pwd
->w
[3] = pws
->w
[3];
1923 pwd
->d
[0] = pwt
->d
[1];
1924 pwd
->d
[1] = pws
->d
[1];
1931 void helper_msa_ilvl_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
1932 uint32_t ws
, uint32_t wt
)
1934 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
1935 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
1936 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
1940 #if defined(HOST_WORDS_BIGENDIAN)
1941 pwd
->b
[7] = pwt
->b
[15];
1942 pwd
->b
[6] = pws
->b
[15];
1943 pwd
->b
[5] = pwt
->b
[14];
1944 pwd
->b
[4] = pws
->b
[14];
1945 pwd
->b
[3] = pwt
->b
[13];
1946 pwd
->b
[2] = pws
->b
[13];
1947 pwd
->b
[1] = pwt
->b
[12];
1948 pwd
->b
[0] = pws
->b
[12];
1949 pwd
->b
[15] = pwt
->b
[11];
1950 pwd
->b
[14] = pws
->b
[11];
1951 pwd
->b
[13] = pwt
->b
[10];
1952 pwd
->b
[12] = pws
->b
[10];
1953 pwd
->b
[11] = pwt
->b
[9];
1954 pwd
->b
[10] = pws
->b
[9];
1955 pwd
->b
[9] = pwt
->b
[8];
1956 pwd
->b
[8] = pws
->b
[8];
1958 pwd
->b
[0] = pwt
->b
[8];
1959 pwd
->b
[1] = pws
->b
[8];
1960 pwd
->b
[2] = pwt
->b
[9];
1961 pwd
->b
[3] = pws
->b
[9];
1962 pwd
->b
[4] = pwt
->b
[10];
1963 pwd
->b
[5] = pws
->b
[10];
1964 pwd
->b
[6] = pwt
->b
[11];
1965 pwd
->b
[7] = pws
->b
[11];
1966 pwd
->b
[8] = pwt
->b
[12];
1967 pwd
->b
[9] = pws
->b
[12];
1968 pwd
->b
[10] = pwt
->b
[13];
1969 pwd
->b
[11] = pws
->b
[13];
1970 pwd
->b
[12] = pwt
->b
[14];
1971 pwd
->b
[13] = pws
->b
[14];
1972 pwd
->b
[14] = pwt
->b
[15];
1973 pwd
->b
[15] = pws
->b
[15];
1977 #if defined(HOST_WORDS_BIGENDIAN)
1978 pwd
->h
[3] = pwt
->h
[7];
1979 pwd
->h
[2] = pws
->h
[7];
1980 pwd
->h
[1] = pwt
->h
[6];
1981 pwd
->h
[0] = pws
->h
[6];
1982 pwd
->h
[7] = pwt
->h
[5];
1983 pwd
->h
[6] = pws
->h
[5];
1984 pwd
->h
[5] = pwt
->h
[4];
1985 pwd
->h
[4] = pws
->h
[4];
1987 pwd
->h
[0] = pwt
->h
[4];
1988 pwd
->h
[1] = pws
->h
[4];
1989 pwd
->h
[2] = pwt
->h
[5];
1990 pwd
->h
[3] = pws
->h
[5];
1991 pwd
->h
[4] = pwt
->h
[6];
1992 pwd
->h
[5] = pws
->h
[6];
1993 pwd
->h
[6] = pwt
->h
[7];
1994 pwd
->h
[7] = pws
->h
[7];
1998 #if defined(HOST_WORDS_BIGENDIAN)
1999 pwd
->w
[1] = pwt
->w
[3];
2000 pwd
->w
[0] = pws
->w
[3];
2001 pwd
->w
[3] = pwt
->w
[2];
2002 pwd
->w
[2] = pws
->w
[2];
2004 pwd
->w
[0] = pwt
->w
[2];
2005 pwd
->w
[1] = pws
->w
[2];
2006 pwd
->w
[2] = pwt
->w
[3];
2007 pwd
->w
[3] = pws
->w
[3];
2011 pwd
->d
[0] = pwt
->d
[1];
2012 pwd
->d
[1] = pws
->d
[1];
2019 void helper_msa_ilvr_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
2020 uint32_t ws
, uint32_t wt
)
2022 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2023 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
2024 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
2028 #if defined(HOST_WORDS_BIGENDIAN)
2029 pwd
->b
[8] = pws
->b
[0];
2030 pwd
->b
[9] = pwt
->b
[0];
2031 pwd
->b
[10] = pws
->b
[1];
2032 pwd
->b
[11] = pwt
->b
[1];
2033 pwd
->b
[12] = pws
->b
[2];
2034 pwd
->b
[13] = pwt
->b
[2];
2035 pwd
->b
[14] = pws
->b
[3];
2036 pwd
->b
[15] = pwt
->b
[3];
2037 pwd
->b
[0] = pws
->b
[4];
2038 pwd
->b
[1] = pwt
->b
[4];
2039 pwd
->b
[2] = pws
->b
[5];
2040 pwd
->b
[3] = pwt
->b
[5];
2041 pwd
->b
[4] = pws
->b
[6];
2042 pwd
->b
[5] = pwt
->b
[6];
2043 pwd
->b
[6] = pws
->b
[7];
2044 pwd
->b
[7] = pwt
->b
[7];
2046 pwd
->b
[15] = pws
->b
[7];
2047 pwd
->b
[14] = pwt
->b
[7];
2048 pwd
->b
[13] = pws
->b
[6];
2049 pwd
->b
[12] = pwt
->b
[6];
2050 pwd
->b
[11] = pws
->b
[5];
2051 pwd
->b
[10] = pwt
->b
[5];
2052 pwd
->b
[9] = pws
->b
[4];
2053 pwd
->b
[8] = pwt
->b
[4];
2054 pwd
->b
[7] = pws
->b
[3];
2055 pwd
->b
[6] = pwt
->b
[3];
2056 pwd
->b
[5] = pws
->b
[2];
2057 pwd
->b
[4] = pwt
->b
[2];
2058 pwd
->b
[3] = pws
->b
[1];
2059 pwd
->b
[2] = pwt
->b
[1];
2060 pwd
->b
[1] = pws
->b
[0];
2061 pwd
->b
[0] = pwt
->b
[0];
2065 #if defined(HOST_WORDS_BIGENDIAN)
2066 pwd
->h
[4] = pws
->h
[0];
2067 pwd
->h
[5] = pwt
->h
[0];
2068 pwd
->h
[6] = pws
->h
[1];
2069 pwd
->h
[7] = pwt
->h
[1];
2070 pwd
->h
[0] = pws
->h
[2];
2071 pwd
->h
[1] = pwt
->h
[2];
2072 pwd
->h
[2] = pws
->h
[3];
2073 pwd
->h
[3] = pwt
->h
[3];
2075 pwd
->h
[7] = pws
->h
[3];
2076 pwd
->h
[6] = pwt
->h
[3];
2077 pwd
->h
[5] = pws
->h
[2];
2078 pwd
->h
[4] = pwt
->h
[2];
2079 pwd
->h
[3] = pws
->h
[1];
2080 pwd
->h
[2] = pwt
->h
[1];
2081 pwd
->h
[1] = pws
->h
[0];
2082 pwd
->h
[0] = pwt
->h
[0];
2086 #if defined(HOST_WORDS_BIGENDIAN)
2087 pwd
->w
[2] = pws
->w
[0];
2088 pwd
->w
[3] = pwt
->w
[0];
2089 pwd
->w
[0] = pws
->w
[1];
2090 pwd
->w
[1] = pwt
->w
[1];
2092 pwd
->w
[3] = pws
->w
[1];
2093 pwd
->w
[2] = pwt
->w
[1];
2094 pwd
->w
[1] = pws
->w
[0];
2095 pwd
->w
[0] = pwt
->w
[0];
2099 pwd
->d
[1] = pws
->d
[0];
2100 pwd
->d
[0] = pwt
->d
[0];
2107 void helper_msa_pckev_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
2108 uint32_t ws
, uint32_t wt
)
2110 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2111 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
2112 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
2116 pwd
->b
[15] = pws
->b
[14];
2117 pwd
->b
[13] = pws
->b
[10];
2118 pwd
->b
[11] = pws
->b
[6];
2119 pwd
->b
[9] = pws
->b
[2];
2120 pwd
->b
[7] = pwt
->b
[14];
2121 pwd
->b
[5] = pwt
->b
[10];
2122 pwd
->b
[3] = pwt
->b
[6];
2123 pwd
->b
[1] = pwt
->b
[2];
2124 pwd
->b
[14] = pws
->b
[12];
2125 pwd
->b
[10] = pws
->b
[4];
2126 pwd
->b
[6] = pwt
->b
[12];
2127 pwd
->b
[2] = pwt
->b
[4];
2128 pwd
->b
[12] = pws
->b
[8];
2129 pwd
->b
[4] = pwt
->b
[8];
2130 pwd
->b
[8] = pws
->b
[0];
2131 pwd
->b
[0] = pwt
->b
[0];
2134 pwd
->h
[7] = pws
->h
[6];
2135 pwd
->h
[5] = pws
->h
[2];
2136 pwd
->h
[3] = pwt
->h
[6];
2137 pwd
->h
[1] = pwt
->h
[2];
2138 pwd
->h
[6] = pws
->h
[4];
2139 pwd
->h
[2] = pwt
->h
[4];
2140 pwd
->h
[4] = pws
->h
[0];
2141 pwd
->h
[0] = pwt
->h
[0];
2144 pwd
->w
[3] = pws
->w
[2];
2145 pwd
->w
[1] = pwt
->w
[2];
2146 pwd
->w
[2] = pws
->w
[0];
2147 pwd
->w
[0] = pwt
->w
[0];
2150 pwd
->d
[1] = pws
->d
[0];
2151 pwd
->d
[0] = pwt
->d
[0];
2158 void helper_msa_pckod_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
2159 uint32_t ws
, uint32_t wt
)
2161 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2162 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
2163 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
2167 pwd
->b
[0] = pwt
->b
[1];
2168 pwd
->b
[2] = pwt
->b
[5];
2169 pwd
->b
[4] = pwt
->b
[9];
2170 pwd
->b
[6] = pwt
->b
[13];
2171 pwd
->b
[8] = pws
->b
[1];
2172 pwd
->b
[10] = pws
->b
[5];
2173 pwd
->b
[12] = pws
->b
[9];
2174 pwd
->b
[14] = pws
->b
[13];
2175 pwd
->b
[1] = pwt
->b
[3];
2176 pwd
->b
[5] = pwt
->b
[11];
2177 pwd
->b
[9] = pws
->b
[3];
2178 pwd
->b
[13] = pws
->b
[11];
2179 pwd
->b
[3] = pwt
->b
[7];
2180 pwd
->b
[11] = pws
->b
[7];
2181 pwd
->b
[7] = pwt
->b
[15];
2182 pwd
->b
[15] = pws
->b
[15];
2185 pwd
->h
[0] = pwt
->h
[1];
2186 pwd
->h
[2] = pwt
->h
[5];
2187 pwd
->h
[4] = pws
->h
[1];
2188 pwd
->h
[6] = pws
->h
[5];
2189 pwd
->h
[1] = pwt
->h
[3];
2190 pwd
->h
[5] = pws
->h
[3];
2191 pwd
->h
[3] = pwt
->h
[7];
2192 pwd
->h
[7] = pws
->h
[7];
2195 pwd
->w
[0] = pwt
->w
[1];
2196 pwd
->w
[2] = pws
->w
[1];
2197 pwd
->w
[1] = pwt
->w
[3];
2198 pwd
->w
[3] = pws
->w
[3];
2201 pwd
->d
[0] = pwt
->d
[1];
2202 pwd
->d
[1] = pws
->d
[1];
2210 void helper_msa_sldi_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
2211 uint32_t ws
, uint32_t n
)
2213 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2214 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
2216 msa_sld_df(df
, pwd
, pws
, n
);
2219 void helper_msa_splati_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
2220 uint32_t ws
, uint32_t n
)
2222 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2223 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
2225 msa_splat_df(df
, pwd
, pws
, n
);
2228 void helper_msa_copy_s_b(CPUMIPSState
*env
, uint32_t rd
,
2229 uint32_t ws
, uint32_t n
)
2232 #if defined(HOST_WORDS_BIGENDIAN)
2239 env
->active_tc
.gpr
[rd
] = (int8_t)env
->active_fpu
.fpr
[ws
].wr
.b
[n
];
2242 void helper_msa_copy_s_h(CPUMIPSState
*env
, uint32_t rd
,
2243 uint32_t ws
, uint32_t n
)
2246 #if defined(HOST_WORDS_BIGENDIAN)
2253 env
->active_tc
.gpr
[rd
] = (int16_t)env
->active_fpu
.fpr
[ws
].wr
.h
[n
];
2256 void helper_msa_copy_s_w(CPUMIPSState
*env
, uint32_t rd
,
2257 uint32_t ws
, uint32_t n
)
2260 #if defined(HOST_WORDS_BIGENDIAN)
2267 env
->active_tc
.gpr
[rd
] = (int32_t)env
->active_fpu
.fpr
[ws
].wr
.w
[n
];
2270 void helper_msa_copy_s_d(CPUMIPSState
*env
, uint32_t rd
,
2271 uint32_t ws
, uint32_t n
)
2274 env
->active_tc
.gpr
[rd
] = (int64_t)env
->active_fpu
.fpr
[ws
].wr
.d
[n
];
2277 void helper_msa_copy_u_b(CPUMIPSState
*env
, uint32_t rd
,
2278 uint32_t ws
, uint32_t n
)
2281 #if defined(HOST_WORDS_BIGENDIAN)
2288 env
->active_tc
.gpr
[rd
] = (uint8_t)env
->active_fpu
.fpr
[ws
].wr
.b
[n
];
2291 void helper_msa_copy_u_h(CPUMIPSState
*env
, uint32_t rd
,
2292 uint32_t ws
, uint32_t n
)
2295 #if defined(HOST_WORDS_BIGENDIAN)
2302 env
->active_tc
.gpr
[rd
] = (uint16_t)env
->active_fpu
.fpr
[ws
].wr
.h
[n
];
2305 void helper_msa_copy_u_w(CPUMIPSState
*env
, uint32_t rd
,
2306 uint32_t ws
, uint32_t n
)
2309 #if defined(HOST_WORDS_BIGENDIAN)
2316 env
->active_tc
.gpr
[rd
] = (uint32_t)env
->active_fpu
.fpr
[ws
].wr
.w
[n
];
2319 void helper_msa_insert_b(CPUMIPSState
*env
, uint32_t wd
,
2320 uint32_t rs_num
, uint32_t n
)
2322 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2323 target_ulong rs
= env
->active_tc
.gpr
[rs_num
];
2325 #if defined(HOST_WORDS_BIGENDIAN)
2332 pwd
->b
[n
] = (int8_t)rs
;
2335 void helper_msa_insert_h(CPUMIPSState
*env
, uint32_t wd
,
2336 uint32_t rs_num
, uint32_t n
)
2338 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2339 target_ulong rs
= env
->active_tc
.gpr
[rs_num
];
2341 #if defined(HOST_WORDS_BIGENDIAN)
2348 pwd
->h
[n
] = (int16_t)rs
;
2351 void helper_msa_insert_w(CPUMIPSState
*env
, uint32_t wd
,
2352 uint32_t rs_num
, uint32_t n
)
2354 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2355 target_ulong rs
= env
->active_tc
.gpr
[rs_num
];
2357 #if defined(HOST_WORDS_BIGENDIAN)
2364 pwd
->w
[n
] = (int32_t)rs
;
2367 void helper_msa_insert_d(CPUMIPSState
*env
, uint32_t wd
,
2368 uint32_t rs_num
, uint32_t n
)
2370 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2371 target_ulong rs
= env
->active_tc
.gpr
[rs_num
];
2373 pwd
->d
[n
] = (int64_t)rs
;
2376 void helper_msa_insve_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
2377 uint32_t ws
, uint32_t n
)
2379 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2380 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
2384 pwd
->b
[n
] = (int8_t)pws
->b
[0];
2387 pwd
->h
[n
] = (int16_t)pws
->h
[0];
2390 pwd
->w
[n
] = (int32_t)pws
->w
[0];
2393 pwd
->d
[n
] = (int64_t)pws
->d
[0];
2400 void helper_msa_ctcmsa(CPUMIPSState
*env
, target_ulong elm
, uint32_t cd
)
2406 env
->active_tc
.msacsr
= (int32_t)elm
& MSACSR_MASK
;
2407 restore_msa_fp_status(env
);
2408 /* check exception */
2409 if ((GET_FP_ENABLE(env
->active_tc
.msacsr
) | FP_UNIMPLEMENTED
)
2410 & GET_FP_CAUSE(env
->active_tc
.msacsr
)) {
2411 do_raise_exception(env
, EXCP_MSAFPE
, GETPC());
2417 target_ulong
helper_msa_cfcmsa(CPUMIPSState
*env
, uint32_t cs
)
2423 return env
->active_tc
.msacsr
& MSACSR_MASK
;
2428 void helper_msa_move_v(CPUMIPSState
*env
, uint32_t wd
, uint32_t ws
)
2430 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2431 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
2433 msa_move_v(pwd
, pws
);
2436 static inline int64_t msa_pcnt_df(uint32_t df
, int64_t arg
)
2440 x
= UNSIGNED(arg
, df
);
2442 x
= (x
& 0x5555555555555555ULL
) + ((x
>> 1) & 0x5555555555555555ULL
);
2443 x
= (x
& 0x3333333333333333ULL
) + ((x
>> 2) & 0x3333333333333333ULL
);
2444 x
= (x
& 0x0F0F0F0F0F0F0F0FULL
) + ((x
>> 4) & 0x0F0F0F0F0F0F0F0FULL
);
2445 x
= (x
& 0x00FF00FF00FF00FFULL
) + ((x
>> 8) & 0x00FF00FF00FF00FFULL
);
2446 x
= (x
& 0x0000FFFF0000FFFFULL
) + ((x
>> 16) & 0x0000FFFF0000FFFFULL
);
2447 x
= (x
& 0x00000000FFFFFFFFULL
) + ((x
>> 32));
2452 static inline int64_t msa_nlzc_df(uint32_t df
, int64_t arg
)
2457 x
= UNSIGNED(arg
, df
);
2459 c
= DF_BITS(df
) / 2;
2473 static inline int64_t msa_nloc_df(uint32_t df
, int64_t arg
)
2475 return msa_nlzc_df(df
, UNSIGNED((~arg
), df
));
2478 void helper_msa_fill_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
2481 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
2486 for (i
= 0; i
< DF_ELEMENTS(DF_BYTE
); i
++) {
2487 pwd
->b
[i
] = (int8_t)env
->active_tc
.gpr
[rs
];
2491 for (i
= 0; i
< DF_ELEMENTS(DF_HALF
); i
++) {
2492 pwd
->h
[i
] = (int16_t)env
->active_tc
.gpr
[rs
];
2496 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
2497 pwd
->w
[i
] = (int32_t)env
->active_tc
.gpr
[rs
];
2501 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
2502 pwd
->d
[i
] = (int64_t)env
->active_tc
.gpr
[rs
];
2510 #define MSA_UNOP_DF(func) \
2511 void helper_msa_ ## func ## _df(CPUMIPSState *env, uint32_t df, \
2512 uint32_t wd, uint32_t ws) \
2514 wr_t *pwd = &(env->active_fpu.fpr[wd].wr); \
2515 wr_t *pws = &(env->active_fpu.fpr[ws].wr); \
2519 pwd->b[0] = msa_ ## func ## _df(df, pws->b[0]); \
2520 pwd->b[1] = msa_ ## func ## _df(df, pws->b[1]); \
2521 pwd->b[2] = msa_ ## func ## _df(df, pws->b[2]); \
2522 pwd->b[3] = msa_ ## func ## _df(df, pws->b[3]); \
2523 pwd->b[4] = msa_ ## func ## _df(df, pws->b[4]); \
2524 pwd->b[5] = msa_ ## func ## _df(df, pws->b[5]); \
2525 pwd->b[6] = msa_ ## func ## _df(df, pws->b[6]); \
2526 pwd->b[7] = msa_ ## func ## _df(df, pws->b[7]); \
2527 pwd->b[8] = msa_ ## func ## _df(df, pws->b[8]); \
2528 pwd->b[9] = msa_ ## func ## _df(df, pws->b[9]); \
2529 pwd->b[10] = msa_ ## func ## _df(df, pws->b[10]); \
2530 pwd->b[11] = msa_ ## func ## _df(df, pws->b[11]); \
2531 pwd->b[12] = msa_ ## func ## _df(df, pws->b[12]); \
2532 pwd->b[13] = msa_ ## func ## _df(df, pws->b[13]); \
2533 pwd->b[14] = msa_ ## func ## _df(df, pws->b[14]); \
2534 pwd->b[15] = msa_ ## func ## _df(df, pws->b[15]); \
2537 pwd->h[0] = msa_ ## func ## _df(df, pws->h[0]); \
2538 pwd->h[1] = msa_ ## func ## _df(df, pws->h[1]); \
2539 pwd->h[2] = msa_ ## func ## _df(df, pws->h[2]); \
2540 pwd->h[3] = msa_ ## func ## _df(df, pws->h[3]); \
2541 pwd->h[4] = msa_ ## func ## _df(df, pws->h[4]); \
2542 pwd->h[5] = msa_ ## func ## _df(df, pws->h[5]); \
2543 pwd->h[6] = msa_ ## func ## _df(df, pws->h[6]); \
2544 pwd->h[7] = msa_ ## func ## _df(df, pws->h[7]); \
2547 pwd->w[0] = msa_ ## func ## _df(df, pws->w[0]); \
2548 pwd->w[1] = msa_ ## func ## _df(df, pws->w[1]); \
2549 pwd->w[2] = msa_ ## func ## _df(df, pws->w[2]); \
2550 pwd->w[3] = msa_ ## func ## _df(df, pws->w[3]); \
2553 pwd->d[0] = msa_ ## func ## _df(df, pws->d[0]); \
2554 pwd->d[1] = msa_ ## func ## _df(df, pws->d[1]); \
2566 #define FLOAT_ONE32 make_float32(0x3f8 << 20)
2567 #define FLOAT_ONE64 make_float64(0x3ffULL << 52)
2569 #define FLOAT_SNAN16(s) (float16_default_nan(s) ^ 0x0220)
2571 #define FLOAT_SNAN32(s) (float32_default_nan(s) ^ 0x00400020)
2573 #define FLOAT_SNAN64(s) (float64_default_nan(s) ^ 0x0008000000000020ULL)
2574 /* 0x7ff0000000000020 */
2576 static inline void clear_msacsr_cause(CPUMIPSState
*env
)
2578 SET_FP_CAUSE(env
->active_tc
.msacsr
, 0);
2581 static inline void check_msacsr_cause(CPUMIPSState
*env
, uintptr_t retaddr
)
2583 if ((GET_FP_CAUSE(env
->active_tc
.msacsr
) &
2584 (GET_FP_ENABLE(env
->active_tc
.msacsr
) | FP_UNIMPLEMENTED
)) == 0) {
2585 UPDATE_FP_FLAGS(env
->active_tc
.msacsr
,
2586 GET_FP_CAUSE(env
->active_tc
.msacsr
));
2588 do_raise_exception(env
, EXCP_MSAFPE
, retaddr
);
2592 /* Flush-to-zero use cases for update_msacsr() */
2593 #define CLEAR_FS_UNDERFLOW 1
2594 #define CLEAR_IS_INEXACT 2
2595 #define RECIPROCAL_INEXACT 4
2597 static inline int update_msacsr(CPUMIPSState
*env
, int action
, int denormal
)
2605 ieee_ex
= get_float_exception_flags(&env
->active_tc
.msa_fp_status
);
2607 /* QEMU softfloat does not signal all underflow cases */
2609 ieee_ex
|= float_flag_underflow
;
2612 c
= ieee_ex_to_mips(ieee_ex
);
2613 enable
= GET_FP_ENABLE(env
->active_tc
.msacsr
) | FP_UNIMPLEMENTED
;
2615 /* Set Inexact (I) when flushing inputs to zero */
2616 if ((ieee_ex
& float_flag_input_denormal
) &&
2617 (env
->active_tc
.msacsr
& MSACSR_FS_MASK
) != 0) {
2618 if (action
& CLEAR_IS_INEXACT
) {
2625 /* Set Inexact (I) and Underflow (U) when flushing outputs to zero */
2626 if ((ieee_ex
& float_flag_output_denormal
) &&
2627 (env
->active_tc
.msacsr
& MSACSR_FS_MASK
) != 0) {
2629 if (action
& CLEAR_FS_UNDERFLOW
) {
2636 /* Set Inexact (I) when Overflow (O) is not enabled */
2637 if ((c
& FP_OVERFLOW
) != 0 && (enable
& FP_OVERFLOW
) == 0) {
2641 /* Clear Exact Underflow when Underflow (U) is not enabled */
2642 if ((c
& FP_UNDERFLOW
) != 0 && (enable
& FP_UNDERFLOW
) == 0 &&
2643 (c
& FP_INEXACT
) == 0) {
2648 * Reciprocal operations set only Inexact when valid and not
2651 if ((action
& RECIPROCAL_INEXACT
) &&
2652 (c
& (FP_INVALID
| FP_DIV0
)) == 0) {
2656 cause
= c
& enable
; /* all current enabled exceptions */
2660 * No enabled exception, update the MSACSR Cause
2661 * with all current exceptions
2663 SET_FP_CAUSE(env
->active_tc
.msacsr
,
2664 (GET_FP_CAUSE(env
->active_tc
.msacsr
) | c
));
2666 /* Current exceptions are enabled */
2667 if ((env
->active_tc
.msacsr
& MSACSR_NX_MASK
) == 0) {
2669 * Exception(s) will trap, update MSACSR Cause
2670 * with all enabled exceptions
2672 SET_FP_CAUSE(env
->active_tc
.msacsr
,
2673 (GET_FP_CAUSE(env
->active_tc
.msacsr
) | c
));
2680 static inline int get_enabled_exceptions(const CPUMIPSState
*env
, int c
)
2682 int enable
= GET_FP_ENABLE(env
->active_tc
.msacsr
) | FP_UNIMPLEMENTED
;
2686 static inline float16
float16_from_float32(int32_t a
, flag ieee
,
2687 float_status
*status
)
2691 f_val
= float32_to_float16((float32
)a
, ieee
, status
);
2693 return a
< 0 ? (f_val
| (1 << 15)) : f_val
;
2696 static inline float32
float32_from_float64(int64_t a
, float_status
*status
)
2700 f_val
= float64_to_float32((float64
)a
, status
);
2702 return a
< 0 ? (f_val
| (1 << 31)) : f_val
;
2705 static inline float32
float32_from_float16(int16_t a
, flag ieee
,
2706 float_status
*status
)
2710 f_val
= float16_to_float32((float16
)a
, ieee
, status
);
2712 return a
< 0 ? (f_val
| (1 << 31)) : f_val
;
2715 static inline float64
float64_from_float32(int32_t a
, float_status
*status
)
2719 f_val
= float32_to_float64((float64
)a
, status
);
2721 return a
< 0 ? (f_val
| (1ULL << 63)) : f_val
;
2724 static inline float32
float32_from_q16(int16_t a
, float_status
*status
)
2728 /* conversion as integer and scaling */
2729 f_val
= int32_to_float32(a
, status
);
2730 f_val
= float32_scalbn(f_val
, -15, status
);
2735 static inline float64
float64_from_q32(int32_t a
, float_status
*status
)
2739 /* conversion as integer and scaling */
2740 f_val
= int32_to_float64(a
, status
);
2741 f_val
= float64_scalbn(f_val
, -31, status
);
2746 static inline int16_t float32_to_q16(float32 a
, float_status
*status
)
2749 int32_t q_min
= 0xffff8000;
2750 int32_t q_max
= 0x00007fff;
2754 if (float32_is_any_nan(a
)) {
2755 float_raise(float_flag_invalid
, status
);
2760 a
= float32_scalbn(a
, 15, status
);
2762 ieee_ex
= get_float_exception_flags(status
);
2763 set_float_exception_flags(ieee_ex
& (~float_flag_underflow
)
2766 if (ieee_ex
& float_flag_overflow
) {
2767 float_raise(float_flag_inexact
, status
);
2768 return (int32_t)a
< 0 ? q_min
: q_max
;
2771 /* conversion to int */
2772 q_val
= float32_to_int32(a
, status
);
2774 ieee_ex
= get_float_exception_flags(status
);
2775 set_float_exception_flags(ieee_ex
& (~float_flag_underflow
)
2778 if (ieee_ex
& float_flag_invalid
) {
2779 set_float_exception_flags(ieee_ex
& (~float_flag_invalid
)
2781 float_raise(float_flag_overflow
| float_flag_inexact
, status
);
2782 return (int32_t)a
< 0 ? q_min
: q_max
;
2785 if (q_val
< q_min
) {
2786 float_raise(float_flag_overflow
| float_flag_inexact
, status
);
2787 return (int16_t)q_min
;
2790 if (q_max
< q_val
) {
2791 float_raise(float_flag_overflow
| float_flag_inexact
, status
);
2792 return (int16_t)q_max
;
2795 return (int16_t)q_val
;
2798 static inline int32_t float64_to_q32(float64 a
, float_status
*status
)
2801 int64_t q_min
= 0xffffffff80000000LL
;
2802 int64_t q_max
= 0x000000007fffffffLL
;
2806 if (float64_is_any_nan(a
)) {
2807 float_raise(float_flag_invalid
, status
);
2812 a
= float64_scalbn(a
, 31, status
);
2814 ieee_ex
= get_float_exception_flags(status
);
2815 set_float_exception_flags(ieee_ex
& (~float_flag_underflow
)
2818 if (ieee_ex
& float_flag_overflow
) {
2819 float_raise(float_flag_inexact
, status
);
2820 return (int64_t)a
< 0 ? q_min
: q_max
;
2823 /* conversion to integer */
2824 q_val
= float64_to_int64(a
, status
);
2826 ieee_ex
= get_float_exception_flags(status
);
2827 set_float_exception_flags(ieee_ex
& (~float_flag_underflow
)
2830 if (ieee_ex
& float_flag_invalid
) {
2831 set_float_exception_flags(ieee_ex
& (~float_flag_invalid
)
2833 float_raise(float_flag_overflow
| float_flag_inexact
, status
);
2834 return (int64_t)a
< 0 ? q_min
: q_max
;
2837 if (q_val
< q_min
) {
2838 float_raise(float_flag_overflow
| float_flag_inexact
, status
);
2839 return (int32_t)q_min
;
2842 if (q_max
< q_val
) {
2843 float_raise(float_flag_overflow
| float_flag_inexact
, status
);
2844 return (int32_t)q_max
;
2847 return (int32_t)q_val
;
2850 #define MSA_FLOAT_COND(DEST, OP, ARG1, ARG2, BITS, QUIET) \
2852 float_status *status = &env->active_tc.msa_fp_status; \
2855 set_float_exception_flags(0, status); \
2857 cond = float ## BITS ## _ ## OP(ARG1, ARG2, status); \
2859 cond = float ## BITS ## _ ## OP ## _quiet(ARG1, ARG2, status); \
2861 DEST = cond ? M_MAX_UINT(BITS) : 0; \
2862 c = update_msacsr(env, CLEAR_IS_INEXACT, 0); \
2864 if (get_enabled_exceptions(env, c)) { \
2865 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
2869 #define MSA_FLOAT_AF(DEST, ARG1, ARG2, BITS, QUIET) \
2871 MSA_FLOAT_COND(DEST, eq, ARG1, ARG2, BITS, QUIET); \
2872 if ((DEST & M_MAX_UINT(BITS)) == M_MAX_UINT(BITS)) { \
2877 #define MSA_FLOAT_UEQ(DEST, ARG1, ARG2, BITS, QUIET) \
2879 MSA_FLOAT_COND(DEST, unordered, ARG1, ARG2, BITS, QUIET); \
2881 MSA_FLOAT_COND(DEST, eq, ARG1, ARG2, BITS, QUIET); \
2885 #define MSA_FLOAT_NE(DEST, ARG1, ARG2, BITS, QUIET) \
2887 MSA_FLOAT_COND(DEST, lt, ARG1, ARG2, BITS, QUIET); \
2889 MSA_FLOAT_COND(DEST, lt, ARG2, ARG1, BITS, QUIET); \
2893 #define MSA_FLOAT_UNE(DEST, ARG1, ARG2, BITS, QUIET) \
2895 MSA_FLOAT_COND(DEST, unordered, ARG1, ARG2, BITS, QUIET); \
2897 MSA_FLOAT_COND(DEST, lt, ARG1, ARG2, BITS, QUIET); \
2899 MSA_FLOAT_COND(DEST, lt, ARG2, ARG1, BITS, QUIET); \
2904 #define MSA_FLOAT_ULE(DEST, ARG1, ARG2, BITS, QUIET) \
2906 MSA_FLOAT_COND(DEST, unordered, ARG1, ARG2, BITS, QUIET); \
2908 MSA_FLOAT_COND(DEST, le, ARG1, ARG2, BITS, QUIET); \
2912 #define MSA_FLOAT_ULT(DEST, ARG1, ARG2, BITS, QUIET) \
2914 MSA_FLOAT_COND(DEST, unordered, ARG1, ARG2, BITS, QUIET); \
2916 MSA_FLOAT_COND(DEST, lt, ARG1, ARG2, BITS, QUIET); \
2920 #define MSA_FLOAT_OR(DEST, ARG1, ARG2, BITS, QUIET) \
2922 MSA_FLOAT_COND(DEST, le, ARG1, ARG2, BITS, QUIET); \
2924 MSA_FLOAT_COND(DEST, le, ARG2, ARG1, BITS, QUIET); \
2928 static inline void compare_af(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
2929 wr_t
*pwt
, uint32_t df
, int quiet
,
2932 wr_t wx
, *pwx
= &wx
;
2935 clear_msacsr_cause(env
);
2939 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
2940 MSA_FLOAT_AF(pwx
->w
[i
], pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
2944 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
2945 MSA_FLOAT_AF(pwx
->d
[i
], pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
2952 check_msacsr_cause(env
, retaddr
);
2954 msa_move_v(pwd
, pwx
);
2957 static inline void compare_un(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
2958 wr_t
*pwt
, uint32_t df
, int quiet
,
2961 wr_t wx
, *pwx
= &wx
;
2964 clear_msacsr_cause(env
);
2968 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
2969 MSA_FLOAT_COND(pwx
->w
[i
], unordered
, pws
->w
[i
], pwt
->w
[i
], 32,
2974 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
2975 MSA_FLOAT_COND(pwx
->d
[i
], unordered
, pws
->d
[i
], pwt
->d
[i
], 64,
2983 check_msacsr_cause(env
, retaddr
);
2985 msa_move_v(pwd
, pwx
);
2988 static inline void compare_eq(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
2989 wr_t
*pwt
, uint32_t df
, int quiet
,
2992 wr_t wx
, *pwx
= &wx
;
2995 clear_msacsr_cause(env
);
2999 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3000 MSA_FLOAT_COND(pwx
->w
[i
], eq
, pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3004 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3005 MSA_FLOAT_COND(pwx
->d
[i
], eq
, pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3012 check_msacsr_cause(env
, retaddr
);
3014 msa_move_v(pwd
, pwx
);
3017 static inline void compare_ueq(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3018 wr_t
*pwt
, uint32_t df
, int quiet
,
3021 wr_t wx
, *pwx
= &wx
;
3024 clear_msacsr_cause(env
);
3028 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3029 MSA_FLOAT_UEQ(pwx
->w
[i
], pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3033 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3034 MSA_FLOAT_UEQ(pwx
->d
[i
], pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3041 check_msacsr_cause(env
, retaddr
);
3043 msa_move_v(pwd
, pwx
);
3046 static inline void compare_lt(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3047 wr_t
*pwt
, uint32_t df
, int quiet
,
3050 wr_t wx
, *pwx
= &wx
;
3053 clear_msacsr_cause(env
);
3057 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3058 MSA_FLOAT_COND(pwx
->w
[i
], lt
, pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3062 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3063 MSA_FLOAT_COND(pwx
->d
[i
], lt
, pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3070 check_msacsr_cause(env
, retaddr
);
3072 msa_move_v(pwd
, pwx
);
3075 static inline void compare_ult(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3076 wr_t
*pwt
, uint32_t df
, int quiet
,
3079 wr_t wx
, *pwx
= &wx
;
3082 clear_msacsr_cause(env
);
3086 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3087 MSA_FLOAT_ULT(pwx
->w
[i
], pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3091 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3092 MSA_FLOAT_ULT(pwx
->d
[i
], pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3099 check_msacsr_cause(env
, retaddr
);
3101 msa_move_v(pwd
, pwx
);
3104 static inline void compare_le(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3105 wr_t
*pwt
, uint32_t df
, int quiet
,
3108 wr_t wx
, *pwx
= &wx
;
3111 clear_msacsr_cause(env
);
3115 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3116 MSA_FLOAT_COND(pwx
->w
[i
], le
, pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3120 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3121 MSA_FLOAT_COND(pwx
->d
[i
], le
, pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3128 check_msacsr_cause(env
, retaddr
);
3130 msa_move_v(pwd
, pwx
);
3133 static inline void compare_ule(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3134 wr_t
*pwt
, uint32_t df
, int quiet
,
3137 wr_t wx
, *pwx
= &wx
;
3140 clear_msacsr_cause(env
);
3144 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3145 MSA_FLOAT_ULE(pwx
->w
[i
], pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3149 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3150 MSA_FLOAT_ULE(pwx
->d
[i
], pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3157 check_msacsr_cause(env
, retaddr
);
3159 msa_move_v(pwd
, pwx
);
3162 static inline void compare_or(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3163 wr_t
*pwt
, uint32_t df
, int quiet
,
3166 wr_t wx
, *pwx
= &wx
;
3169 clear_msacsr_cause(env
);
3173 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3174 MSA_FLOAT_OR(pwx
->w
[i
], pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3178 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3179 MSA_FLOAT_OR(pwx
->d
[i
], pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3186 check_msacsr_cause(env
, retaddr
);
3188 msa_move_v(pwd
, pwx
);
3191 static inline void compare_une(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3192 wr_t
*pwt
, uint32_t df
, int quiet
,
3195 wr_t wx
, *pwx
= &wx
;
3198 clear_msacsr_cause(env
);
3202 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3203 MSA_FLOAT_UNE(pwx
->w
[i
], pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3207 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3208 MSA_FLOAT_UNE(pwx
->d
[i
], pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3215 check_msacsr_cause(env
, retaddr
);
3217 msa_move_v(pwd
, pwx
);
3220 static inline void compare_ne(CPUMIPSState
*env
, wr_t
*pwd
, wr_t
*pws
,
3221 wr_t
*pwt
, uint32_t df
, int quiet
,
3224 wr_t wx
, *pwx
= &wx
;
3227 clear_msacsr_cause(env
);
3231 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3232 MSA_FLOAT_NE(pwx
->w
[i
], pws
->w
[i
], pwt
->w
[i
], 32, quiet
);
3236 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3237 MSA_FLOAT_NE(pwx
->d
[i
], pws
->d
[i
], pwt
->d
[i
], 64, quiet
);
3244 check_msacsr_cause(env
, retaddr
);
3246 msa_move_v(pwd
, pwx
);
3249 void helper_msa_fcaf_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3250 uint32_t ws
, uint32_t wt
)
3252 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3253 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3254 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3255 compare_af(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3258 void helper_msa_fcun_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3259 uint32_t ws
, uint32_t wt
)
3261 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3262 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3263 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3264 compare_un(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3267 void helper_msa_fceq_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3268 uint32_t ws
, uint32_t wt
)
3270 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3271 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3272 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3273 compare_eq(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3276 void helper_msa_fcueq_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3277 uint32_t ws
, uint32_t wt
)
3279 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3280 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3281 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3282 compare_ueq(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3285 void helper_msa_fclt_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3286 uint32_t ws
, uint32_t wt
)
3288 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3289 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3290 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3291 compare_lt(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3294 void helper_msa_fcult_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3295 uint32_t ws
, uint32_t wt
)
3297 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3298 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3299 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3300 compare_ult(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3303 void helper_msa_fcle_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3304 uint32_t ws
, uint32_t wt
)
3306 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3307 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3308 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3309 compare_le(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3312 void helper_msa_fcule_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3313 uint32_t ws
, uint32_t wt
)
3315 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3316 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3317 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3318 compare_ule(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3321 void helper_msa_fsaf_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3322 uint32_t ws
, uint32_t wt
)
3324 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3325 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3326 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3327 compare_af(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3330 void helper_msa_fsun_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3331 uint32_t ws
, uint32_t wt
)
3333 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3334 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3335 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3336 compare_un(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3339 void helper_msa_fseq_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3340 uint32_t ws
, uint32_t wt
)
3342 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3343 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3344 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3345 compare_eq(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3348 void helper_msa_fsueq_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3349 uint32_t ws
, uint32_t wt
)
3351 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3352 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3353 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3354 compare_ueq(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3357 void helper_msa_fslt_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3358 uint32_t ws
, uint32_t wt
)
3360 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3361 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3362 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3363 compare_lt(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3366 void helper_msa_fsult_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3367 uint32_t ws
, uint32_t wt
)
3369 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3370 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3371 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3372 compare_ult(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3375 void helper_msa_fsle_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3376 uint32_t ws
, uint32_t wt
)
3378 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3379 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3380 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3381 compare_le(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3384 void helper_msa_fsule_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3385 uint32_t ws
, uint32_t wt
)
3387 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3388 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3389 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3390 compare_ule(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3393 void helper_msa_fcor_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3394 uint32_t ws
, uint32_t wt
)
3396 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3397 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3398 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3399 compare_or(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3402 void helper_msa_fcune_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3403 uint32_t ws
, uint32_t wt
)
3405 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3406 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3407 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3408 compare_une(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3411 void helper_msa_fcne_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3412 uint32_t ws
, uint32_t wt
)
3414 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3415 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3416 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3417 compare_ne(env
, pwd
, pws
, pwt
, df
, 1, GETPC());
3420 void helper_msa_fsor_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3421 uint32_t ws
, uint32_t wt
)
3423 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3424 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3425 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3426 compare_or(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3429 void helper_msa_fsune_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3430 uint32_t ws
, uint32_t wt
)
3432 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3433 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3434 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3435 compare_une(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3438 void helper_msa_fsne_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3439 uint32_t ws
, uint32_t wt
)
3441 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3442 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3443 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3444 compare_ne(env
, pwd
, pws
, pwt
, df
, 0, GETPC());
3447 #define float16_is_zero(ARG) 0
3448 #define float16_is_zero_or_denormal(ARG) 0
3450 #define IS_DENORMAL(ARG, BITS) \
3451 (!float ## BITS ## _is_zero(ARG) \
3452 && float ## BITS ## _is_zero_or_denormal(ARG))
3454 #define MSA_FLOAT_BINOP(DEST, OP, ARG1, ARG2, BITS) \
3456 float_status *status = &env->active_tc.msa_fp_status; \
3459 set_float_exception_flags(0, status); \
3460 DEST = float ## BITS ## _ ## OP(ARG1, ARG2, status); \
3461 c = update_msacsr(env, 0, IS_DENORMAL(DEST, BITS)); \
3463 if (get_enabled_exceptions(env, c)) { \
3464 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
3468 void helper_msa_fadd_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3469 uint32_t ws
, uint32_t wt
)
3471 wr_t wx
, *pwx
= &wx
;
3472 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3473 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3474 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3477 clear_msacsr_cause(env
);
3481 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3482 MSA_FLOAT_BINOP(pwx
->w
[i
], add
, pws
->w
[i
], pwt
->w
[i
], 32);
3486 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3487 MSA_FLOAT_BINOP(pwx
->d
[i
], add
, pws
->d
[i
], pwt
->d
[i
], 64);
3494 check_msacsr_cause(env
, GETPC());
3495 msa_move_v(pwd
, pwx
);
3498 void helper_msa_fsub_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3499 uint32_t ws
, uint32_t wt
)
3501 wr_t wx
, *pwx
= &wx
;
3502 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3503 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3504 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3507 clear_msacsr_cause(env
);
3511 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3512 MSA_FLOAT_BINOP(pwx
->w
[i
], sub
, pws
->w
[i
], pwt
->w
[i
], 32);
3516 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3517 MSA_FLOAT_BINOP(pwx
->d
[i
], sub
, pws
->d
[i
], pwt
->d
[i
], 64);
3524 check_msacsr_cause(env
, GETPC());
3525 msa_move_v(pwd
, pwx
);
3528 void helper_msa_fmul_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3529 uint32_t ws
, uint32_t wt
)
3531 wr_t wx
, *pwx
= &wx
;
3532 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3533 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3534 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3537 clear_msacsr_cause(env
);
3541 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3542 MSA_FLOAT_BINOP(pwx
->w
[i
], mul
, pws
->w
[i
], pwt
->w
[i
], 32);
3546 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3547 MSA_FLOAT_BINOP(pwx
->d
[i
], mul
, pws
->d
[i
], pwt
->d
[i
], 64);
3554 check_msacsr_cause(env
, GETPC());
3556 msa_move_v(pwd
, pwx
);
3559 void helper_msa_fdiv_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3560 uint32_t ws
, uint32_t wt
)
3562 wr_t wx
, *pwx
= &wx
;
3563 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3564 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3565 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3568 clear_msacsr_cause(env
);
3572 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3573 MSA_FLOAT_BINOP(pwx
->w
[i
], div
, pws
->w
[i
], pwt
->w
[i
], 32);
3577 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3578 MSA_FLOAT_BINOP(pwx
->d
[i
], div
, pws
->d
[i
], pwt
->d
[i
], 64);
3585 check_msacsr_cause(env
, GETPC());
3587 msa_move_v(pwd
, pwx
);
3590 #define MSA_FLOAT_MULADD(DEST, ARG1, ARG2, ARG3, NEGATE, BITS) \
3592 float_status *status = &env->active_tc.msa_fp_status; \
3595 set_float_exception_flags(0, status); \
3596 DEST = float ## BITS ## _muladd(ARG2, ARG3, ARG1, NEGATE, status); \
3597 c = update_msacsr(env, 0, IS_DENORMAL(DEST, BITS)); \
3599 if (get_enabled_exceptions(env, c)) { \
3600 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
3604 void helper_msa_fmadd_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3605 uint32_t ws
, uint32_t wt
)
3607 wr_t wx
, *pwx
= &wx
;
3608 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3609 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3610 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3613 clear_msacsr_cause(env
);
3617 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3618 MSA_FLOAT_MULADD(pwx
->w
[i
], pwd
->w
[i
],
3619 pws
->w
[i
], pwt
->w
[i
], 0, 32);
3623 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3624 MSA_FLOAT_MULADD(pwx
->d
[i
], pwd
->d
[i
],
3625 pws
->d
[i
], pwt
->d
[i
], 0, 64);
3632 check_msacsr_cause(env
, GETPC());
3634 msa_move_v(pwd
, pwx
);
3637 void helper_msa_fmsub_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3638 uint32_t ws
, uint32_t wt
)
3640 wr_t wx
, *pwx
= &wx
;
3641 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3642 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3643 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3646 clear_msacsr_cause(env
);
3650 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3651 MSA_FLOAT_MULADD(pwx
->w
[i
], pwd
->w
[i
],
3652 pws
->w
[i
], pwt
->w
[i
],
3653 float_muladd_negate_product
, 32);
3657 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3658 MSA_FLOAT_MULADD(pwx
->d
[i
], pwd
->d
[i
],
3659 pws
->d
[i
], pwt
->d
[i
],
3660 float_muladd_negate_product
, 64);
3667 check_msacsr_cause(env
, GETPC());
3669 msa_move_v(pwd
, pwx
);
3672 void helper_msa_fexp2_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3673 uint32_t ws
, uint32_t wt
)
3675 wr_t wx
, *pwx
= &wx
;
3676 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3677 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3678 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3681 clear_msacsr_cause(env
);
3685 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3686 MSA_FLOAT_BINOP(pwx
->w
[i
], scalbn
, pws
->w
[i
],
3687 pwt
->w
[i
] > 0x200 ? 0x200 :
3688 pwt
->w
[i
] < -0x200 ? -0x200 : pwt
->w
[i
],
3693 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3694 MSA_FLOAT_BINOP(pwx
->d
[i
], scalbn
, pws
->d
[i
],
3695 pwt
->d
[i
] > 0x1000 ? 0x1000 :
3696 pwt
->d
[i
] < -0x1000 ? -0x1000 : pwt
->d
[i
],
3704 check_msacsr_cause(env
, GETPC());
3706 msa_move_v(pwd
, pwx
);
3709 #define MSA_FLOAT_UNOP(DEST, OP, ARG, BITS) \
3711 float_status *status = &env->active_tc.msa_fp_status; \
3714 set_float_exception_flags(0, status); \
3715 DEST = float ## BITS ## _ ## OP(ARG, status); \
3716 c = update_msacsr(env, 0, IS_DENORMAL(DEST, BITS)); \
3718 if (get_enabled_exceptions(env, c)) { \
3719 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
3723 void helper_msa_fexdo_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3724 uint32_t ws
, uint32_t wt
)
3726 wr_t wx
, *pwx
= &wx
;
3727 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3728 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3729 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3732 clear_msacsr_cause(env
);
3736 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3738 * Half precision floats come in two formats: standard
3739 * IEEE and "ARM" format. The latter gains extra exponent
3740 * range by omitting the NaN/Inf encodings.
3744 MSA_FLOAT_BINOP(Lh(pwx
, i
), from_float32
, pws
->w
[i
], ieee
, 16);
3745 MSA_FLOAT_BINOP(Rh(pwx
, i
), from_float32
, pwt
->w
[i
], ieee
, 16);
3749 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3750 MSA_FLOAT_UNOP(Lw(pwx
, i
), from_float64
, pws
->d
[i
], 32);
3751 MSA_FLOAT_UNOP(Rw(pwx
, i
), from_float64
, pwt
->d
[i
], 32);
3758 check_msacsr_cause(env
, GETPC());
3759 msa_move_v(pwd
, pwx
);
3762 #define MSA_FLOAT_UNOP_XD(DEST, OP, ARG, BITS, XBITS) \
3764 float_status *status = &env->active_tc.msa_fp_status; \
3767 set_float_exception_flags(0, status); \
3768 DEST = float ## BITS ## _ ## OP(ARG, status); \
3769 c = update_msacsr(env, CLEAR_FS_UNDERFLOW, 0); \
3771 if (get_enabled_exceptions(env, c)) { \
3772 DEST = ((FLOAT_SNAN ## XBITS(status) >> 6) << 6) | c; \
3776 void helper_msa_ftq_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3777 uint32_t ws
, uint32_t wt
)
3779 wr_t wx
, *pwx
= &wx
;
3780 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3781 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3782 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3785 clear_msacsr_cause(env
);
3789 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
3790 MSA_FLOAT_UNOP_XD(Lh(pwx
, i
), to_q16
, pws
->w
[i
], 32, 16);
3791 MSA_FLOAT_UNOP_XD(Rh(pwx
, i
), to_q16
, pwt
->w
[i
], 32, 16);
3795 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
3796 MSA_FLOAT_UNOP_XD(Lw(pwx
, i
), to_q32
, pws
->d
[i
], 64, 32);
3797 MSA_FLOAT_UNOP_XD(Rw(pwx
, i
), to_q32
, pwt
->d
[i
], 64, 32);
3804 check_msacsr_cause(env
, GETPC());
3806 msa_move_v(pwd
, pwx
);
3809 #define NUMBER_QNAN_PAIR(ARG1, ARG2, BITS, STATUS) \
3810 !float ## BITS ## _is_any_nan(ARG1) \
3811 && float ## BITS ## _is_quiet_nan(ARG2, STATUS)
3813 #define MSA_FLOAT_MAXOP(DEST, OP, ARG1, ARG2, BITS) \
3815 float_status *status = &env->active_tc.msa_fp_status; \
3818 set_float_exception_flags(0, status); \
3819 DEST = float ## BITS ## _ ## OP(ARG1, ARG2, status); \
3820 c = update_msacsr(env, 0, 0); \
3822 if (get_enabled_exceptions(env, c)) { \
3823 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
3827 #define FMAXMIN_A(F, G, X, _S, _T, BITS, STATUS) \
3829 uint## BITS ##_t S = _S, T = _T; \
3830 uint## BITS ##_t as, at, xs, xt, xd; \
3831 if (NUMBER_QNAN_PAIR(S, T, BITS, STATUS)) { \
3834 else if (NUMBER_QNAN_PAIR(T, S, BITS, STATUS)) { \
3837 as = float## BITS ##_abs(S); \
3838 at = float## BITS ##_abs(T); \
3839 MSA_FLOAT_MAXOP(xs, F, S, T, BITS); \
3840 MSA_FLOAT_MAXOP(xt, G, S, T, BITS); \
3841 MSA_FLOAT_MAXOP(xd, F, as, at, BITS); \
3842 X = (as == at || xd == float## BITS ##_abs(xs)) ? xs : xt; \
3845 void helper_msa_fmin_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3846 uint32_t ws
, uint32_t wt
)
3848 float_status
*status
= &env
->active_tc
.msa_fp_status
;
3849 wr_t wx
, *pwx
= &wx
;
3850 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3851 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3852 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3854 clear_msacsr_cause(env
);
3856 if (df
== DF_WORD
) {
3858 if (NUMBER_QNAN_PAIR(pws
->w
[0], pwt
->w
[0], 32, status
)) {
3859 MSA_FLOAT_MAXOP(pwx
->w
[0], min
, pws
->w
[0], pws
->w
[0], 32);
3860 } else if (NUMBER_QNAN_PAIR(pwt
->w
[0], pws
->w
[0], 32, status
)) {
3861 MSA_FLOAT_MAXOP(pwx
->w
[0], min
, pwt
->w
[0], pwt
->w
[0], 32);
3863 MSA_FLOAT_MAXOP(pwx
->w
[0], min
, pws
->w
[0], pwt
->w
[0], 32);
3866 if (NUMBER_QNAN_PAIR(pws
->w
[1], pwt
->w
[1], 32, status
)) {
3867 MSA_FLOAT_MAXOP(pwx
->w
[1], min
, pws
->w
[1], pws
->w
[1], 32);
3868 } else if (NUMBER_QNAN_PAIR(pwt
->w
[1], pws
->w
[1], 32, status
)) {
3869 MSA_FLOAT_MAXOP(pwx
->w
[1], min
, pwt
->w
[1], pwt
->w
[1], 32);
3871 MSA_FLOAT_MAXOP(pwx
->w
[1], min
, pws
->w
[1], pwt
->w
[1], 32);
3874 if (NUMBER_QNAN_PAIR(pws
->w
[2], pwt
->w
[2], 32, status
)) {
3875 MSA_FLOAT_MAXOP(pwx
->w
[2], min
, pws
->w
[2], pws
->w
[2], 32);
3876 } else if (NUMBER_QNAN_PAIR(pwt
->w
[2], pws
->w
[2], 32, status
)) {
3877 MSA_FLOAT_MAXOP(pwx
->w
[2], min
, pwt
->w
[2], pwt
->w
[2], 32);
3879 MSA_FLOAT_MAXOP(pwx
->w
[2], min
, pws
->w
[2], pwt
->w
[2], 32);
3882 if (NUMBER_QNAN_PAIR(pws
->w
[3], pwt
->w
[3], 32, status
)) {
3883 MSA_FLOAT_MAXOP(pwx
->w
[3], min
, pws
->w
[3], pws
->w
[3], 32);
3884 } else if (NUMBER_QNAN_PAIR(pwt
->w
[3], pws
->w
[3], 32, status
)) {
3885 MSA_FLOAT_MAXOP(pwx
->w
[3], min
, pwt
->w
[3], pwt
->w
[3], 32);
3887 MSA_FLOAT_MAXOP(pwx
->w
[3], min
, pws
->w
[3], pwt
->w
[3], 32);
3890 } else if (df
== DF_DOUBLE
) {
3892 if (NUMBER_QNAN_PAIR(pws
->d
[0], pwt
->d
[0], 64, status
)) {
3893 MSA_FLOAT_MAXOP(pwx
->d
[0], min
, pws
->d
[0], pws
->d
[0], 64);
3894 } else if (NUMBER_QNAN_PAIR(pwt
->d
[0], pws
->d
[0], 64, status
)) {
3895 MSA_FLOAT_MAXOP(pwx
->d
[0], min
, pwt
->d
[0], pwt
->d
[0], 64);
3897 MSA_FLOAT_MAXOP(pwx
->d
[0], min
, pws
->d
[0], pwt
->d
[0], 64);
3900 if (NUMBER_QNAN_PAIR(pws
->d
[1], pwt
->d
[1], 64, status
)) {
3901 MSA_FLOAT_MAXOP(pwx
->d
[1], min
, pws
->d
[1], pws
->d
[1], 64);
3902 } else if (NUMBER_QNAN_PAIR(pwt
->d
[1], pws
->d
[1], 64, status
)) {
3903 MSA_FLOAT_MAXOP(pwx
->d
[1], min
, pwt
->d
[1], pwt
->d
[1], 64);
3905 MSA_FLOAT_MAXOP(pwx
->d
[1], min
, pws
->d
[1], pwt
->d
[1], 64);
3914 check_msacsr_cause(env
, GETPC());
3916 msa_move_v(pwd
, pwx
);
3919 void helper_msa_fmin_a_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3920 uint32_t ws
, uint32_t wt
)
3922 float_status
*status
= &env
->active_tc
.msa_fp_status
;
3923 wr_t wx
, *pwx
= &wx
;
3924 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3925 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3926 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3928 clear_msacsr_cause(env
);
3930 if (df
== DF_WORD
) {
3931 FMAXMIN_A(min
, max
, pwx
->w
[0], pws
->w
[0], pwt
->w
[0], 32, status
);
3932 FMAXMIN_A(min
, max
, pwx
->w
[1], pws
->w
[1], pwt
->w
[1], 32, status
);
3933 FMAXMIN_A(min
, max
, pwx
->w
[2], pws
->w
[2], pwt
->w
[2], 32, status
);
3934 FMAXMIN_A(min
, max
, pwx
->w
[3], pws
->w
[3], pwt
->w
[3], 32, status
);
3935 } else if (df
== DF_DOUBLE
) {
3936 FMAXMIN_A(min
, max
, pwx
->d
[0], pws
->d
[0], pwt
->d
[0], 64, status
);
3937 FMAXMIN_A(min
, max
, pwx
->d
[1], pws
->d
[1], pwt
->d
[1], 64, status
);
3942 check_msacsr_cause(env
, GETPC());
3944 msa_move_v(pwd
, pwx
);
3947 void helper_msa_fmax_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
3948 uint32_t ws
, uint32_t wt
)
3950 float_status
*status
= &env
->active_tc
.msa_fp_status
;
3951 wr_t wx
, *pwx
= &wx
;
3952 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
3953 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
3954 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
3956 clear_msacsr_cause(env
);
3958 if (df
== DF_WORD
) {
3960 if (NUMBER_QNAN_PAIR(pws
->w
[0], pwt
->w
[0], 32, status
)) {
3961 MSA_FLOAT_MAXOP(pwx
->w
[0], max
, pws
->w
[0], pws
->w
[0], 32);
3962 } else if (NUMBER_QNAN_PAIR(pwt
->w
[0], pws
->w
[0], 32, status
)) {
3963 MSA_FLOAT_MAXOP(pwx
->w
[0], max
, pwt
->w
[0], pwt
->w
[0], 32);
3965 MSA_FLOAT_MAXOP(pwx
->w
[0], max
, pws
->w
[0], pwt
->w
[0], 32);
3968 if (NUMBER_QNAN_PAIR(pws
->w
[1], pwt
->w
[1], 32, status
)) {
3969 MSA_FLOAT_MAXOP(pwx
->w
[1], max
, pws
->w
[1], pws
->w
[1], 32);
3970 } else if (NUMBER_QNAN_PAIR(pwt
->w
[1], pws
->w
[1], 32, status
)) {
3971 MSA_FLOAT_MAXOP(pwx
->w
[1], max
, pwt
->w
[1], pwt
->w
[1], 32);
3973 MSA_FLOAT_MAXOP(pwx
->w
[1], max
, pws
->w
[1], pwt
->w
[1], 32);
3976 if (NUMBER_QNAN_PAIR(pws
->w
[2], pwt
->w
[2], 32, status
)) {
3977 MSA_FLOAT_MAXOP(pwx
->w
[2], max
, pws
->w
[2], pws
->w
[2], 32);
3978 } else if (NUMBER_QNAN_PAIR(pwt
->w
[2], pws
->w
[2], 32, status
)) {
3979 MSA_FLOAT_MAXOP(pwx
->w
[2], max
, pwt
->w
[2], pwt
->w
[2], 32);
3981 MSA_FLOAT_MAXOP(pwx
->w
[2], max
, pws
->w
[2], pwt
->w
[2], 32);
3984 if (NUMBER_QNAN_PAIR(pws
->w
[3], pwt
->w
[3], 32, status
)) {
3985 MSA_FLOAT_MAXOP(pwx
->w
[3], max
, pws
->w
[3], pws
->w
[3], 32);
3986 } else if (NUMBER_QNAN_PAIR(pwt
->w
[3], pws
->w
[3], 32, status
)) {
3987 MSA_FLOAT_MAXOP(pwx
->w
[3], max
, pwt
->w
[3], pwt
->w
[3], 32);
3989 MSA_FLOAT_MAXOP(pwx
->w
[3], max
, pws
->w
[3], pwt
->w
[3], 32);
3992 } else if (df
== DF_DOUBLE
) {
3994 if (NUMBER_QNAN_PAIR(pws
->d
[0], pwt
->d
[0], 64, status
)) {
3995 MSA_FLOAT_MAXOP(pwx
->d
[0], max
, pws
->d
[0], pws
->d
[0], 64);
3996 } else if (NUMBER_QNAN_PAIR(pwt
->d
[0], pws
->d
[0], 64, status
)) {
3997 MSA_FLOAT_MAXOP(pwx
->d
[0], max
, pwt
->d
[0], pwt
->d
[0], 64);
3999 MSA_FLOAT_MAXOP(pwx
->d
[0], max
, pws
->d
[0], pwt
->d
[0], 64);
4002 if (NUMBER_QNAN_PAIR(pws
->d
[1], pwt
->d
[1], 64, status
)) {
4003 MSA_FLOAT_MAXOP(pwx
->d
[1], max
, pws
->d
[1], pws
->d
[1], 64);
4004 } else if (NUMBER_QNAN_PAIR(pwt
->d
[1], pws
->d
[1], 64, status
)) {
4005 MSA_FLOAT_MAXOP(pwx
->d
[1], max
, pwt
->d
[1], pwt
->d
[1], 64);
4007 MSA_FLOAT_MAXOP(pwx
->d
[1], max
, pws
->d
[1], pwt
->d
[1], 64);
4016 check_msacsr_cause(env
, GETPC());
4018 msa_move_v(pwd
, pwx
);
4021 void helper_msa_fmax_a_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4022 uint32_t ws
, uint32_t wt
)
4024 float_status
*status
= &env
->active_tc
.msa_fp_status
;
4025 wr_t wx
, *pwx
= &wx
;
4026 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4027 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4028 wr_t
*pwt
= &(env
->active_fpu
.fpr
[wt
].wr
);
4030 clear_msacsr_cause(env
);
4032 if (df
== DF_WORD
) {
4033 FMAXMIN_A(max
, min
, pwx
->w
[0], pws
->w
[0], pwt
->w
[0], 32, status
);
4034 FMAXMIN_A(max
, min
, pwx
->w
[1], pws
->w
[1], pwt
->w
[1], 32, status
);
4035 FMAXMIN_A(max
, min
, pwx
->w
[2], pws
->w
[2], pwt
->w
[2], 32, status
);
4036 FMAXMIN_A(max
, min
, pwx
->w
[3], pws
->w
[3], pwt
->w
[3], 32, status
);
4037 } else if (df
== DF_DOUBLE
) {
4038 FMAXMIN_A(max
, min
, pwx
->d
[0], pws
->d
[0], pwt
->d
[0], 64, status
);
4039 FMAXMIN_A(max
, min
, pwx
->d
[1], pws
->d
[1], pwt
->d
[1], 64, status
);
4044 check_msacsr_cause(env
, GETPC());
4046 msa_move_v(pwd
, pwx
);
4049 void helper_msa_fclass_df(CPUMIPSState
*env
, uint32_t df
,
4050 uint32_t wd
, uint32_t ws
)
4052 float_status
*status
= &env
->active_tc
.msa_fp_status
;
4054 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4055 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4056 if (df
== DF_WORD
) {
4057 pwd
->w
[0] = float_class_s(pws
->w
[0], status
);
4058 pwd
->w
[1] = float_class_s(pws
->w
[1], status
);
4059 pwd
->w
[2] = float_class_s(pws
->w
[2], status
);
4060 pwd
->w
[3] = float_class_s(pws
->w
[3], status
);
4061 } else if (df
== DF_DOUBLE
) {
4062 pwd
->d
[0] = float_class_d(pws
->d
[0], status
);
4063 pwd
->d
[1] = float_class_d(pws
->d
[1], status
);
4069 #define MSA_FLOAT_UNOP0(DEST, OP, ARG, BITS) \
4071 float_status *status = &env->active_tc.msa_fp_status; \
4074 set_float_exception_flags(0, status); \
4075 DEST = float ## BITS ## _ ## OP(ARG, status); \
4076 c = update_msacsr(env, CLEAR_FS_UNDERFLOW, 0); \
4078 if (get_enabled_exceptions(env, c)) { \
4079 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
4080 } else if (float ## BITS ## _is_any_nan(ARG)) { \
4085 void helper_msa_ftrunc_s_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4088 wr_t wx
, *pwx
= &wx
;
4089 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4090 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4093 clear_msacsr_cause(env
);
4097 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4098 MSA_FLOAT_UNOP0(pwx
->w
[i
], to_int32_round_to_zero
, pws
->w
[i
], 32);
4102 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4103 MSA_FLOAT_UNOP0(pwx
->d
[i
], to_int64_round_to_zero
, pws
->d
[i
], 64);
4110 check_msacsr_cause(env
, GETPC());
4112 msa_move_v(pwd
, pwx
);
4115 void helper_msa_ftrunc_u_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4118 wr_t wx
, *pwx
= &wx
;
4119 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4120 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4123 clear_msacsr_cause(env
);
4127 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4128 MSA_FLOAT_UNOP0(pwx
->w
[i
], to_uint32_round_to_zero
, pws
->w
[i
], 32);
4132 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4133 MSA_FLOAT_UNOP0(pwx
->d
[i
], to_uint64_round_to_zero
, pws
->d
[i
], 64);
4140 check_msacsr_cause(env
, GETPC());
4142 msa_move_v(pwd
, pwx
);
4145 void helper_msa_fsqrt_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4148 wr_t wx
, *pwx
= &wx
;
4149 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4150 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4153 clear_msacsr_cause(env
);
4157 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4158 MSA_FLOAT_UNOP(pwx
->w
[i
], sqrt
, pws
->w
[i
], 32);
4162 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4163 MSA_FLOAT_UNOP(pwx
->d
[i
], sqrt
, pws
->d
[i
], 64);
4170 check_msacsr_cause(env
, GETPC());
4172 msa_move_v(pwd
, pwx
);
4175 #define MSA_FLOAT_RECIPROCAL(DEST, ARG, BITS) \
4177 float_status *status = &env->active_tc.msa_fp_status; \
4180 set_float_exception_flags(0, status); \
4181 DEST = float ## BITS ## _ ## div(FLOAT_ONE ## BITS, ARG, status); \
4182 c = update_msacsr(env, float ## BITS ## _is_infinity(ARG) || \
4183 float ## BITS ## _is_quiet_nan(DEST, status) ? \
4184 0 : RECIPROCAL_INEXACT, \
4185 IS_DENORMAL(DEST, BITS)); \
4187 if (get_enabled_exceptions(env, c)) { \
4188 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
4192 void helper_msa_frsqrt_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4195 wr_t wx
, *pwx
= &wx
;
4196 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4197 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4200 clear_msacsr_cause(env
);
4204 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4205 MSA_FLOAT_RECIPROCAL(pwx
->w
[i
], float32_sqrt(pws
->w
[i
],
4206 &env
->active_tc
.msa_fp_status
), 32);
4210 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4211 MSA_FLOAT_RECIPROCAL(pwx
->d
[i
], float64_sqrt(pws
->d
[i
],
4212 &env
->active_tc
.msa_fp_status
), 64);
4219 check_msacsr_cause(env
, GETPC());
4221 msa_move_v(pwd
, pwx
);
4224 void helper_msa_frcp_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4227 wr_t wx
, *pwx
= &wx
;
4228 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4229 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4232 clear_msacsr_cause(env
);
4236 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4237 MSA_FLOAT_RECIPROCAL(pwx
->w
[i
], pws
->w
[i
], 32);
4241 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4242 MSA_FLOAT_RECIPROCAL(pwx
->d
[i
], pws
->d
[i
], 64);
4249 check_msacsr_cause(env
, GETPC());
4251 msa_move_v(pwd
, pwx
);
4254 void helper_msa_frint_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4257 wr_t wx
, *pwx
= &wx
;
4258 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4259 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4262 clear_msacsr_cause(env
);
4266 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4267 MSA_FLOAT_UNOP(pwx
->w
[i
], round_to_int
, pws
->w
[i
], 32);
4271 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4272 MSA_FLOAT_UNOP(pwx
->d
[i
], round_to_int
, pws
->d
[i
], 64);
4279 check_msacsr_cause(env
, GETPC());
4281 msa_move_v(pwd
, pwx
);
4284 #define MSA_FLOAT_LOGB(DEST, ARG, BITS) \
4286 float_status *status = &env->active_tc.msa_fp_status; \
4289 set_float_exception_flags(0, status); \
4290 set_float_rounding_mode(float_round_down, status); \
4291 DEST = float ## BITS ## _ ## log2(ARG, status); \
4292 DEST = float ## BITS ## _ ## round_to_int(DEST, status); \
4293 set_float_rounding_mode(ieee_rm[(env->active_tc.msacsr & \
4294 MSACSR_RM_MASK) >> MSACSR_RM], \
4297 set_float_exception_flags(get_float_exception_flags(status) & \
4298 (~float_flag_inexact), \
4301 c = update_msacsr(env, 0, IS_DENORMAL(DEST, BITS)); \
4303 if (get_enabled_exceptions(env, c)) { \
4304 DEST = ((FLOAT_SNAN ## BITS(status) >> 6) << 6) | c; \
4308 void helper_msa_flog2_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4311 wr_t wx
, *pwx
= &wx
;
4312 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4313 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4316 clear_msacsr_cause(env
);
4320 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4321 MSA_FLOAT_LOGB(pwx
->w
[i
], pws
->w
[i
], 32);
4325 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4326 MSA_FLOAT_LOGB(pwx
->d
[i
], pws
->d
[i
], 64);
4333 check_msacsr_cause(env
, GETPC());
4335 msa_move_v(pwd
, pwx
);
4338 void helper_msa_fexupl_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4341 wr_t wx
, *pwx
= &wx
;
4342 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4343 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4346 clear_msacsr_cause(env
);
4350 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4352 * Half precision floats come in two formats: standard
4353 * IEEE and "ARM" format. The latter gains extra exponent
4354 * range by omitting the NaN/Inf encodings.
4358 MSA_FLOAT_BINOP(pwx
->w
[i
], from_float16
, Lh(pws
, i
), ieee
, 32);
4362 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4363 MSA_FLOAT_UNOP(pwx
->d
[i
], from_float32
, Lw(pws
, i
), 64);
4370 check_msacsr_cause(env
, GETPC());
4371 msa_move_v(pwd
, pwx
);
4374 void helper_msa_fexupr_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4377 wr_t wx
, *pwx
= &wx
;
4378 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4379 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4382 clear_msacsr_cause(env
);
4386 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4388 * Half precision floats come in two formats: standard
4389 * IEEE and "ARM" format. The latter gains extra exponent
4390 * range by omitting the NaN/Inf encodings.
4394 MSA_FLOAT_BINOP(pwx
->w
[i
], from_float16
, Rh(pws
, i
), ieee
, 32);
4398 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4399 MSA_FLOAT_UNOP(pwx
->d
[i
], from_float32
, Rw(pws
, i
), 64);
4406 check_msacsr_cause(env
, GETPC());
4407 msa_move_v(pwd
, pwx
);
4410 void helper_msa_ffql_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4413 wr_t wx
, *pwx
= &wx
;
4414 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4415 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4420 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4421 MSA_FLOAT_UNOP(pwx
->w
[i
], from_q16
, Lh(pws
, i
), 32);
4425 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4426 MSA_FLOAT_UNOP(pwx
->d
[i
], from_q32
, Lw(pws
, i
), 64);
4433 msa_move_v(pwd
, pwx
);
4436 void helper_msa_ffqr_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4439 wr_t wx
, *pwx
= &wx
;
4440 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4441 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4446 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4447 MSA_FLOAT_UNOP(pwx
->w
[i
], from_q16
, Rh(pws
, i
), 32);
4451 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4452 MSA_FLOAT_UNOP(pwx
->d
[i
], from_q32
, Rw(pws
, i
), 64);
4459 msa_move_v(pwd
, pwx
);
4462 void helper_msa_ftint_s_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4465 wr_t wx
, *pwx
= &wx
;
4466 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4467 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4470 clear_msacsr_cause(env
);
4474 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4475 MSA_FLOAT_UNOP0(pwx
->w
[i
], to_int32
, pws
->w
[i
], 32);
4479 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4480 MSA_FLOAT_UNOP0(pwx
->d
[i
], to_int64
, pws
->d
[i
], 64);
4487 check_msacsr_cause(env
, GETPC());
4489 msa_move_v(pwd
, pwx
);
4492 void helper_msa_ftint_u_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4495 wr_t wx
, *pwx
= &wx
;
4496 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4497 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4500 clear_msacsr_cause(env
);
4504 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4505 MSA_FLOAT_UNOP0(pwx
->w
[i
], to_uint32
, pws
->w
[i
], 32);
4509 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4510 MSA_FLOAT_UNOP0(pwx
->d
[i
], to_uint64
, pws
->d
[i
], 64);
4517 check_msacsr_cause(env
, GETPC());
4519 msa_move_v(pwd
, pwx
);
4522 #define float32_from_int32 int32_to_float32
4523 #define float32_from_uint32 uint32_to_float32
4525 #define float64_from_int64 int64_to_float64
4526 #define float64_from_uint64 uint64_to_float64
4528 void helper_msa_ffint_s_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4531 wr_t wx
, *pwx
= &wx
;
4532 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4533 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4536 clear_msacsr_cause(env
);
4540 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4541 MSA_FLOAT_UNOP(pwx
->w
[i
], from_int32
, pws
->w
[i
], 32);
4545 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4546 MSA_FLOAT_UNOP(pwx
->d
[i
], from_int64
, pws
->d
[i
], 64);
4553 check_msacsr_cause(env
, GETPC());
4555 msa_move_v(pwd
, pwx
);
4558 void helper_msa_ffint_u_df(CPUMIPSState
*env
, uint32_t df
, uint32_t wd
,
4561 wr_t wx
, *pwx
= &wx
;
4562 wr_t
*pwd
= &(env
->active_fpu
.fpr
[wd
].wr
);
4563 wr_t
*pws
= &(env
->active_fpu
.fpr
[ws
].wr
);
4566 clear_msacsr_cause(env
);
4570 for (i
= 0; i
< DF_ELEMENTS(DF_WORD
); i
++) {
4571 MSA_FLOAT_UNOP(pwx
->w
[i
], from_uint32
, pws
->w
[i
], 32);
4575 for (i
= 0; i
< DF_ELEMENTS(DF_DOUBLE
); i
++) {
4576 MSA_FLOAT_UNOP(pwx
->d
[i
], from_uint64
, pws
->d
[i
], 64);
4583 check_msacsr_cause(env
, GETPC());
4585 msa_move_v(pwd
, pwx
);