1 ;; Machine description for Loongson-specific patterns, such as
2 ;; ST Microelectronics Loongson-2E/2F etc.
3 ;; Copyright (C) 2008-2018 Free Software Foundation, Inc.
4 ;; Contributed by CodeSourcery.
6 ;; This file is part of GCC.
8 ;; GCC is free software; you can redistribute it and/or modify
9 ;; it under the terms of the GNU General Public License as published by
10 ;; the Free Software Foundation; either version 3, or (at your option)
13 ;; GCC is distributed in the hope that it will be useful,
14 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
15 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 ;; GNU General Public License for more details.
18 ;; You should have received a copy of the GNU General Public License
19 ;; along with GCC; see the file COPYING3. If not see
20 ;; <http://www.gnu.org/licenses/>.
22 (define_c_enum "unspec" [
24 UNSPEC_LOONGSON_PCMPEQ
25 UNSPEC_LOONGSON_PCMPGT
27 UNSPEC_LOONGSON_PINSRH
30 UNSPEC_LOONGSON_PMOVMSK
31 UNSPEC_LOONGSON_PMULHU
34 UNSPEC_LOONGSON_PASUBUB
36 UNSPEC_LOONGSON_PSADBH
37 UNSPEC_LOONGSON_PSHUFH
38 UNSPEC_LOONGSON_PUNPCKH
39 UNSPEC_LOONGSON_PUNPCKL
46 ;; Mode iterators and attributes.
48 ;; 64-bit vectors of bytes.
49 (define_mode_iterator VB [V8QI])
51 ;; 64-bit vectors of halfwords.
52 (define_mode_iterator VH [V4HI])
54 ;; 64-bit vectors of words.
55 (define_mode_iterator VW [V2SI])
57 ;; 64-bit vectors of halfwords and bytes.
58 (define_mode_iterator VHB [V4HI V8QI])
60 ;; 64-bit vectors of words and halfwords.
61 (define_mode_iterator VWH [V2SI V4HI])
63 ;; 64-bit vectors of words and bytes
64 (define_mode_iterator VWB [V2SI V8QI])
66 ;; 64-bit vectors of words, halfwords and bytes.
67 (define_mode_iterator VWHB [V2SI V4HI V8QI])
69 ;; 64-bit vectors of words, halfwords and bytes; and DImode.
70 (define_mode_iterator VWHBDI [V2SI V4HI V8QI DI])
72 ;; The Loongson instruction suffixes corresponding to the modes in the
74 (define_mode_attr V_suffix [(V2SI "w") (V4HI "h") (V8QI "b") (DI "d")])
76 ;; Given a vector type T, the mode of a vector half the size of T
77 ;; and with the same number of elements.
78 (define_mode_attr V_squash [(V2SI "V2HI") (V4HI "V4QI")])
80 ;; Given a vector type T, the mode of a vector the same size as T
81 ;; but with half as many elements.
82 (define_mode_attr V_stretch_half [(V2SI "DI") (V4HI "V2SI") (V8QI "V4HI")])
84 ;; The Loongson instruction suffixes corresponding to the transformation
85 ;; expressed by V_stretch_half.
86 (define_mode_attr V_stretch_half_suffix [(V2SI "wd") (V4HI "hw") (V8QI "bh")])
88 ;; Given a vector type T, the mode of a vector the same size as T
89 ;; but with twice as many elements.
90 (define_mode_attr V_squash_double [(V2SI "V4HI") (V4HI "V8QI")])
92 ;; Given a vector type T, the inner mode.
93 (define_mode_attr V_inner [(V8QI "QI") (V4HI "HI") (V2SI "SI")])
95 ;; The Loongson instruction suffixes corresponding to the conversions
96 ;; specified by V_half_width.
97 (define_mode_attr V_squash_double_suffix [(V2SI "wh") (V4HI "hb")])
101 ;; Expander to legitimize moves involving values of vector modes.
102 (define_expand "mov<mode>"
103 [(set (match_operand:VWHB 0)
104 (match_operand:VWHB 1))]
105 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
107 if (mips_legitimize_move (<MODE>mode, operands[0], operands[1]))
111 ;; Handle legitimized moves between values of vector modes.
112 (define_insn "mov<mode>_internal"
113 [(set (match_operand:VWHB 0 "nonimmediate_operand" "=m,f,d,f, d, m, d")
114 (match_operand:VWHB 1 "move_operand" "f,m,f,dYG,dYG,dYG,m"))]
115 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
116 { return mips_output_move (operands[0], operands[1]); }
117 [(set_attr "move_type" "fpstore,fpload,mfc,mtc,move,store,load")
118 (set_attr "mode" "DI")])
120 ;; Initialization of a vector.
122 (define_expand "vec_init<mode><unitmode>"
123 [(set (match_operand:VWHB 0 "register_operand")
124 (match_operand 1 ""))]
125 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
127 mips_expand_vector_init (operands[0], operands[1]);
131 ;; Helper for vec_init. Initialize element 0 of the output from the input.
132 ;; All other elements are undefined.
133 (define_insn "loongson_vec_init1_<mode>"
134 [(set (match_operand:VHB 0 "register_operand" "=f")
135 (unspec:VHB [(truncate:<V_inner>
136 (match_operand:DI 1 "reg_or_0_operand" "Jd"))]
137 UNSPEC_LOONGSON_VINIT))]
138 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
140 [(set_attr "move_type" "mtc")
141 (set_attr "mode" "DI")])
143 ;; Helper for vec_initv2si.
144 (define_insn "*vec_concatv2si"
145 [(set (match_operand:V2SI 0 "register_operand" "=f")
147 (match_operand:SI 1 "register_operand" "f")
148 (match_operand:SI 2 "register_operand" "f")))]
149 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
150 "punpcklwd\t%0,%1,%2"
151 [(set_attr "type" "fcvt")])
153 ;; Instruction patterns for SIMD instructions.
155 ;; Pack with signed saturation.
156 (define_insn "vec_pack_ssat_<mode>"
157 [(set (match_operand:<V_squash_double> 0 "register_operand" "=f")
158 (vec_concat:<V_squash_double>
159 (ss_truncate:<V_squash>
160 (match_operand:VWH 1 "register_operand" "f"))
161 (ss_truncate:<V_squash>
162 (match_operand:VWH 2 "register_operand" "f"))))]
163 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
164 "packss<V_squash_double_suffix>\t%0,%1,%2"
165 [(set_attr "type" "fmul")])
167 ;; Pack with unsigned saturation.
168 (define_insn "vec_pack_usat_<mode>"
169 [(set (match_operand:<V_squash_double> 0 "register_operand" "=f")
170 (vec_concat:<V_squash_double>
171 (us_truncate:<V_squash>
172 (match_operand:VH 1 "register_operand" "f"))
173 (us_truncate:<V_squash>
174 (match_operand:VH 2 "register_operand" "f"))))]
175 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
176 "packus<V_squash_double_suffix>\t%0,%1,%2"
177 [(set_attr "type" "fmul")])
179 ;; Addition, treating overflow by wraparound.
180 (define_insn "add<mode>3"
181 [(set (match_operand:VWHB 0 "register_operand" "=f")
182 (plus:VWHB (match_operand:VWHB 1 "register_operand" "f")
183 (match_operand:VWHB 2 "register_operand" "f")))]
184 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
185 "padd<V_suffix>\t%0,%1,%2"
186 [(set_attr "type" "fadd")])
188 ;; Addition of doubleword integers stored in FP registers.
189 ;; Overflow is treated by wraparound.
190 ;; We use 'unspec' instead of 'plus' here to avoid clash with
191 ;; mips.md::add<mode>3. If 'plus' was used, then such instruction
192 ;; would be recognized as adddi3 and reload would make it use
193 ;; GPRs instead of FPRs.
194 (define_insn "loongson_paddd"
195 [(set (match_operand:DI 0 "register_operand" "=f")
196 (unspec:DI [(match_operand:DI 1 "register_operand" "f")
197 (match_operand:DI 2 "register_operand" "f")]
198 UNSPEC_LOONGSON_PADDD))]
199 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
201 [(set_attr "type" "fadd")])
203 ;; Addition, treating overflow by signed saturation.
204 (define_insn "ssadd<mode>3"
205 [(set (match_operand:VHB 0 "register_operand" "=f")
206 (ss_plus:VHB (match_operand:VHB 1 "register_operand" "f")
207 (match_operand:VHB 2 "register_operand" "f")))]
208 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
209 "padds<V_suffix>\t%0,%1,%2"
210 [(set_attr "type" "fadd")])
212 ;; Addition, treating overflow by unsigned saturation.
213 (define_insn "usadd<mode>3"
214 [(set (match_operand:VHB 0 "register_operand" "=f")
215 (us_plus:VHB (match_operand:VHB 1 "register_operand" "f")
216 (match_operand:VHB 2 "register_operand" "f")))]
217 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
218 "paddus<V_suffix>\t%0,%1,%2"
219 [(set_attr "type" "fadd")])
222 (define_insn "loongson_pandn_<V_suffix>"
223 [(set (match_operand:VWHBDI 0 "register_operand" "=f")
225 (not:VWHBDI (match_operand:VWHBDI 1 "register_operand" "f"))
226 (match_operand:VWHBDI 2 "register_operand" "f")))]
227 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
229 [(set_attr "type" "fmul")])
232 (define_insn "and<mode>3"
233 [(set (match_operand:VWHB 0 "register_operand" "=f")
234 (and:VWHB (match_operand:VWHB 1 "register_operand" "f")
235 (match_operand:VWHB 2 "register_operand" "f")))]
236 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
238 [(set_attr "type" "fmul")])
241 (define_insn "ior<mode>3"
242 [(set (match_operand:VWHB 0 "register_operand" "=f")
243 (ior:VWHB (match_operand:VWHB 1 "register_operand" "f")
244 (match_operand:VWHB 2 "register_operand" "f")))]
245 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
247 [(set_attr "type" "fcvt")])
250 (define_insn "xor<mode>3"
251 [(set (match_operand:VWHB 0 "register_operand" "=f")
252 (xor:VWHB (match_operand:VWHB 1 "register_operand" "f")
253 (match_operand:VWHB 2 "register_operand" "f")))]
254 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
256 [(set_attr "type" "fmul")])
259 (define_insn "*loongson_nor"
260 [(set (match_operand:VWHB 0 "register_operand" "=f")
262 (not:VWHB (match_operand:VWHB 1 "register_operand" "f"))
263 (not:VWHB (match_operand:VWHB 2 "register_operand" "f"))))]
264 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
266 [(set_attr "type" "fmul")])
269 (define_insn "one_cmpl<mode>2"
270 [(set (match_operand:VWHB 0 "register_operand" "=f")
271 (not:VWHB (match_operand:VWHB 1 "register_operand" "f")))]
272 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
274 [(set_attr "type" "fmul")])
277 (define_insn "loongson_pavg<V_suffix>"
278 [(set (match_operand:VHB 0 "register_operand" "=f")
279 (unspec:VHB [(match_operand:VHB 1 "register_operand" "f")
280 (match_operand:VHB 2 "register_operand" "f")]
281 UNSPEC_LOONGSON_PAVG))]
282 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
283 "pavg<V_suffix>\t%0,%1,%2"
284 [(set_attr "type" "fadd")])
287 (define_insn "loongson_pcmpeq<V_suffix>"
288 [(set (match_operand:VWHB 0 "register_operand" "=f")
289 (unspec:VWHB [(match_operand:VWHB 1 "register_operand" "f")
290 (match_operand:VWHB 2 "register_operand" "f")]
291 UNSPEC_LOONGSON_PCMPEQ))]
292 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
293 "pcmpeq<V_suffix>\t%0,%1,%2"
294 [(set_attr "type" "fadd")])
296 ;; Greater-than test.
297 (define_insn "loongson_pcmpgt<V_suffix>"
298 [(set (match_operand:VWHB 0 "register_operand" "=f")
299 (unspec:VWHB [(match_operand:VWHB 1 "register_operand" "f")
300 (match_operand:VWHB 2 "register_operand" "f")]
301 UNSPEC_LOONGSON_PCMPGT))]
302 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
303 "pcmpgt<V_suffix>\t%0,%1,%2"
304 [(set_attr "type" "fadd")])
307 (define_insn "loongson_pextrh"
308 [(set (match_operand:V4HI 0 "register_operand" "=f")
309 (unspec:V4HI [(match_operand:V4HI 1 "register_operand" "f")
310 (match_operand:SI 2 "register_operand" "f")]
311 UNSPEC_LOONGSON_PEXTR))]
312 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
314 [(set_attr "type" "fcvt")])
317 (define_insn "loongson_pinsrh_0"
318 [(set (match_operand:V4HI 0 "register_operand" "=f")
321 (match_operand:V4HI 1 "register_operand" "f")
322 (match_operand:V4HI 2 "register_operand" "f"))
323 (parallel [(const_int 4) (const_int 1)
324 (const_int 2) (const_int 3)])))]
325 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
327 [(set_attr "type" "fdiv")])
329 (define_insn "loongson_pinsrh_1"
330 [(set (match_operand:V4HI 0 "register_operand" "=f")
333 (match_operand:V4HI 1 "register_operand" "f")
334 (match_operand:V4HI 2 "register_operand" "f"))
335 (parallel [(const_int 0) (const_int 4)
336 (const_int 2) (const_int 3)])))]
337 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
339 [(set_attr "type" "fdiv")])
341 (define_insn "loongson_pinsrh_2"
342 [(set (match_operand:V4HI 0 "register_operand" "=f")
345 (match_operand:V4HI 1 "register_operand" "f")
346 (match_operand:V4HI 2 "register_operand" "f"))
347 (parallel [(const_int 0) (const_int 1)
348 (const_int 4) (const_int 3)])))]
349 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
351 [(set_attr "type" "fdiv")])
353 (define_insn "loongson_pinsrh_3"
354 [(set (match_operand:V4HI 0 "register_operand" "=f")
357 (match_operand:V4HI 1 "register_operand" "f")
358 (match_operand:V4HI 2 "register_operand" "f"))
359 (parallel [(const_int 0) (const_int 1)
360 (const_int 2) (const_int 4)])))]
361 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
363 [(set_attr "type" "fdiv")])
365 (define_insn "*vec_setv4hi"
366 [(set (match_operand:V4HI 0 "register_operand" "=f")
367 (unspec:V4HI [(match_operand:V4HI 1 "register_operand" "f")
368 (match_operand:SI 2 "register_operand" "f")
369 (match_operand:SI 3 "const_0_to_3_operand" "")]
370 UNSPEC_LOONGSON_PINSRH))]
371 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
372 "pinsrh_%3\t%0,%1,%2"
373 [(set_attr "type" "fdiv")])
375 (define_expand "vec_setv4hi"
376 [(set (match_operand:V4HI 0 "register_operand" "=f")
377 (unspec:V4HI [(match_operand:V4HI 1 "register_operand" "f")
378 (match_operand:HI 2 "register_operand" "f")
379 (match_operand:SI 3 "const_0_to_3_operand" "")]
380 UNSPEC_LOONGSON_PINSRH))]
381 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
383 rtx ext = gen_reg_rtx (SImode);
384 emit_move_insn (ext, gen_lowpart (SImode, operands[1]));
388 ;; Multiply and add packed integers.
389 (define_insn "loongson_pmaddhw"
390 [(set (match_operand:V2SI 0 "register_operand" "=f")
391 (unspec:V2SI [(match_operand:V4HI 1 "register_operand" "f")
392 (match_operand:V4HI 2 "register_operand" "f")]
393 UNSPEC_LOONGSON_PMADD))]
394 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
396 [(set_attr "type" "fmul")])
398 (define_expand "sdot_prodv4hi"
399 [(match_operand:V2SI 0 "register_operand" "")
400 (match_operand:V4HI 1 "register_operand" "")
401 (match_operand:V4HI 2 "register_operand" "")
402 (match_operand:V2SI 3 "register_operand" "")]
403 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
405 rtx t = gen_reg_rtx (V2SImode);
406 emit_insn (gen_loongson_pmaddhw (t, operands[1], operands[2]));
407 emit_insn (gen_addv2si3 (operands[0], t, operands[3]));
411 ;; Maximum of signed halfwords.
412 (define_insn "smaxv4hi3"
413 [(set (match_operand:V4HI 0 "register_operand" "=f")
414 (smax:V4HI (match_operand:V4HI 1 "register_operand" "f")
415 (match_operand:V4HI 2 "register_operand" "f")))]
416 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
418 [(set_attr "type" "fadd")])
420 (define_expand "smax<mode>3"
421 [(match_operand:VWB 0 "register_operand" "")
422 (match_operand:VWB 1 "register_operand" "")
423 (match_operand:VWB 2 "register_operand" "")]
424 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
426 mips_expand_vec_minmax (operands[0], operands[1], operands[2],
427 gen_loongson_pcmpgt<V_suffix>, false);
431 ;; Maximum of unsigned bytes.
432 (define_insn "umaxv8qi3"
433 [(set (match_operand:V8QI 0 "register_operand" "=f")
434 (umax:V8QI (match_operand:V8QI 1 "register_operand" "f")
435 (match_operand:V8QI 2 "register_operand" "f")))]
436 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
438 [(set_attr "type" "fadd")])
440 ;; Minimum of signed halfwords.
441 (define_insn "sminv4hi3"
442 [(set (match_operand:V4HI 0 "register_operand" "=f")
443 (smin:V4HI (match_operand:V4HI 1 "register_operand" "f")
444 (match_operand:V4HI 2 "register_operand" "f")))]
445 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
447 [(set_attr "type" "fadd")])
449 (define_expand "smin<mode>3"
450 [(match_operand:VWB 0 "register_operand" "")
451 (match_operand:VWB 1 "register_operand" "")
452 (match_operand:VWB 2 "register_operand" "")]
453 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
455 mips_expand_vec_minmax (operands[0], operands[1], operands[2],
456 gen_loongson_pcmpgt<V_suffix>, true);
460 ;; Minimum of unsigned bytes.
461 (define_insn "uminv8qi3"
462 [(set (match_operand:V8QI 0 "register_operand" "=f")
463 (umin:V8QI (match_operand:V8QI 1 "register_operand" "f")
464 (match_operand:V8QI 2 "register_operand" "f")))]
465 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
467 [(set_attr "type" "fadd")])
470 (define_insn "loongson_pmovmsk<V_suffix>"
471 [(set (match_operand:VB 0 "register_operand" "=f")
472 (unspec:VB [(match_operand:VB 1 "register_operand" "f")]
473 UNSPEC_LOONGSON_PMOVMSK))]
474 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
475 "pmovmsk<V_suffix>\t%0,%1"
476 [(set_attr "type" "fabs")])
478 ;; Multiply unsigned integers and store high result.
479 (define_insn "umul<mode>3_highpart"
480 [(set (match_operand:VH 0 "register_operand" "=f")
481 (unspec:VH [(match_operand:VH 1 "register_operand" "f")
482 (match_operand:VH 2 "register_operand" "f")]
483 UNSPEC_LOONGSON_PMULHU))]
484 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
485 "pmulhu<V_suffix>\t%0,%1,%2"
486 [(set_attr "type" "fmul")])
488 ;; Multiply signed integers and store high result.
489 (define_insn "smul<mode>3_highpart"
490 [(set (match_operand:VH 0 "register_operand" "=f")
491 (unspec:VH [(match_operand:VH 1 "register_operand" "f")
492 (match_operand:VH 2 "register_operand" "f")]
493 UNSPEC_LOONGSON_PMULH))]
494 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
495 "pmulh<V_suffix>\t%0,%1,%2"
496 [(set_attr "type" "fmul")])
498 ;; Multiply signed integers and store low result.
499 (define_insn "mul<mode>3"
500 [(set (match_operand:VH 0 "register_operand" "=f")
501 (mult:VH (match_operand:VH 1 "register_operand" "f")
502 (match_operand:VH 2 "register_operand" "f")))]
503 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
504 "pmull<V_suffix>\t%0,%1,%2"
505 [(set_attr "type" "fmul")])
507 ;; Multiply unsigned word integers.
508 (define_insn "loongson_pmulu<V_suffix>"
509 [(set (match_operand:DI 0 "register_operand" "=f")
510 (unspec:DI [(match_operand:VW 1 "register_operand" "f")
511 (match_operand:VW 2 "register_operand" "f")]
512 UNSPEC_LOONGSON_PMULU))]
513 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
514 "pmulu<V_suffix>\t%0,%1,%2"
515 [(set_attr "type" "fmul")])
517 ;; Absolute difference.
518 (define_insn "loongson_pasubub"
519 [(set (match_operand:VB 0 "register_operand" "=f")
520 (unspec:VB [(match_operand:VB 1 "register_operand" "f")
521 (match_operand:VB 2 "register_operand" "f")]
522 UNSPEC_LOONGSON_PASUBUB))]
523 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
525 [(set_attr "type" "fadd")])
527 ;; Sum of unsigned byte integers.
528 (define_insn "loongson_biadd"
529 [(set (match_operand:<V_stretch_half> 0 "register_operand" "=f")
530 (unspec:<V_stretch_half> [(match_operand:VB 1 "register_operand" "f")]
531 UNSPEC_LOONGSON_BIADD))]
532 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
534 [(set_attr "type" "fabs")])
536 (define_insn "reduc_uplus_v8qi"
537 [(set (match_operand:V8QI 0 "register_operand" "=f")
538 (unspec:V8QI [(match_operand:V8QI 1 "register_operand" "f")]
539 UNSPEC_LOONGSON_BIADD))]
540 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
542 [(set_attr "type" "fabs")])
544 ;; Sum of absolute differences.
545 (define_insn "loongson_psadbh"
546 [(set (match_operand:<V_stretch_half> 0 "register_operand" "=f")
547 (unspec:<V_stretch_half> [(match_operand:VB 1 "register_operand" "f")
548 (match_operand:VB 2 "register_operand" "f")]
549 UNSPEC_LOONGSON_PSADBH))]
550 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
551 "pasubub\t%0,%1,%2;biadd\t%0,%0"
552 [(set_attr "type" "fadd")])
554 ;; Shuffle halfwords.
555 (define_insn "loongson_pshufh"
556 [(set (match_operand:VH 0 "register_operand" "=f")
557 (unspec:VH [(match_operand:VH 1 "register_operand" "f")
558 (match_operand:SI 2 "register_operand" "f")]
559 UNSPEC_LOONGSON_PSHUFH))]
560 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
562 [(set_attr "type" "fmul")])
564 ;; Shift left logical.
565 (define_insn "ashl<mode>3"
566 [(set (match_operand:VWH 0 "register_operand" "=f")
567 (ashift:VWH (match_operand:VWH 1 "register_operand" "f")
568 (match_operand:SI 2 "register_operand" "f")))]
569 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
570 "psll<V_suffix>\t%0,%1,%2"
571 [(set_attr "type" "fcvt")])
573 ;; Shift right arithmetic.
574 (define_insn "ashr<mode>3"
575 [(set (match_operand:VWH 0 "register_operand" "=f")
576 (ashiftrt:VWH (match_operand:VWH 1 "register_operand" "f")
577 (match_operand:SI 2 "register_operand" "f")))]
578 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
579 "psra<V_suffix>\t%0,%1,%2"
580 [(set_attr "type" "fcvt")])
582 ;; Shift right logical.
583 (define_insn "lshr<mode>3"
584 [(set (match_operand:VWH 0 "register_operand" "=f")
585 (lshiftrt:VWH (match_operand:VWH 1 "register_operand" "f")
586 (match_operand:SI 2 "register_operand" "f")))]
587 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
588 "psrl<V_suffix>\t%0,%1,%2"
589 [(set_attr "type" "fcvt")])
591 ;; Subtraction, treating overflow by wraparound.
592 (define_insn "sub<mode>3"
593 [(set (match_operand:VWHB 0 "register_operand" "=f")
594 (minus:VWHB (match_operand:VWHB 1 "register_operand" "f")
595 (match_operand:VWHB 2 "register_operand" "f")))]
596 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
597 "psub<V_suffix>\t%0,%1,%2"
598 [(set_attr "type" "fadd")])
600 ;; Subtraction of doubleword integers stored in FP registers.
601 ;; Overflow is treated by wraparound.
602 ;; See loongson_paddd for the reason we use 'unspec' rather than
604 (define_insn "loongson_psubd"
605 [(set (match_operand:DI 0 "register_operand" "=f")
606 (unspec:DI [(match_operand:DI 1 "register_operand" "f")
607 (match_operand:DI 2 "register_operand" "f")]
608 UNSPEC_LOONGSON_PSUBD))]
609 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
611 [(set_attr "type" "fadd")])
613 ;; Subtraction, treating overflow by signed saturation.
614 (define_insn "sssub<mode>3"
615 [(set (match_operand:VHB 0 "register_operand" "=f")
616 (ss_minus:VHB (match_operand:VHB 1 "register_operand" "f")
617 (match_operand:VHB 2 "register_operand" "f")))]
618 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
619 "psubs<V_suffix>\t%0,%1,%2"
620 [(set_attr "type" "fadd")])
622 ;; Subtraction, treating overflow by unsigned saturation.
623 (define_insn "ussub<mode>3"
624 [(set (match_operand:VHB 0 "register_operand" "=f")
625 (us_minus:VHB (match_operand:VHB 1 "register_operand" "f")
626 (match_operand:VHB 2 "register_operand" "f")))]
627 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
628 "psubus<V_suffix>\t%0,%1,%2"
629 [(set_attr "type" "fadd")])
631 ;; Unpack high data. Recall that Loongson only runs in little-endian.
632 (define_insn "loongson_punpckhbh"
633 [(set (match_operand:V8QI 0 "register_operand" "=f")
636 (match_operand:V8QI 1 "register_operand" "f")
637 (match_operand:V8QI 2 "register_operand" "f"))
638 (parallel [(const_int 4) (const_int 12)
639 (const_int 5) (const_int 13)
640 (const_int 6) (const_int 14)
641 (const_int 7) (const_int 15)])))]
642 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
643 "punpckhbh\t%0,%1,%2"
644 [(set_attr "type" "fdiv")])
646 (define_insn "loongson_punpckhhw"
647 [(set (match_operand:V4HI 0 "register_operand" "=f")
650 (match_operand:V4HI 1 "register_operand" "f")
651 (match_operand:V4HI 2 "register_operand" "f"))
652 (parallel [(const_int 2) (const_int 6)
653 (const_int 3) (const_int 7)])))]
654 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
655 "punpckhhw\t%0,%1,%2"
656 [(set_attr "type" "fdiv")])
658 (define_insn "loongson_punpckhhw_qi"
659 [(set (match_operand:V8QI 0 "register_operand" "=f")
662 (match_operand:V8QI 1 "register_operand" "f")
663 (match_operand:V8QI 2 "register_operand" "f"))
664 (parallel [(const_int 4) (const_int 5)
665 (const_int 12) (const_int 13)
666 (const_int 6) (const_int 7)
667 (const_int 14) (const_int 15)])))]
668 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
669 "punpckhhw\t%0,%1,%2"
670 [(set_attr "type" "fdiv")])
672 (define_insn "loongson_punpckhwd"
673 [(set (match_operand:V2SI 0 "register_operand" "=f")
676 (match_operand:V2SI 1 "register_operand" "f")
677 (match_operand:V2SI 2 "register_operand" "f"))
678 (parallel [(const_int 1) (const_int 3)])))]
679 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
680 "punpckhwd\t%0,%1,%2"
681 [(set_attr "type" "fcvt")])
683 (define_insn "loongson_punpckhwd_qi"
684 [(set (match_operand:V8QI 0 "register_operand" "=f")
687 (match_operand:V8QI 1 "register_operand" "f")
688 (match_operand:V8QI 2 "register_operand" "f"))
689 (parallel [(const_int 4) (const_int 5)
690 (const_int 6) (const_int 7)
691 (const_int 12) (const_int 13)
692 (const_int 14) (const_int 15)])))]
693 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
694 "punpckhwd\t%0,%1,%2"
695 [(set_attr "type" "fcvt")])
697 (define_insn "loongson_punpckhwd_hi"
698 [(set (match_operand:V4HI 0 "register_operand" "=f")
701 (match_operand:V4HI 1 "register_operand" "f")
702 (match_operand:V4HI 2 "register_operand" "f"))
703 (parallel [(const_int 2) (const_int 3)
704 (const_int 6) (const_int 7)])))]
705 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
706 "punpckhwd\t%0,%1,%2"
707 [(set_attr "type" "fcvt")])
710 (define_insn "loongson_punpcklbh"
711 [(set (match_operand:V8QI 0 "register_operand" "=f")
714 (match_operand:V8QI 1 "register_operand" "f")
715 (match_operand:V8QI 2 "register_operand" "f"))
716 (parallel [(const_int 0) (const_int 8)
717 (const_int 1) (const_int 9)
718 (const_int 2) (const_int 10)
719 (const_int 3) (const_int 11)])))]
720 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
721 "punpcklbh\t%0,%1,%2"
722 [(set_attr "type" "fdiv")])
724 (define_insn "loongson_punpcklhw"
725 [(set (match_operand:V4HI 0 "register_operand" "=f")
728 (match_operand:V4HI 1 "register_operand" "f")
729 (match_operand:V4HI 2 "register_operand" "f"))
730 (parallel [(const_int 0) (const_int 4)
731 (const_int 1) (const_int 5)])))]
732 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
733 "punpcklhw\t%0,%1,%2"
734 [(set_attr "type" "fdiv")])
736 (define_insn "*loongson_punpcklhw_qi"
737 [(set (match_operand:V8QI 0 "register_operand" "=f")
740 (match_operand:V8QI 1 "register_operand" "f")
741 (match_operand:V8QI 2 "register_operand" "f"))
742 (parallel [(const_int 0) (const_int 1)
743 (const_int 8) (const_int 9)
744 (const_int 2) (const_int 3)
745 (const_int 10) (const_int 11)])))]
746 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
747 "punpcklhw\t%0,%1,%2"
748 [(set_attr "type" "fdiv")])
750 (define_insn "loongson_punpcklwd"
751 [(set (match_operand:V2SI 0 "register_operand" "=f")
754 (match_operand:V2SI 1 "register_operand" "f")
755 (match_operand:V2SI 2 "register_operand" "f"))
756 (parallel [(const_int 0) (const_int 2)])))]
757 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
758 "punpcklwd\t%0,%1,%2"
759 [(set_attr "type" "fcvt")])
761 (define_insn "*loongson_punpcklwd_qi"
762 [(set (match_operand:V8QI 0 "register_operand" "=f")
765 (match_operand:V8QI 1 "register_operand" "f")
766 (match_operand:V8QI 2 "register_operand" "f"))
767 (parallel [(const_int 0) (const_int 1)
768 (const_int 2) (const_int 3)
769 (const_int 8) (const_int 9)
770 (const_int 10) (const_int 11)])))]
771 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
772 "punpcklwd\t%0,%1,%2"
773 [(set_attr "type" "fcvt")])
775 (define_insn "*loongson_punpcklwd_hi"
776 [(set (match_operand:V4HI 0 "register_operand" "=f")
779 (match_operand:V4HI 1 "register_operand" "f")
780 (match_operand:V4HI 2 "register_operand" "f"))
781 (parallel [(const_int 0) (const_int 1)
782 (const_int 4) (const_int 5)])))]
783 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
784 "punpcklwd\t%0,%1,%2"
785 [(set_attr "type" "fcvt")])
787 (define_expand "vec_unpacks_lo_<mode>"
788 [(match_operand:<V_stretch_half> 0 "register_operand" "")
789 (match_operand:VHB 1 "register_operand" "")]
790 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
792 mips_expand_vec_unpack (operands, false, false);
796 (define_expand "vec_unpacks_hi_<mode>"
797 [(match_operand:<V_stretch_half> 0 "register_operand" "")
798 (match_operand:VHB 1 "register_operand" "")]
799 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
801 mips_expand_vec_unpack (operands, false, true);
805 (define_expand "vec_unpacku_lo_<mode>"
806 [(match_operand:<V_stretch_half> 0 "register_operand" "")
807 (match_operand:VHB 1 "register_operand" "")]
808 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
810 mips_expand_vec_unpack (operands, true, false);
814 (define_expand "vec_unpacku_hi_<mode>"
815 [(match_operand:<V_stretch_half> 0 "register_operand" "")
816 (match_operand:VHB 1 "register_operand" "")]
817 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
819 mips_expand_vec_unpack (operands, true, true);
823 ;; Whole vector shifts, used for reduction epilogues.
824 (define_insn "vec_shl_<mode>"
825 [(set (match_operand:VWHBDI 0 "register_operand" "=f")
826 (unspec:VWHBDI [(match_operand:VWHBDI 1 "register_operand" "f")
827 (match_operand:SI 2 "register_operand" "f")]
828 UNSPEC_LOONGSON_DSLL))]
829 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
831 [(set_attr "type" "fcvt")])
833 (define_insn "vec_shr_<mode>"
834 [(set (match_operand:VWHBDI 0 "register_operand" "=f")
835 (unspec:VWHBDI [(match_operand:VWHBDI 1 "register_operand" "f")
836 (match_operand:SI 2 "register_operand" "f")]
837 UNSPEC_LOONGSON_DSRL))]
838 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
840 [(set_attr "type" "fcvt")])
842 (define_insn "vec_loongson_extract_lo_<mode>"
843 [(set (match_operand:<V_inner> 0 "register_operand" "=r")
844 (vec_select:<V_inner>
845 (match_operand:VWHB 1 "register_operand" "f")
846 (parallel [(const_int 0)])))]
847 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
849 [(set_attr "type" "mfc")])
851 (define_expand "reduc_plus_scal_<mode>"
852 [(match_operand:<V_inner> 0 "register_operand" "")
853 (match_operand:VWHB 1 "register_operand" "")]
854 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
856 rtx tmp = gen_reg_rtx (GET_MODE (operands[1]));
857 mips_expand_vec_reduc (tmp, operands[1], gen_add<mode>3);
858 emit_insn (gen_vec_loongson_extract_lo_<mode> (operands[0], tmp));
862 (define_expand "reduc_smax_scal_<mode>"
863 [(match_operand:<V_inner> 0 "register_operand" "")
864 (match_operand:VWHB 1 "register_operand" "")]
865 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
867 rtx tmp = gen_reg_rtx (GET_MODE (operands[1]));
868 mips_expand_vec_reduc (tmp, operands[1], gen_smax<mode>3);
869 emit_insn (gen_vec_loongson_extract_lo_<mode> (operands[0], tmp));
873 (define_expand "reduc_smin_scal_<mode>"
874 [(match_operand:<V_inner> 0 "register_operand" "")
875 (match_operand:VWHB 1 "register_operand" "")]
876 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
878 rtx tmp = gen_reg_rtx (GET_MODE (operands[1]));
879 mips_expand_vec_reduc (tmp, operands[1], gen_smin<mode>3);
880 emit_insn (gen_vec_loongson_extract_lo_<mode> (operands[0], tmp));
884 (define_expand "reduc_umax_scal_<mode>"
885 [(match_operand:<V_inner> 0 "register_operand" "")
886 (match_operand:VB 1 "register_operand" "")]
887 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
889 rtx tmp = gen_reg_rtx (GET_MODE (operands[1]));
890 mips_expand_vec_reduc (tmp, operands[1], gen_umax<mode>3);
891 emit_insn (gen_vec_loongson_extract_lo_<mode> (operands[0], tmp));
895 (define_expand "reduc_umin_scal_<mode>"
896 [(match_operand:<V_inner> 0 "register_operand" "")
897 (match_operand:VB 1 "register_operand" "")]
898 "TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS"
900 rtx tmp = gen_reg_rtx (GET_MODE (operands[1]));
901 mips_expand_vec_reduc (tmp, operands[1], gen_umin<mode>3);
902 emit_insn (gen_vec_loongson_extract_lo_<mode> (operands[0], tmp));