1 /* IR-agnostic target query functions relating to optabs
2 Copyright (C) 1987-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
23 #include "coretypes.h"
25 #include "insn-codes.h"
26 #include "optabs-query.h"
27 #include "optabs-libfuncs.h"
28 #include "insn-config.h"
31 #include "vec-perm-indices.h"
33 struct target_optabs default_target_optabs
;
34 struct target_optabs
*this_fn_optabs
= &default_target_optabs
;
36 struct target_optabs
*this_target_optabs
= &default_target_optabs
;
39 /* Return the insn used to perform conversion OP from mode FROM_MODE
40 to mode TO_MODE; return CODE_FOR_nothing if the target does not have
41 such an insn, or if it is unsuitable for optimization type OPT_TYPE. */
44 convert_optab_handler (convert_optab optab
, machine_mode to_mode
,
45 machine_mode from_mode
, optimization_type opt_type
)
47 insn_code icode
= convert_optab_handler (optab
, to_mode
, from_mode
);
48 if (icode
== CODE_FOR_nothing
49 || !targetm
.optab_supported_p (optab
, to_mode
, from_mode
, opt_type
))
50 return CODE_FOR_nothing
;
54 /* Return the insn used to implement mode MODE of OP; return
55 CODE_FOR_nothing if the target does not have such an insn,
56 or if it is unsuitable for optimization type OPT_TYPE. */
59 direct_optab_handler (convert_optab optab
, machine_mode mode
,
60 optimization_type opt_type
)
62 insn_code icode
= direct_optab_handler (optab
, mode
);
63 if (icode
== CODE_FOR_nothing
64 || !targetm
.optab_supported_p (optab
, mode
, mode
, opt_type
))
65 return CODE_FOR_nothing
;
69 /* Enumerates the possible types of structure operand to an
71 enum extraction_type
{ ET_unaligned_mem
, ET_reg
};
73 /* Check whether insv, extv or extzv pattern ICODE can be used for an
74 insertion or extraction of type TYPE on a structure of mode MODE.
75 Return true if so and fill in *INSN accordingly. STRUCT_OP is the
76 operand number of the structure (the first sign_extract or zero_extract
77 operand) and FIELD_OP is the operand number of the field (the other
78 side of the set from the sign_extract or zero_extract). */
81 get_traditional_extraction_insn (extraction_insn
*insn
,
82 enum extraction_type type
,
85 int struct_op
, int field_op
)
87 const struct insn_data_d
*data
= &insn_data
[icode
];
89 machine_mode struct_mode
= data
->operand
[struct_op
].mode
;
90 if (struct_mode
== VOIDmode
)
91 struct_mode
= word_mode
;
92 if (mode
!= struct_mode
)
95 machine_mode field_mode
= data
->operand
[field_op
].mode
;
96 if (field_mode
== VOIDmode
)
97 field_mode
= word_mode
;
99 machine_mode pos_mode
= data
->operand
[struct_op
+ 2].mode
;
100 if (pos_mode
== VOIDmode
)
101 pos_mode
= word_mode
;
104 insn
->field_mode
= as_a
<scalar_int_mode
> (field_mode
);
105 if (type
== ET_unaligned_mem
)
106 insn
->struct_mode
= byte_mode
;
107 else if (struct_mode
== BLKmode
)
108 insn
->struct_mode
= opt_scalar_int_mode ();
110 insn
->struct_mode
= as_a
<scalar_int_mode
> (struct_mode
);
111 insn
->pos_mode
= as_a
<scalar_int_mode
> (pos_mode
);
115 /* Return true if an optab exists to perform an insertion or extraction
116 of type TYPE in mode MODE. Describe the instruction in *INSN if so.
118 REG_OPTAB is the optab to use for register structures and
119 MISALIGN_OPTAB is the optab to use for misaligned memory structures.
120 POS_OP is the operand number of the bit position. */
123 get_optab_extraction_insn (struct extraction_insn
*insn
,
124 enum extraction_type type
,
125 machine_mode mode
, direct_optab reg_optab
,
126 direct_optab misalign_optab
, int pos_op
)
128 direct_optab optab
= (type
== ET_unaligned_mem
? misalign_optab
: reg_optab
);
129 enum insn_code icode
= direct_optab_handler (optab
, mode
);
130 if (icode
== CODE_FOR_nothing
)
133 const struct insn_data_d
*data
= &insn_data
[icode
];
135 machine_mode pos_mode
= data
->operand
[pos_op
].mode
;
136 if (pos_mode
== VOIDmode
)
137 pos_mode
= word_mode
;
140 insn
->field_mode
= as_a
<scalar_int_mode
> (mode
);
141 if (type
== ET_unaligned_mem
)
142 insn
->struct_mode
= opt_scalar_int_mode ();
144 insn
->struct_mode
= insn
->field_mode
;
145 insn
->pos_mode
= as_a
<scalar_int_mode
> (pos_mode
);
149 /* Return true if an instruction exists to perform an insertion or
150 extraction (PATTERN says which) of type TYPE in mode MODE.
151 Describe the instruction in *INSN if so. */
154 get_extraction_insn (extraction_insn
*insn
,
155 enum extraction_pattern pattern
,
156 enum extraction_type type
,
162 if (targetm
.have_insv ()
163 && get_traditional_extraction_insn (insn
, type
, mode
,
164 targetm
.code_for_insv
, 0, 3))
166 return get_optab_extraction_insn (insn
, type
, mode
, insv_optab
,
167 insvmisalign_optab
, 2);
170 if (targetm
.have_extv ()
171 && get_traditional_extraction_insn (insn
, type
, mode
,
172 targetm
.code_for_extv
, 1, 0))
174 return get_optab_extraction_insn (insn
, type
, mode
, extv_optab
,
175 extvmisalign_optab
, 3);
178 if (targetm
.have_extzv ()
179 && get_traditional_extraction_insn (insn
, type
, mode
,
180 targetm
.code_for_extzv
, 1, 0))
182 return get_optab_extraction_insn (insn
, type
, mode
, extzv_optab
,
183 extzvmisalign_optab
, 3);
190 /* Return true if an instruction exists to access a field of mode
191 FIELDMODE in a structure that has STRUCT_BITS significant bits.
192 Describe the "best" such instruction in *INSN if so. PATTERN and
193 TYPE describe the type of insertion or extraction we want to perform.
195 For an insertion, the number of significant structure bits includes
196 all bits of the target. For an extraction, it need only include the
197 most significant bit of the field. Larger widths are acceptable
201 get_best_extraction_insn (extraction_insn
*insn
,
202 enum extraction_pattern pattern
,
203 enum extraction_type type
,
204 unsigned HOST_WIDE_INT struct_bits
,
205 machine_mode field_mode
)
207 opt_scalar_int_mode mode_iter
;
208 FOR_EACH_MODE_FROM (mode_iter
, smallest_int_mode_for_size (struct_bits
))
210 scalar_int_mode mode
= mode_iter
.require ();
211 if (get_extraction_insn (insn
, pattern
, type
, mode
))
213 FOR_EACH_MODE_FROM (mode_iter
, mode
)
215 mode
= mode_iter
.require ();
216 if (GET_MODE_SIZE (mode
) > GET_MODE_SIZE (field_mode
)
217 || TRULY_NOOP_TRUNCATION_MODES_P (insn
->field_mode
,
220 get_extraction_insn (insn
, pattern
, type
, mode
);
228 /* Return true if an instruction exists to access a field of mode
229 FIELDMODE in a register structure that has STRUCT_BITS significant bits.
230 Describe the "best" such instruction in *INSN if so. PATTERN describes
231 the type of insertion or extraction we want to perform.
233 For an insertion, the number of significant structure bits includes
234 all bits of the target. For an extraction, it need only include the
235 most significant bit of the field. Larger widths are acceptable
239 get_best_reg_extraction_insn (extraction_insn
*insn
,
240 enum extraction_pattern pattern
,
241 unsigned HOST_WIDE_INT struct_bits
,
242 machine_mode field_mode
)
244 return get_best_extraction_insn (insn
, pattern
, ET_reg
, struct_bits
,
248 /* Return true if an instruction exists to access a field of BITSIZE
249 bits starting BITNUM bits into a memory structure. Describe the
250 "best" such instruction in *INSN if so. PATTERN describes the type
251 of insertion or extraction we want to perform and FIELDMODE is the
252 natural mode of the extracted field.
254 The instructions considered here only access bytes that overlap
255 the bitfield; they do not touch any surrounding bytes. */
258 get_best_mem_extraction_insn (extraction_insn
*insn
,
259 enum extraction_pattern pattern
,
260 HOST_WIDE_INT bitsize
, HOST_WIDE_INT bitnum
,
261 machine_mode field_mode
)
263 unsigned HOST_WIDE_INT struct_bits
= (bitnum
% BITS_PER_UNIT
265 + BITS_PER_UNIT
- 1);
266 struct_bits
-= struct_bits
% BITS_PER_UNIT
;
267 return get_best_extraction_insn (insn
, pattern
, ET_unaligned_mem
,
268 struct_bits
, field_mode
);
271 /* Return the insn code used to extend FROM_MODE to TO_MODE.
272 UNSIGNEDP specifies zero-extension instead of sign-extension. If
273 no such operation exists, CODE_FOR_nothing will be returned. */
276 can_extend_p (machine_mode to_mode
, machine_mode from_mode
,
279 if (unsignedp
< 0 && targetm
.have_ptr_extend ())
280 return targetm
.code_for_ptr_extend
;
282 convert_optab tab
= unsignedp
? zext_optab
: sext_optab
;
283 return convert_optab_handler (tab
, to_mode
, from_mode
);
286 /* Return the insn code to convert fixed-point mode FIXMODE to floating-point
287 mode FLTMODE, or CODE_FOR_nothing if no such instruction exists.
288 UNSIGNEDP specifies whether FIXMODE is unsigned. */
291 can_float_p (machine_mode fltmode
, machine_mode fixmode
,
294 convert_optab tab
= unsignedp
? ufloat_optab
: sfloat_optab
;
295 return convert_optab_handler (tab
, fltmode
, fixmode
);
298 /* Return the insn code to convert floating-point mode FLTMODE to fixed-point
299 mode FIXMODE, or CODE_FOR_nothing if no such instruction exists.
300 UNSIGNEDP specifies whether FIXMODE is unsigned.
302 On a successful return, set *TRUNCP_PTR to true if it is necessary to
303 output an explicit FTRUNC before the instruction. */
306 can_fix_p (machine_mode fixmode
, machine_mode fltmode
,
307 int unsignedp
, bool *truncp_ptr
)
310 enum insn_code icode
;
312 tab
= unsignedp
? ufixtrunc_optab
: sfixtrunc_optab
;
313 icode
= convert_optab_handler (tab
, fixmode
, fltmode
);
314 if (icode
!= CODE_FOR_nothing
)
320 /* FIXME: This requires a port to define both FIX and FTRUNC pattern
321 for this to work. We need to rework the fix* and ftrunc* patterns
322 and documentation. */
323 tab
= unsignedp
? ufix_optab
: sfix_optab
;
324 icode
= convert_optab_handler (tab
, fixmode
, fltmode
);
325 if (icode
!= CODE_FOR_nothing
326 && optab_handler (ftrunc_optab
, fltmode
) != CODE_FOR_nothing
)
332 return CODE_FOR_nothing
;
335 /* Return nonzero if a conditional move of mode MODE is supported.
337 This function is for combine so it can tell whether an insn that looks
338 like a conditional move is actually supported by the hardware. If we
339 guess wrong we lose a bit on optimization, but that's it. */
340 /* ??? sparc64 supports conditionally moving integers values based on fp
341 comparisons, and vice versa. How do we handle them? */
344 can_conditionally_move_p (machine_mode mode
)
346 return direct_optab_handler (movcc_optab
, mode
) != CODE_FOR_nothing
;
349 /* If a target doesn't implement a permute on a vector with multibyte
350 elements, we can try to do the same permute on byte elements.
351 If this makes sense for vector mode MODE then return the appropriate
355 qimode_for_vec_perm (machine_mode mode
)
358 if (GET_MODE_INNER (mode
) != QImode
359 && mode_for_vector (QImode
, GET_MODE_SIZE (mode
)).exists (&qimode
)
360 && VECTOR_MODE_P (qimode
))
362 return opt_machine_mode ();
365 /* Return true if selector SEL can be represented in the integer
366 equivalent of vector mode MODE. */
369 selector_fits_mode_p (machine_mode mode
, const vec_perm_indices
&sel
)
371 unsigned HOST_WIDE_INT mask
= GET_MODE_MASK (GET_MODE_INNER (mode
));
372 return (mask
== HOST_WIDE_INT_M1U
373 || sel
.all_in_range_p (0, mask
+ 1));
376 /* Return true if VEC_PERM_EXPRs with variable selector operands can be
377 expanded using SIMD extensions of the CPU. MODE is the mode of the
378 vectors being permuted. */
381 can_vec_perm_var_p (machine_mode mode
)
383 /* If the target doesn't implement a vector mode for the vector type,
384 then no operations are supported. */
385 if (!VECTOR_MODE_P (mode
))
388 if (direct_optab_handler (vec_perm_optab
, mode
) != CODE_FOR_nothing
)
391 /* We allow fallback to a QI vector mode, and adjust the mask. */
393 if (!qimode_for_vec_perm (mode
).exists (&qimode
)
394 || GET_MODE_NUNITS (qimode
) > GET_MODE_MASK (QImode
) + 1)
397 if (direct_optab_handler (vec_perm_optab
, qimode
) == CODE_FOR_nothing
)
400 /* In order to support the lowering of variable permutations,
401 we need to support shifts and adds. */
402 if (GET_MODE_UNIT_SIZE (mode
) > 2
403 && optab_handler (ashl_optab
, mode
) == CODE_FOR_nothing
404 && optab_handler (vashl_optab
, mode
) == CODE_FOR_nothing
)
406 if (optab_handler (add_optab
, qimode
) == CODE_FOR_nothing
)
412 /* Return true if the target directly supports VEC_PERM_EXPRs on vectors
413 of mode MODE using the selector SEL. ALLOW_VARIABLE_P is true if it
414 is acceptable to force the selector into a register and use a variable
415 permute (if the target supports that).
417 Note that additional permutations representing whole-vector shifts may
418 also be handled via the vec_shr optab, but only where the second input
419 vector is entirely constant zeroes; this case is not dealt with here. */
422 can_vec_perm_const_p (machine_mode mode
, const vec_perm_indices
&sel
,
423 bool allow_variable_p
)
425 /* If the target doesn't implement a vector mode for the vector type,
426 then no operations are supported. */
427 if (!VECTOR_MODE_P (mode
))
430 /* It's probably cheaper to test for the variable case first. */
431 if (allow_variable_p
&& selector_fits_mode_p (mode
, sel
))
433 if (direct_optab_handler (vec_perm_optab
, mode
) != CODE_FOR_nothing
)
436 /* Unlike can_vec_perm_var_p, we don't need to test for optabs
437 related computing the QImode selector, since that happens at
440 if (qimode_for_vec_perm (mode
).exists (&qimode
))
442 vec_perm_indices qimode_indices
;
443 qimode_indices
.new_expanded_vector (sel
, GET_MODE_UNIT_SIZE (mode
));
444 if (selector_fits_mode_p (qimode
, qimode_indices
)
445 && (direct_optab_handler (vec_perm_optab
, qimode
)
446 != CODE_FOR_nothing
))
451 if (targetm
.vectorize
.vec_perm_const
!= NULL
)
453 if (targetm
.vectorize
.vec_perm_const (mode
, NULL_RTX
, NULL_RTX
,
457 /* ??? For completeness, we ought to check the QImode version of
458 vec_perm_const_optab. But all users of this implicit lowering
459 feature implement the variable vec_perm_optab, and the ia64
460 port specifically doesn't want us to lower V2SF operations
461 into integer operations. */
467 /* Find a widening optab even if it doesn't widen as much as we want.
468 E.g. if from_mode is HImode, and to_mode is DImode, and there is no
469 direct HI->SI insn, then return SI->DI, if that exists. */
472 find_widening_optab_handler_and_mode (optab op
, machine_mode to_mode
,
473 machine_mode from_mode
,
474 machine_mode
*found_mode
)
476 gcc_checking_assert (GET_MODE_CLASS (from_mode
) == GET_MODE_CLASS (to_mode
));
477 gcc_checking_assert (from_mode
< to_mode
);
478 FOR_EACH_MODE (from_mode
, from_mode
, to_mode
)
480 enum insn_code handler
= convert_optab_handler (op
, to_mode
, from_mode
);
482 if (handler
!= CODE_FOR_nothing
)
485 *found_mode
= from_mode
;
490 return CODE_FOR_nothing
;
493 /* Return non-zero if a highpart multiply is supported of can be synthisized.
494 For the benefit of expand_mult_highpart, the return value is 1 for direct,
495 2 for even/odd widening, and 3 for hi/lo widening. */
498 can_mult_highpart_p (machine_mode mode
, bool uns_p
)
503 op
= uns_p
? umul_highpart_optab
: smul_highpart_optab
;
504 if (optab_handler (op
, mode
) != CODE_FOR_nothing
)
507 /* If the mode is an integral vector, synth from widening operations. */
508 if (GET_MODE_CLASS (mode
) != MODE_VECTOR_INT
)
511 nunits
= GET_MODE_NUNITS (mode
);
513 op
= uns_p
? vec_widen_umult_even_optab
: vec_widen_smult_even_optab
;
514 if (optab_handler (op
, mode
) != CODE_FOR_nothing
)
516 op
= uns_p
? vec_widen_umult_odd_optab
: vec_widen_smult_odd_optab
;
517 if (optab_handler (op
, mode
) != CODE_FOR_nothing
)
519 /* The encoding has 2 interleaved stepped patterns. */
520 vec_perm_builder
sel (nunits
, 2, 3);
521 for (i
= 0; i
< 6; ++i
)
522 sel
.quick_push (!BYTES_BIG_ENDIAN
524 + ((i
& 1) ? nunits
: 0));
525 vec_perm_indices
indices (sel
, 2, nunits
);
526 if (can_vec_perm_const_p (mode
, indices
))
531 op
= uns_p
? vec_widen_umult_hi_optab
: vec_widen_smult_hi_optab
;
532 if (optab_handler (op
, mode
) != CODE_FOR_nothing
)
534 op
= uns_p
? vec_widen_umult_lo_optab
: vec_widen_smult_lo_optab
;
535 if (optab_handler (op
, mode
) != CODE_FOR_nothing
)
537 /* The encoding has a single stepped pattern. */
538 vec_perm_builder
sel (nunits
, 1, 3);
539 for (int i
= 0; i
< 3; ++i
)
540 sel
.quick_push (2 * i
+ (BYTES_BIG_ENDIAN
? 0 : 1));
541 vec_perm_indices
indices (sel
, 2, nunits
);
542 if (can_vec_perm_const_p (mode
, indices
))
550 /* Return true if target supports vector masked load/store for mode. */
553 can_vec_mask_load_store_p (machine_mode mode
,
554 machine_mode mask_mode
,
557 optab op
= is_load
? maskload_optab
: maskstore_optab
;
560 /* If mode is vector mode, check it directly. */
561 if (VECTOR_MODE_P (mode
))
562 return convert_optab_handler (op
, mode
, mask_mode
) != CODE_FOR_nothing
;
564 /* Otherwise, return true if there is some vector mode with
565 the mask load/store supported. */
567 /* See if there is any chance the mask load or store might be
568 vectorized. If not, punt. */
570 if (!is_a
<scalar_mode
> (mode
, &smode
))
573 vmode
= targetm
.vectorize
.preferred_simd_mode (smode
);
574 if (!VECTOR_MODE_P (vmode
))
577 if ((targetm
.vectorize
.get_mask_mode
578 (GET_MODE_NUNITS (vmode
), GET_MODE_SIZE (vmode
)).exists (&mask_mode
))
579 && convert_optab_handler (op
, vmode
, mask_mode
) != CODE_FOR_nothing
)
582 auto_vector_sizes vector_sizes
;
583 targetm
.vectorize
.autovectorize_vector_sizes (&vector_sizes
);
584 for (unsigned int i
= 0; i
< vector_sizes
.length (); ++i
)
586 poly_uint64 cur
= vector_sizes
[i
];
588 if (!multiple_p (cur
, GET_MODE_SIZE (smode
), &nunits
))
590 if (mode_for_vector (smode
, nunits
).exists (&vmode
)
591 && VECTOR_MODE_P (vmode
)
592 && targetm
.vectorize
.get_mask_mode (nunits
, cur
).exists (&mask_mode
)
593 && convert_optab_handler (op
, vmode
, mask_mode
) != CODE_FOR_nothing
)
599 /* Return true if there is a compare_and_swap pattern. */
602 can_compare_and_swap_p (machine_mode mode
, bool allow_libcall
)
604 enum insn_code icode
;
606 /* Check for __atomic_compare_and_swap. */
607 icode
= direct_optab_handler (atomic_compare_and_swap_optab
, mode
);
608 if (icode
!= CODE_FOR_nothing
)
611 /* Check for __sync_compare_and_swap. */
612 icode
= optab_handler (sync_compare_and_swap_optab
, mode
);
613 if (icode
!= CODE_FOR_nothing
)
615 if (allow_libcall
&& optab_libfunc (sync_compare_and_swap_optab
, mode
))
618 /* No inline compare and swap. */
622 /* Return true if an atomic exchange can be performed. */
625 can_atomic_exchange_p (machine_mode mode
, bool allow_libcall
)
627 enum insn_code icode
;
629 /* Check for __atomic_exchange. */
630 icode
= direct_optab_handler (atomic_exchange_optab
, mode
);
631 if (icode
!= CODE_FOR_nothing
)
634 /* Don't check __sync_test_and_set, as on some platforms that
635 has reduced functionality. Targets that really do support
636 a proper exchange should simply be updated to the __atomics. */
638 return can_compare_and_swap_p (mode
, allow_libcall
);
641 /* Return true if an atomic load can be performed without falling back to
642 a compare-and-swap. */
645 can_atomic_load_p (machine_mode mode
)
647 enum insn_code icode
;
649 /* Does the target supports the load directly? */
650 icode
= direct_optab_handler (atomic_load_optab
, mode
);
651 if (icode
!= CODE_FOR_nothing
)
654 /* If the size of the object is greater than word size on this target,
655 then we assume that a load will not be atomic. Also see
656 expand_atomic_load. */
657 return GET_MODE_PRECISION (mode
) <= BITS_PER_WORD
;
660 /* Determine whether "1 << x" is relatively cheap in word_mode. */
663 lshift_cheap_p (bool speed_p
)
665 /* FIXME: This should be made target dependent via this "this_target"
666 mechanism, similar to e.g. can_copy_init_p in gcse.c. */
667 static bool init
[2] = { false, false };
668 static bool cheap
[2] = { true, true };
670 /* If the targer has no lshift in word_mode, the operation will most
671 probably not be cheap. ??? Does GCC even work for such targets? */
672 if (optab_handler (ashl_optab
, word_mode
) == CODE_FOR_nothing
)
677 rtx reg
= gen_raw_REG (word_mode
, 10000);
678 int cost
= set_src_cost (gen_rtx_ASHIFT (word_mode
, const1_rtx
, reg
),
680 cheap
[speed_p
] = cost
< COSTS_N_INSNS (3);
681 init
[speed_p
] = true;
684 return cheap
[speed_p
];