gcc/
[official-gcc.git] / gcc / tree-ssa-ccp.c
blobae120a8ff955d704e973bfec804be1d1caf1eee7
1 /* Conditional constant propagation pass for the GNU compiler.
2 Copyright (C) 2000-2016 Free Software Foundation, Inc.
3 Adapted from original RTL SSA-CCP by Daniel Berlin <dberlin@dberlin.org>
4 Adapted to GIMPLE trees by Diego Novillo <dnovillo@redhat.com>
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it
9 under the terms of the GNU General Public License as published by the
10 Free Software Foundation; either version 3, or (at your option) any
11 later version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT
14 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 /* Conditional constant propagation (CCP) is based on the SSA
23 propagation engine (tree-ssa-propagate.c). Constant assignments of
24 the form VAR = CST are propagated from the assignments into uses of
25 VAR, which in turn may generate new constants. The simulation uses
26 a four level lattice to keep track of constant values associated
27 with SSA names. Given an SSA name V_i, it may take one of the
28 following values:
30 UNINITIALIZED -> the initial state of the value. This value
31 is replaced with a correct initial value
32 the first time the value is used, so the
33 rest of the pass does not need to care about
34 it. Using this value simplifies initialization
35 of the pass, and prevents us from needlessly
36 scanning statements that are never reached.
38 UNDEFINED -> V_i is a local variable whose definition
39 has not been processed yet. Therefore we
40 don't yet know if its value is a constant
41 or not.
43 CONSTANT -> V_i has been found to hold a constant
44 value C.
46 VARYING -> V_i cannot take a constant value, or if it
47 does, it is not possible to determine it
48 at compile time.
50 The core of SSA-CCP is in ccp_visit_stmt and ccp_visit_phi_node:
52 1- In ccp_visit_stmt, we are interested in assignments whose RHS
53 evaluates into a constant and conditional jumps whose predicate
54 evaluates into a boolean true or false. When an assignment of
55 the form V_i = CONST is found, V_i's lattice value is set to
56 CONSTANT and CONST is associated with it. This causes the
57 propagation engine to add all the SSA edges coming out the
58 assignment into the worklists, so that statements that use V_i
59 can be visited.
61 If the statement is a conditional with a constant predicate, we
62 mark the outgoing edges as executable or not executable
63 depending on the predicate's value. This is then used when
64 visiting PHI nodes to know when a PHI argument can be ignored.
67 2- In ccp_visit_phi_node, if all the PHI arguments evaluate to the
68 same constant C, then the LHS of the PHI is set to C. This
69 evaluation is known as the "meet operation". Since one of the
70 goals of this evaluation is to optimistically return constant
71 values as often as possible, it uses two main short cuts:
73 - If an argument is flowing in through a non-executable edge, it
74 is ignored. This is useful in cases like this:
76 if (PRED)
77 a_9 = 3;
78 else
79 a_10 = 100;
80 a_11 = PHI (a_9, a_10)
82 If PRED is known to always evaluate to false, then we can
83 assume that a_11 will always take its value from a_10, meaning
84 that instead of consider it VARYING (a_9 and a_10 have
85 different values), we can consider it CONSTANT 100.
87 - If an argument has an UNDEFINED value, then it does not affect
88 the outcome of the meet operation. If a variable V_i has an
89 UNDEFINED value, it means that either its defining statement
90 hasn't been visited yet or V_i has no defining statement, in
91 which case the original symbol 'V' is being used
92 uninitialized. Since 'V' is a local variable, the compiler
93 may assume any initial value for it.
96 After propagation, every variable V_i that ends up with a lattice
97 value of CONSTANT will have the associated constant value in the
98 array CONST_VAL[i].VALUE. That is fed into substitute_and_fold for
99 final substitution and folding.
101 This algorithm uses wide-ints at the max precision of the target.
102 This means that, with one uninteresting exception, variables with
103 UNSIGNED types never go to VARYING because the bits above the
104 precision of the type of the variable are always zero. The
105 uninteresting case is a variable of UNSIGNED type that has the
106 maximum precision of the target. Such variables can go to VARYING,
107 but this causes no loss of infomation since these variables will
108 never be extended.
110 References:
112 Constant propagation with conditional branches,
113 Wegman and Zadeck, ACM TOPLAS 13(2):181-210.
115 Building an Optimizing Compiler,
116 Robert Morgan, Butterworth-Heinemann, 1998, Section 8.9.
118 Advanced Compiler Design and Implementation,
119 Steven Muchnick, Morgan Kaufmann, 1997, Section 12.6 */
121 #include "config.h"
122 #include "system.h"
123 #include "coretypes.h"
124 #include "backend.h"
125 #include "target.h"
126 #include "tree.h"
127 #include "gimple.h"
128 #include "tree-pass.h"
129 #include "ssa.h"
130 #include "gimple-pretty-print.h"
131 #include "fold-const.h"
132 #include "gimple-fold.h"
133 #include "tree-eh.h"
134 #include "gimplify.h"
135 #include "gimple-iterator.h"
136 #include "tree-cfg.h"
137 #include "tree-ssa-propagate.h"
138 #include "dbgcnt.h"
139 #include "params.h"
140 #include "builtins.h"
141 #include "tree-chkp.h"
142 #include "cfgloop.h"
143 #include "stor-layout.h"
144 #include "optabs-query.h"
147 /* Possible lattice values. */
148 typedef enum
150 UNINITIALIZED,
151 UNDEFINED,
152 CONSTANT,
153 VARYING
154 } ccp_lattice_t;
156 struct ccp_prop_value_t {
157 /* Lattice value. */
158 ccp_lattice_t lattice_val;
160 /* Propagated value. */
161 tree value;
163 /* Mask that applies to the propagated value during CCP. For X
164 with a CONSTANT lattice value X & ~mask == value & ~mask. The
165 zero bits in the mask cover constant values. The ones mean no
166 information. */
167 widest_int mask;
170 /* Array of propagated constant values. After propagation,
171 CONST_VAL[I].VALUE holds the constant value for SSA_NAME(I). If
172 the constant is held in an SSA name representing a memory store
173 (i.e., a VDEF), CONST_VAL[I].MEM_REF will contain the actual
174 memory reference used to store (i.e., the LHS of the assignment
175 doing the store). */
176 static ccp_prop_value_t *const_val;
177 static unsigned n_const_val;
179 static void canonicalize_value (ccp_prop_value_t *);
180 static bool ccp_fold_stmt (gimple_stmt_iterator *);
181 static void ccp_lattice_meet (ccp_prop_value_t *, ccp_prop_value_t *);
183 /* Dump constant propagation value VAL to file OUTF prefixed by PREFIX. */
185 static void
186 dump_lattice_value (FILE *outf, const char *prefix, ccp_prop_value_t val)
188 switch (val.lattice_val)
190 case UNINITIALIZED:
191 fprintf (outf, "%sUNINITIALIZED", prefix);
192 break;
193 case UNDEFINED:
194 fprintf (outf, "%sUNDEFINED", prefix);
195 break;
196 case VARYING:
197 fprintf (outf, "%sVARYING", prefix);
198 break;
199 case CONSTANT:
200 if (TREE_CODE (val.value) != INTEGER_CST
201 || val.mask == 0)
203 fprintf (outf, "%sCONSTANT ", prefix);
204 print_generic_expr (outf, val.value, dump_flags);
206 else
208 widest_int cval = wi::bit_and_not (wi::to_widest (val.value),
209 val.mask);
210 fprintf (outf, "%sCONSTANT ", prefix);
211 print_hex (cval, outf);
212 fprintf (outf, " (");
213 print_hex (val.mask, outf);
214 fprintf (outf, ")");
216 break;
217 default:
218 gcc_unreachable ();
223 /* Print lattice value VAL to stderr. */
225 void debug_lattice_value (ccp_prop_value_t val);
227 DEBUG_FUNCTION void
228 debug_lattice_value (ccp_prop_value_t val)
230 dump_lattice_value (stderr, "", val);
231 fprintf (stderr, "\n");
234 /* Extend NONZERO_BITS to a full mask, with the upper bits being set. */
236 static widest_int
237 extend_mask (const wide_int &nonzero_bits)
239 return (wi::mask <widest_int> (wi::get_precision (nonzero_bits), true)
240 | widest_int::from (nonzero_bits, UNSIGNED));
243 /* Compute a default value for variable VAR and store it in the
244 CONST_VAL array. The following rules are used to get default
245 values:
247 1- Global and static variables that are declared constant are
248 considered CONSTANT.
250 2- Any other value is considered UNDEFINED. This is useful when
251 considering PHI nodes. PHI arguments that are undefined do not
252 change the constant value of the PHI node, which allows for more
253 constants to be propagated.
255 3- Variables defined by statements other than assignments and PHI
256 nodes are considered VARYING.
258 4- Initial values of variables that are not GIMPLE registers are
259 considered VARYING. */
261 static ccp_prop_value_t
262 get_default_value (tree var)
264 ccp_prop_value_t val = { UNINITIALIZED, NULL_TREE, 0 };
265 gimple *stmt;
267 stmt = SSA_NAME_DEF_STMT (var);
269 if (gimple_nop_p (stmt))
271 /* Variables defined by an empty statement are those used
272 before being initialized. If VAR is a local variable, we
273 can assume initially that it is UNDEFINED, otherwise we must
274 consider it VARYING. */
275 if (!virtual_operand_p (var)
276 && SSA_NAME_VAR (var)
277 && TREE_CODE (SSA_NAME_VAR (var)) == VAR_DECL)
278 val.lattice_val = UNDEFINED;
279 else
281 val.lattice_val = VARYING;
282 val.mask = -1;
283 if (flag_tree_bit_ccp)
285 wide_int nonzero_bits = get_nonzero_bits (var);
286 if (nonzero_bits != -1)
288 val.lattice_val = CONSTANT;
289 val.value = build_zero_cst (TREE_TYPE (var));
290 val.mask = extend_mask (nonzero_bits);
295 else if (is_gimple_assign (stmt))
297 tree cst;
298 if (gimple_assign_single_p (stmt)
299 && DECL_P (gimple_assign_rhs1 (stmt))
300 && (cst = get_symbol_constant_value (gimple_assign_rhs1 (stmt))))
302 val.lattice_val = CONSTANT;
303 val.value = cst;
305 else
307 /* Any other variable defined by an assignment is considered
308 UNDEFINED. */
309 val.lattice_val = UNDEFINED;
312 else if ((is_gimple_call (stmt)
313 && gimple_call_lhs (stmt) != NULL_TREE)
314 || gimple_code (stmt) == GIMPLE_PHI)
316 /* A variable defined by a call or a PHI node is considered
317 UNDEFINED. */
318 val.lattice_val = UNDEFINED;
320 else
322 /* Otherwise, VAR will never take on a constant value. */
323 val.lattice_val = VARYING;
324 val.mask = -1;
327 return val;
331 /* Get the constant value associated with variable VAR. */
333 static inline ccp_prop_value_t *
334 get_value (tree var)
336 ccp_prop_value_t *val;
338 if (const_val == NULL
339 || SSA_NAME_VERSION (var) >= n_const_val)
340 return NULL;
342 val = &const_val[SSA_NAME_VERSION (var)];
343 if (val->lattice_val == UNINITIALIZED)
344 *val = get_default_value (var);
346 canonicalize_value (val);
348 return val;
351 /* Return the constant tree value associated with VAR. */
353 static inline tree
354 get_constant_value (tree var)
356 ccp_prop_value_t *val;
357 if (TREE_CODE (var) != SSA_NAME)
359 if (is_gimple_min_invariant (var))
360 return var;
361 return NULL_TREE;
363 val = get_value (var);
364 if (val
365 && val->lattice_val == CONSTANT
366 && (TREE_CODE (val->value) != INTEGER_CST
367 || val->mask == 0))
368 return val->value;
369 return NULL_TREE;
372 /* Sets the value associated with VAR to VARYING. */
374 static inline void
375 set_value_varying (tree var)
377 ccp_prop_value_t *val = &const_val[SSA_NAME_VERSION (var)];
379 val->lattice_val = VARYING;
380 val->value = NULL_TREE;
381 val->mask = -1;
384 /* For integer constants, make sure to drop TREE_OVERFLOW. */
386 static void
387 canonicalize_value (ccp_prop_value_t *val)
389 if (val->lattice_val != CONSTANT)
390 return;
392 if (TREE_OVERFLOW_P (val->value))
393 val->value = drop_tree_overflow (val->value);
396 /* Return whether the lattice transition is valid. */
398 static bool
399 valid_lattice_transition (ccp_prop_value_t old_val, ccp_prop_value_t new_val)
401 /* Lattice transitions must always be monotonically increasing in
402 value. */
403 if (old_val.lattice_val < new_val.lattice_val)
404 return true;
406 if (old_val.lattice_val != new_val.lattice_val)
407 return false;
409 if (!old_val.value && !new_val.value)
410 return true;
412 /* Now both lattice values are CONSTANT. */
414 /* Allow arbitrary copy changes as we might look through PHI <a_1, ...>
415 when only a single copy edge is executable. */
416 if (TREE_CODE (old_val.value) == SSA_NAME
417 && TREE_CODE (new_val.value) == SSA_NAME)
418 return true;
420 /* Allow transitioning from a constant to a copy. */
421 if (is_gimple_min_invariant (old_val.value)
422 && TREE_CODE (new_val.value) == SSA_NAME)
423 return true;
425 /* Allow transitioning from PHI <&x, not executable> == &x
426 to PHI <&x, &y> == common alignment. */
427 if (TREE_CODE (old_val.value) != INTEGER_CST
428 && TREE_CODE (new_val.value) == INTEGER_CST)
429 return true;
431 /* Bit-lattices have to agree in the still valid bits. */
432 if (TREE_CODE (old_val.value) == INTEGER_CST
433 && TREE_CODE (new_val.value) == INTEGER_CST)
434 return (wi::bit_and_not (wi::to_widest (old_val.value), new_val.mask)
435 == wi::bit_and_not (wi::to_widest (new_val.value), new_val.mask));
437 /* Otherwise constant values have to agree. */
438 if (operand_equal_p (old_val.value, new_val.value, 0))
439 return true;
441 /* At least the kinds and types should agree now. */
442 if (TREE_CODE (old_val.value) != TREE_CODE (new_val.value)
443 || !types_compatible_p (TREE_TYPE (old_val.value),
444 TREE_TYPE (new_val.value)))
445 return false;
447 /* For floats and !HONOR_NANS allow transitions from (partial) NaN
448 to non-NaN. */
449 tree type = TREE_TYPE (new_val.value);
450 if (SCALAR_FLOAT_TYPE_P (type)
451 && !HONOR_NANS (type))
453 if (REAL_VALUE_ISNAN (TREE_REAL_CST (old_val.value)))
454 return true;
456 else if (VECTOR_FLOAT_TYPE_P (type)
457 && !HONOR_NANS (type))
459 for (unsigned i = 0; i < VECTOR_CST_NELTS (old_val.value); ++i)
460 if (!REAL_VALUE_ISNAN
461 (TREE_REAL_CST (VECTOR_CST_ELT (old_val.value, i)))
462 && !operand_equal_p (VECTOR_CST_ELT (old_val.value, i),
463 VECTOR_CST_ELT (new_val.value, i), 0))
464 return false;
465 return true;
467 else if (COMPLEX_FLOAT_TYPE_P (type)
468 && !HONOR_NANS (type))
470 if (!REAL_VALUE_ISNAN (TREE_REAL_CST (TREE_REALPART (old_val.value)))
471 && !operand_equal_p (TREE_REALPART (old_val.value),
472 TREE_REALPART (new_val.value), 0))
473 return false;
474 if (!REAL_VALUE_ISNAN (TREE_REAL_CST (TREE_IMAGPART (old_val.value)))
475 && !operand_equal_p (TREE_IMAGPART (old_val.value),
476 TREE_IMAGPART (new_val.value), 0))
477 return false;
478 return true;
480 return false;
483 /* Set the value for variable VAR to NEW_VAL. Return true if the new
484 value is different from VAR's previous value. */
486 static bool
487 set_lattice_value (tree var, ccp_prop_value_t *new_val)
489 /* We can deal with old UNINITIALIZED values just fine here. */
490 ccp_prop_value_t *old_val = &const_val[SSA_NAME_VERSION (var)];
492 canonicalize_value (new_val);
494 /* We have to be careful to not go up the bitwise lattice
495 represented by the mask. Instead of dropping to VARYING
496 use the meet operator to retain a conservative value.
497 Missed optimizations like PR65851 makes this necessary.
498 It also ensures we converge to a stable lattice solution. */
499 if (new_val->lattice_val == CONSTANT
500 && old_val->lattice_val == CONSTANT
501 && TREE_CODE (new_val->value) != SSA_NAME)
502 ccp_lattice_meet (new_val, old_val);
504 gcc_checking_assert (valid_lattice_transition (*old_val, *new_val));
506 /* If *OLD_VAL and NEW_VAL are the same, return false to inform the
507 caller that this was a non-transition. */
508 if (old_val->lattice_val != new_val->lattice_val
509 || (new_val->lattice_val == CONSTANT
510 && (TREE_CODE (new_val->value) != TREE_CODE (old_val->value)
511 || (TREE_CODE (new_val->value) == INTEGER_CST
512 && (new_val->mask != old_val->mask
513 || (wi::bit_and_not (wi::to_widest (old_val->value),
514 new_val->mask)
515 != wi::bit_and_not (wi::to_widest (new_val->value),
516 new_val->mask))))
517 || (TREE_CODE (new_val->value) != INTEGER_CST
518 && !operand_equal_p (new_val->value, old_val->value, 0)))))
520 /* ??? We would like to delay creation of INTEGER_CSTs from
521 partially constants here. */
523 if (dump_file && (dump_flags & TDF_DETAILS))
525 dump_lattice_value (dump_file, "Lattice value changed to ", *new_val);
526 fprintf (dump_file, ". Adding SSA edges to worklist.\n");
529 *old_val = *new_val;
531 gcc_assert (new_val->lattice_val != UNINITIALIZED);
532 return true;
535 return false;
538 static ccp_prop_value_t get_value_for_expr (tree, bool);
539 static ccp_prop_value_t bit_value_binop (enum tree_code, tree, tree, tree);
540 static void bit_value_binop_1 (enum tree_code, tree, widest_int *, widest_int *,
541 tree, const widest_int &, const widest_int &,
542 tree, const widest_int &, const widest_int &);
544 /* Return a widest_int that can be used for bitwise simplifications
545 from VAL. */
547 static widest_int
548 value_to_wide_int (ccp_prop_value_t val)
550 if (val.value
551 && TREE_CODE (val.value) == INTEGER_CST)
552 return wi::to_widest (val.value);
554 return 0;
557 /* Return the value for the address expression EXPR based on alignment
558 information. */
560 static ccp_prop_value_t
561 get_value_from_alignment (tree expr)
563 tree type = TREE_TYPE (expr);
564 ccp_prop_value_t val;
565 unsigned HOST_WIDE_INT bitpos;
566 unsigned int align;
568 gcc_assert (TREE_CODE (expr) == ADDR_EXPR);
570 get_pointer_alignment_1 (expr, &align, &bitpos);
571 val.mask = (POINTER_TYPE_P (type) || TYPE_UNSIGNED (type)
572 ? wi::mask <widest_int> (TYPE_PRECISION (type), false)
573 : -1).and_not (align / BITS_PER_UNIT - 1);
574 val.lattice_val
575 = wi::sext (val.mask, TYPE_PRECISION (type)) == -1 ? VARYING : CONSTANT;
576 if (val.lattice_val == CONSTANT)
577 val.value = build_int_cstu (type, bitpos / BITS_PER_UNIT);
578 else
579 val.value = NULL_TREE;
581 return val;
584 /* Return the value for the tree operand EXPR. If FOR_BITS_P is true
585 return constant bits extracted from alignment information for
586 invariant addresses. */
588 static ccp_prop_value_t
589 get_value_for_expr (tree expr, bool for_bits_p)
591 ccp_prop_value_t val;
593 if (TREE_CODE (expr) == SSA_NAME)
595 val = *get_value (expr);
596 if (for_bits_p
597 && val.lattice_val == CONSTANT
598 && TREE_CODE (val.value) == ADDR_EXPR)
599 val = get_value_from_alignment (val.value);
600 /* Fall back to a copy value. */
601 if (!for_bits_p
602 && val.lattice_val == VARYING
603 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (expr))
605 val.lattice_val = CONSTANT;
606 val.value = expr;
607 val.mask = -1;
610 else if (is_gimple_min_invariant (expr)
611 && (!for_bits_p || TREE_CODE (expr) != ADDR_EXPR))
613 val.lattice_val = CONSTANT;
614 val.value = expr;
615 val.mask = 0;
616 canonicalize_value (&val);
618 else if (TREE_CODE (expr) == ADDR_EXPR)
619 val = get_value_from_alignment (expr);
620 else
622 val.lattice_val = VARYING;
623 val.mask = -1;
624 val.value = NULL_TREE;
627 if (val.lattice_val == VARYING
628 && TYPE_UNSIGNED (TREE_TYPE (expr)))
629 val.mask = wi::zext (val.mask, TYPE_PRECISION (TREE_TYPE (expr)));
631 return val;
634 /* Return the likely CCP lattice value for STMT.
636 If STMT has no operands, then return CONSTANT.
638 Else if undefinedness of operands of STMT cause its value to be
639 undefined, then return UNDEFINED.
641 Else if any operands of STMT are constants, then return CONSTANT.
643 Else return VARYING. */
645 static ccp_lattice_t
646 likely_value (gimple *stmt)
648 bool has_constant_operand, has_undefined_operand, all_undefined_operands;
649 bool has_nsa_operand;
650 tree use;
651 ssa_op_iter iter;
652 unsigned i;
654 enum gimple_code code = gimple_code (stmt);
656 /* This function appears to be called only for assignments, calls,
657 conditionals, and switches, due to the logic in visit_stmt. */
658 gcc_assert (code == GIMPLE_ASSIGN
659 || code == GIMPLE_CALL
660 || code == GIMPLE_COND
661 || code == GIMPLE_SWITCH);
663 /* If the statement has volatile operands, it won't fold to a
664 constant value. */
665 if (gimple_has_volatile_ops (stmt))
666 return VARYING;
668 /* Arrive here for more complex cases. */
669 has_constant_operand = false;
670 has_undefined_operand = false;
671 all_undefined_operands = true;
672 has_nsa_operand = false;
673 FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
675 ccp_prop_value_t *val = get_value (use);
677 if (val->lattice_val == UNDEFINED)
678 has_undefined_operand = true;
679 else
680 all_undefined_operands = false;
682 if (val->lattice_val == CONSTANT)
683 has_constant_operand = true;
685 if (SSA_NAME_IS_DEFAULT_DEF (use)
686 || !prop_simulate_again_p (SSA_NAME_DEF_STMT (use)))
687 has_nsa_operand = true;
690 /* There may be constants in regular rhs operands. For calls we
691 have to ignore lhs, fndecl and static chain, otherwise only
692 the lhs. */
693 for (i = (is_gimple_call (stmt) ? 2 : 0) + gimple_has_lhs (stmt);
694 i < gimple_num_ops (stmt); ++i)
696 tree op = gimple_op (stmt, i);
697 if (!op || TREE_CODE (op) == SSA_NAME)
698 continue;
699 if (is_gimple_min_invariant (op))
700 has_constant_operand = true;
703 if (has_constant_operand)
704 all_undefined_operands = false;
706 if (has_undefined_operand
707 && code == GIMPLE_CALL
708 && gimple_call_internal_p (stmt))
709 switch (gimple_call_internal_fn (stmt))
711 /* These 3 builtins use the first argument just as a magic
712 way how to find out a decl uid. */
713 case IFN_GOMP_SIMD_LANE:
714 case IFN_GOMP_SIMD_VF:
715 case IFN_GOMP_SIMD_LAST_LANE:
716 has_undefined_operand = false;
717 break;
718 default:
719 break;
722 /* If the operation combines operands like COMPLEX_EXPR make sure to
723 not mark the result UNDEFINED if only one part of the result is
724 undefined. */
725 if (has_undefined_operand && all_undefined_operands)
726 return UNDEFINED;
727 else if (code == GIMPLE_ASSIGN && has_undefined_operand)
729 switch (gimple_assign_rhs_code (stmt))
731 /* Unary operators are handled with all_undefined_operands. */
732 case PLUS_EXPR:
733 case MINUS_EXPR:
734 case POINTER_PLUS_EXPR:
735 /* Not MIN_EXPR, MAX_EXPR. One VARYING operand may be selected.
736 Not bitwise operators, one VARYING operand may specify the
737 result completely. Not logical operators for the same reason.
738 Not COMPLEX_EXPR as one VARYING operand makes the result partly
739 not UNDEFINED. Not *DIV_EXPR, comparisons and shifts because
740 the undefined operand may be promoted. */
741 return UNDEFINED;
743 case ADDR_EXPR:
744 /* If any part of an address is UNDEFINED, like the index
745 of an ARRAY_EXPR, then treat the result as UNDEFINED. */
746 return UNDEFINED;
748 default:
752 /* If there was an UNDEFINED operand but the result may be not UNDEFINED
753 fall back to CONSTANT. During iteration UNDEFINED may still drop
754 to CONSTANT. */
755 if (has_undefined_operand)
756 return CONSTANT;
758 /* We do not consider virtual operands here -- load from read-only
759 memory may have only VARYING virtual operands, but still be
760 constant. Also we can combine the stmt with definitions from
761 operands whose definitions are not simulated again. */
762 if (has_constant_operand
763 || has_nsa_operand
764 || gimple_references_memory_p (stmt))
765 return CONSTANT;
767 return VARYING;
770 /* Returns true if STMT cannot be constant. */
772 static bool
773 surely_varying_stmt_p (gimple *stmt)
775 /* If the statement has operands that we cannot handle, it cannot be
776 constant. */
777 if (gimple_has_volatile_ops (stmt))
778 return true;
780 /* If it is a call and does not return a value or is not a
781 builtin and not an indirect call or a call to function with
782 assume_aligned/alloc_align attribute, it is varying. */
783 if (is_gimple_call (stmt))
785 tree fndecl, fntype = gimple_call_fntype (stmt);
786 if (!gimple_call_lhs (stmt)
787 || ((fndecl = gimple_call_fndecl (stmt)) != NULL_TREE
788 && !DECL_BUILT_IN (fndecl)
789 && !lookup_attribute ("assume_aligned",
790 TYPE_ATTRIBUTES (fntype))
791 && !lookup_attribute ("alloc_align",
792 TYPE_ATTRIBUTES (fntype))))
793 return true;
796 /* Any other store operation is not interesting. */
797 else if (gimple_vdef (stmt))
798 return true;
800 /* Anything other than assignments and conditional jumps are not
801 interesting for CCP. */
802 if (gimple_code (stmt) != GIMPLE_ASSIGN
803 && gimple_code (stmt) != GIMPLE_COND
804 && gimple_code (stmt) != GIMPLE_SWITCH
805 && gimple_code (stmt) != GIMPLE_CALL)
806 return true;
808 return false;
811 /* Initialize local data structures for CCP. */
813 static void
814 ccp_initialize (void)
816 basic_block bb;
818 n_const_val = num_ssa_names;
819 const_val = XCNEWVEC (ccp_prop_value_t, n_const_val);
821 /* Initialize simulation flags for PHI nodes and statements. */
822 FOR_EACH_BB_FN (bb, cfun)
824 gimple_stmt_iterator i;
826 for (i = gsi_start_bb (bb); !gsi_end_p (i); gsi_next (&i))
828 gimple *stmt = gsi_stmt (i);
829 bool is_varying;
831 /* If the statement is a control insn, then we do not
832 want to avoid simulating the statement once. Failure
833 to do so means that those edges will never get added. */
834 if (stmt_ends_bb_p (stmt))
835 is_varying = false;
836 else
837 is_varying = surely_varying_stmt_p (stmt);
839 if (is_varying)
841 tree def;
842 ssa_op_iter iter;
844 /* If the statement will not produce a constant, mark
845 all its outputs VARYING. */
846 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
847 set_value_varying (def);
849 prop_set_simulate_again (stmt, !is_varying);
853 /* Now process PHI nodes. We never clear the simulate_again flag on
854 phi nodes, since we do not know which edges are executable yet,
855 except for phi nodes for virtual operands when we do not do store ccp. */
856 FOR_EACH_BB_FN (bb, cfun)
858 gphi_iterator i;
860 for (i = gsi_start_phis (bb); !gsi_end_p (i); gsi_next (&i))
862 gphi *phi = i.phi ();
864 if (virtual_operand_p (gimple_phi_result (phi)))
865 prop_set_simulate_again (phi, false);
866 else
867 prop_set_simulate_again (phi, true);
872 /* Debug count support. Reset the values of ssa names
873 VARYING when the total number ssa names analyzed is
874 beyond the debug count specified. */
876 static void
877 do_dbg_cnt (void)
879 unsigned i;
880 for (i = 0; i < num_ssa_names; i++)
882 if (!dbg_cnt (ccp))
884 const_val[i].lattice_val = VARYING;
885 const_val[i].mask = -1;
886 const_val[i].value = NULL_TREE;
892 /* Do final substitution of propagated values, cleanup the flowgraph and
893 free allocated storage. If NONZERO_P, record nonzero bits.
895 Return TRUE when something was optimized. */
897 static bool
898 ccp_finalize (bool nonzero_p)
900 bool something_changed;
901 unsigned i;
903 do_dbg_cnt ();
905 /* Derive alignment and misalignment information from partially
906 constant pointers in the lattice or nonzero bits from partially
907 constant integers. */
908 for (i = 1; i < num_ssa_names; ++i)
910 tree name = ssa_name (i);
911 ccp_prop_value_t *val;
912 unsigned int tem, align;
914 if (!name
915 || (!POINTER_TYPE_P (TREE_TYPE (name))
916 && (!INTEGRAL_TYPE_P (TREE_TYPE (name))
917 /* Don't record nonzero bits before IPA to avoid
918 using too much memory. */
919 || !nonzero_p)))
920 continue;
922 val = get_value (name);
923 if (val->lattice_val != CONSTANT
924 || TREE_CODE (val->value) != INTEGER_CST)
925 continue;
927 if (POINTER_TYPE_P (TREE_TYPE (name)))
929 /* Trailing mask bits specify the alignment, trailing value
930 bits the misalignment. */
931 tem = val->mask.to_uhwi ();
932 align = (tem & -tem);
933 if (align > 1)
934 set_ptr_info_alignment (get_ptr_info (name), align,
935 (TREE_INT_CST_LOW (val->value)
936 & (align - 1)));
938 else
940 unsigned int precision = TYPE_PRECISION (TREE_TYPE (val->value));
941 wide_int nonzero_bits = wide_int::from (val->mask, precision,
942 UNSIGNED) | val->value;
943 nonzero_bits &= get_nonzero_bits (name);
944 set_nonzero_bits (name, nonzero_bits);
948 /* Perform substitutions based on the known constant values. */
949 something_changed = substitute_and_fold (get_constant_value,
950 ccp_fold_stmt, true);
952 free (const_val);
953 const_val = NULL;
954 return something_changed;;
958 /* Compute the meet operator between *VAL1 and *VAL2. Store the result
959 in VAL1.
961 any M UNDEFINED = any
962 any M VARYING = VARYING
963 Ci M Cj = Ci if (i == j)
964 Ci M Cj = VARYING if (i != j)
967 static void
968 ccp_lattice_meet (ccp_prop_value_t *val1, ccp_prop_value_t *val2)
970 if (val1->lattice_val == UNDEFINED
971 /* For UNDEFINED M SSA we can't always SSA because its definition
972 may not dominate the PHI node. Doing optimistic copy propagation
973 also causes a lot of gcc.dg/uninit-pred*.c FAILs. */
974 && (val2->lattice_val != CONSTANT
975 || TREE_CODE (val2->value) != SSA_NAME))
977 /* UNDEFINED M any = any */
978 *val1 = *val2;
980 else if (val2->lattice_val == UNDEFINED
981 /* See above. */
982 && (val1->lattice_val != CONSTANT
983 || TREE_CODE (val1->value) != SSA_NAME))
985 /* any M UNDEFINED = any
986 Nothing to do. VAL1 already contains the value we want. */
989 else if (val1->lattice_val == VARYING
990 || val2->lattice_val == VARYING)
992 /* any M VARYING = VARYING. */
993 val1->lattice_val = VARYING;
994 val1->mask = -1;
995 val1->value = NULL_TREE;
997 else if (val1->lattice_val == CONSTANT
998 && val2->lattice_val == CONSTANT
999 && TREE_CODE (val1->value) == INTEGER_CST
1000 && TREE_CODE (val2->value) == INTEGER_CST)
1002 /* Ci M Cj = Ci if (i == j)
1003 Ci M Cj = VARYING if (i != j)
1005 For INTEGER_CSTs mask unequal bits. If no equal bits remain,
1006 drop to varying. */
1007 val1->mask = (val1->mask | val2->mask
1008 | (wi::to_widest (val1->value)
1009 ^ wi::to_widest (val2->value)));
1010 if (wi::sext (val1->mask, TYPE_PRECISION (TREE_TYPE (val1->value))) == -1)
1012 val1->lattice_val = VARYING;
1013 val1->value = NULL_TREE;
1016 else if (val1->lattice_val == CONSTANT
1017 && val2->lattice_val == CONSTANT
1018 && operand_equal_p (val1->value, val2->value, 0))
1020 /* Ci M Cj = Ci if (i == j)
1021 Ci M Cj = VARYING if (i != j)
1023 VAL1 already contains the value we want for equivalent values. */
1025 else if (val1->lattice_val == CONSTANT
1026 && val2->lattice_val == CONSTANT
1027 && (TREE_CODE (val1->value) == ADDR_EXPR
1028 || TREE_CODE (val2->value) == ADDR_EXPR))
1030 /* When not equal addresses are involved try meeting for
1031 alignment. */
1032 ccp_prop_value_t tem = *val2;
1033 if (TREE_CODE (val1->value) == ADDR_EXPR)
1034 *val1 = get_value_for_expr (val1->value, true);
1035 if (TREE_CODE (val2->value) == ADDR_EXPR)
1036 tem = get_value_for_expr (val2->value, true);
1037 ccp_lattice_meet (val1, &tem);
1039 else
1041 /* Any other combination is VARYING. */
1042 val1->lattice_val = VARYING;
1043 val1->mask = -1;
1044 val1->value = NULL_TREE;
1049 /* Loop through the PHI_NODE's parameters for BLOCK and compare their
1050 lattice values to determine PHI_NODE's lattice value. The value of a
1051 PHI node is determined calling ccp_lattice_meet with all the arguments
1052 of the PHI node that are incoming via executable edges. */
1054 static enum ssa_prop_result
1055 ccp_visit_phi_node (gphi *phi)
1057 unsigned i;
1058 ccp_prop_value_t new_val;
1060 if (dump_file && (dump_flags & TDF_DETAILS))
1062 fprintf (dump_file, "\nVisiting PHI node: ");
1063 print_gimple_stmt (dump_file, phi, 0, dump_flags);
1066 new_val.lattice_val = UNDEFINED;
1067 new_val.value = NULL_TREE;
1068 new_val.mask = 0;
1070 bool first = true;
1071 bool non_exec_edge = false;
1072 for (i = 0; i < gimple_phi_num_args (phi); i++)
1074 /* Compute the meet operator over all the PHI arguments flowing
1075 through executable edges. */
1076 edge e = gimple_phi_arg_edge (phi, i);
1078 if (dump_file && (dump_flags & TDF_DETAILS))
1080 fprintf (dump_file,
1081 "\n Argument #%d (%d -> %d %sexecutable)\n",
1082 i, e->src->index, e->dest->index,
1083 (e->flags & EDGE_EXECUTABLE) ? "" : "not ");
1086 /* If the incoming edge is executable, Compute the meet operator for
1087 the existing value of the PHI node and the current PHI argument. */
1088 if (e->flags & EDGE_EXECUTABLE)
1090 tree arg = gimple_phi_arg (phi, i)->def;
1091 ccp_prop_value_t arg_val = get_value_for_expr (arg, false);
1093 if (first)
1095 new_val = arg_val;
1096 first = false;
1098 else
1099 ccp_lattice_meet (&new_val, &arg_val);
1101 if (dump_file && (dump_flags & TDF_DETAILS))
1103 fprintf (dump_file, "\t");
1104 print_generic_expr (dump_file, arg, dump_flags);
1105 dump_lattice_value (dump_file, "\tValue: ", arg_val);
1106 fprintf (dump_file, "\n");
1109 if (new_val.lattice_val == VARYING)
1110 break;
1112 else
1113 non_exec_edge = true;
1116 /* In case there were non-executable edges and the value is a copy
1117 make sure its definition dominates the PHI node. */
1118 if (non_exec_edge
1119 && new_val.lattice_val == CONSTANT
1120 && TREE_CODE (new_val.value) == SSA_NAME
1121 && ! SSA_NAME_IS_DEFAULT_DEF (new_val.value)
1122 && ! dominated_by_p (CDI_DOMINATORS, gimple_bb (phi),
1123 gimple_bb (SSA_NAME_DEF_STMT (new_val.value))))
1125 new_val.lattice_val = VARYING;
1126 new_val.value = NULL_TREE;
1127 new_val.mask = -1;
1130 if (dump_file && (dump_flags & TDF_DETAILS))
1132 dump_lattice_value (dump_file, "\n PHI node value: ", new_val);
1133 fprintf (dump_file, "\n\n");
1136 /* Make the transition to the new value. */
1137 if (set_lattice_value (gimple_phi_result (phi), &new_val))
1139 if (new_val.lattice_val == VARYING)
1140 return SSA_PROP_VARYING;
1141 else
1142 return SSA_PROP_INTERESTING;
1144 else
1145 return SSA_PROP_NOT_INTERESTING;
1148 /* Return the constant value for OP or OP otherwise. */
1150 static tree
1151 valueize_op (tree op)
1153 if (TREE_CODE (op) == SSA_NAME)
1155 tree tem = get_constant_value (op);
1156 if (tem)
1157 return tem;
1159 return op;
1162 /* Return the constant value for OP, but signal to not follow SSA
1163 edges if the definition may be simulated again. */
1165 static tree
1166 valueize_op_1 (tree op)
1168 if (TREE_CODE (op) == SSA_NAME)
1170 /* If the definition may be simulated again we cannot follow
1171 this SSA edge as the SSA propagator does not necessarily
1172 re-visit the use. */
1173 gimple *def_stmt = SSA_NAME_DEF_STMT (op);
1174 if (!gimple_nop_p (def_stmt)
1175 && prop_simulate_again_p (def_stmt))
1176 return NULL_TREE;
1177 tree tem = get_constant_value (op);
1178 if (tem)
1179 return tem;
1181 return op;
1184 /* CCP specific front-end to the non-destructive constant folding
1185 routines.
1187 Attempt to simplify the RHS of STMT knowing that one or more
1188 operands are constants.
1190 If simplification is possible, return the simplified RHS,
1191 otherwise return the original RHS or NULL_TREE. */
1193 static tree
1194 ccp_fold (gimple *stmt)
1196 location_t loc = gimple_location (stmt);
1197 switch (gimple_code (stmt))
1199 case GIMPLE_COND:
1201 /* Handle comparison operators that can appear in GIMPLE form. */
1202 tree op0 = valueize_op (gimple_cond_lhs (stmt));
1203 tree op1 = valueize_op (gimple_cond_rhs (stmt));
1204 enum tree_code code = gimple_cond_code (stmt);
1205 return fold_binary_loc (loc, code, boolean_type_node, op0, op1);
1208 case GIMPLE_SWITCH:
1210 /* Return the constant switch index. */
1211 return valueize_op (gimple_switch_index (as_a <gswitch *> (stmt)));
1214 case GIMPLE_ASSIGN:
1215 case GIMPLE_CALL:
1216 return gimple_fold_stmt_to_constant_1 (stmt,
1217 valueize_op, valueize_op_1);
1219 default:
1220 gcc_unreachable ();
1224 /* Apply the operation CODE in type TYPE to the value, mask pair
1225 RVAL and RMASK representing a value of type RTYPE and set
1226 the value, mask pair *VAL and *MASK to the result. */
1228 static void
1229 bit_value_unop_1 (enum tree_code code, tree type,
1230 widest_int *val, widest_int *mask,
1231 tree rtype, const widest_int &rval, const widest_int &rmask)
1233 switch (code)
1235 case BIT_NOT_EXPR:
1236 *mask = rmask;
1237 *val = ~rval;
1238 break;
1240 case NEGATE_EXPR:
1242 widest_int temv, temm;
1243 /* Return ~rval + 1. */
1244 bit_value_unop_1 (BIT_NOT_EXPR, type, &temv, &temm, type, rval, rmask);
1245 bit_value_binop_1 (PLUS_EXPR, type, val, mask,
1246 type, temv, temm, type, 1, 0);
1247 break;
1250 CASE_CONVERT:
1252 signop sgn;
1254 /* First extend mask and value according to the original type. */
1255 sgn = TYPE_SIGN (rtype);
1256 *mask = wi::ext (rmask, TYPE_PRECISION (rtype), sgn);
1257 *val = wi::ext (rval, TYPE_PRECISION (rtype), sgn);
1259 /* Then extend mask and value according to the target type. */
1260 sgn = TYPE_SIGN (type);
1261 *mask = wi::ext (*mask, TYPE_PRECISION (type), sgn);
1262 *val = wi::ext (*val, TYPE_PRECISION (type), sgn);
1263 break;
1266 default:
1267 *mask = -1;
1268 break;
1272 /* Apply the operation CODE in type TYPE to the value, mask pairs
1273 R1VAL, R1MASK and R2VAL, R2MASK representing a values of type R1TYPE
1274 and R2TYPE and set the value, mask pair *VAL and *MASK to the result. */
1276 static void
1277 bit_value_binop_1 (enum tree_code code, tree type,
1278 widest_int *val, widest_int *mask,
1279 tree r1type, const widest_int &r1val,
1280 const widest_int &r1mask, tree r2type,
1281 const widest_int &r2val, const widest_int &r2mask)
1283 signop sgn = TYPE_SIGN (type);
1284 int width = TYPE_PRECISION (type);
1285 bool swap_p = false;
1287 /* Assume we'll get a constant result. Use an initial non varying
1288 value, we fall back to varying in the end if necessary. */
1289 *mask = -1;
1291 switch (code)
1293 case BIT_AND_EXPR:
1294 /* The mask is constant where there is a known not
1295 set bit, (m1 | m2) & ((v1 | m1) & (v2 | m2)) */
1296 *mask = (r1mask | r2mask) & (r1val | r1mask) & (r2val | r2mask);
1297 *val = r1val & r2val;
1298 break;
1300 case BIT_IOR_EXPR:
1301 /* The mask is constant where there is a known
1302 set bit, (m1 | m2) & ~((v1 & ~m1) | (v2 & ~m2)). */
1303 *mask = (r1mask | r2mask)
1304 .and_not (r1val.and_not (r1mask) | r2val.and_not (r2mask));
1305 *val = r1val | r2val;
1306 break;
1308 case BIT_XOR_EXPR:
1309 /* m1 | m2 */
1310 *mask = r1mask | r2mask;
1311 *val = r1val ^ r2val;
1312 break;
1314 case LROTATE_EXPR:
1315 case RROTATE_EXPR:
1316 if (r2mask == 0)
1318 widest_int shift = r2val;
1319 if (shift == 0)
1321 *mask = r1mask;
1322 *val = r1val;
1324 else
1326 if (wi::neg_p (shift))
1328 shift = -shift;
1329 if (code == RROTATE_EXPR)
1330 code = LROTATE_EXPR;
1331 else
1332 code = RROTATE_EXPR;
1334 if (code == RROTATE_EXPR)
1336 *mask = wi::rrotate (r1mask, shift, width);
1337 *val = wi::rrotate (r1val, shift, width);
1339 else
1341 *mask = wi::lrotate (r1mask, shift, width);
1342 *val = wi::lrotate (r1val, shift, width);
1346 break;
1348 case LSHIFT_EXPR:
1349 case RSHIFT_EXPR:
1350 /* ??? We can handle partially known shift counts if we know
1351 its sign. That way we can tell that (x << (y | 8)) & 255
1352 is zero. */
1353 if (r2mask == 0)
1355 widest_int shift = r2val;
1356 if (shift == 0)
1358 *mask = r1mask;
1359 *val = r1val;
1361 else
1363 if (wi::neg_p (shift))
1365 shift = -shift;
1366 if (code == RSHIFT_EXPR)
1367 code = LSHIFT_EXPR;
1368 else
1369 code = RSHIFT_EXPR;
1371 if (code == RSHIFT_EXPR)
1373 *mask = wi::rshift (wi::ext (r1mask, width, sgn), shift, sgn);
1374 *val = wi::rshift (wi::ext (r1val, width, sgn), shift, sgn);
1376 else
1378 *mask = wi::ext (r1mask << shift, width, sgn);
1379 *val = wi::ext (r1val << shift, width, sgn);
1383 break;
1385 case PLUS_EXPR:
1386 case POINTER_PLUS_EXPR:
1388 /* Do the addition with unknown bits set to zero, to give carry-ins of
1389 zero wherever possible. */
1390 widest_int lo = r1val.and_not (r1mask) + r2val.and_not (r2mask);
1391 lo = wi::ext (lo, width, sgn);
1392 /* Do the addition with unknown bits set to one, to give carry-ins of
1393 one wherever possible. */
1394 widest_int hi = (r1val | r1mask) + (r2val | r2mask);
1395 hi = wi::ext (hi, width, sgn);
1396 /* Each bit in the result is known if (a) the corresponding bits in
1397 both inputs are known, and (b) the carry-in to that bit position
1398 is known. We can check condition (b) by seeing if we got the same
1399 result with minimised carries as with maximised carries. */
1400 *mask = r1mask | r2mask | (lo ^ hi);
1401 *mask = wi::ext (*mask, width, sgn);
1402 /* It shouldn't matter whether we choose lo or hi here. */
1403 *val = lo;
1404 break;
1407 case MINUS_EXPR:
1409 widest_int temv, temm;
1410 bit_value_unop_1 (NEGATE_EXPR, r2type, &temv, &temm,
1411 r2type, r2val, r2mask);
1412 bit_value_binop_1 (PLUS_EXPR, type, val, mask,
1413 r1type, r1val, r1mask,
1414 r2type, temv, temm);
1415 break;
1418 case MULT_EXPR:
1420 /* Just track trailing zeros in both operands and transfer
1421 them to the other. */
1422 int r1tz = wi::ctz (r1val | r1mask);
1423 int r2tz = wi::ctz (r2val | r2mask);
1424 if (r1tz + r2tz >= width)
1426 *mask = 0;
1427 *val = 0;
1429 else if (r1tz + r2tz > 0)
1431 *mask = wi::ext (wi::mask <widest_int> (r1tz + r2tz, true),
1432 width, sgn);
1433 *val = 0;
1435 break;
1438 case EQ_EXPR:
1439 case NE_EXPR:
1441 widest_int m = r1mask | r2mask;
1442 if (r1val.and_not (m) != r2val.and_not (m))
1444 *mask = 0;
1445 *val = ((code == EQ_EXPR) ? 0 : 1);
1447 else
1449 /* We know the result of a comparison is always one or zero. */
1450 *mask = 1;
1451 *val = 0;
1453 break;
1456 case GE_EXPR:
1457 case GT_EXPR:
1458 swap_p = true;
1459 code = swap_tree_comparison (code);
1460 /* Fall through. */
1461 case LT_EXPR:
1462 case LE_EXPR:
1464 int minmax, maxmin;
1466 const widest_int &o1val = swap_p ? r2val : r1val;
1467 const widest_int &o1mask = swap_p ? r2mask : r1mask;
1468 const widest_int &o2val = swap_p ? r1val : r2val;
1469 const widest_int &o2mask = swap_p ? r1mask : r2mask;
1471 /* If the most significant bits are not known we know nothing. */
1472 if (wi::neg_p (o1mask) || wi::neg_p (o2mask))
1473 break;
1475 /* For comparisons the signedness is in the comparison operands. */
1476 sgn = TYPE_SIGN (r1type);
1478 /* If we know the most significant bits we know the values
1479 value ranges by means of treating varying bits as zero
1480 or one. Do a cross comparison of the max/min pairs. */
1481 maxmin = wi::cmp (o1val | o1mask, o2val.and_not (o2mask), sgn);
1482 minmax = wi::cmp (o1val.and_not (o1mask), o2val | o2mask, sgn);
1483 if (maxmin < 0) /* o1 is less than o2. */
1485 *mask = 0;
1486 *val = 1;
1488 else if (minmax > 0) /* o1 is not less or equal to o2. */
1490 *mask = 0;
1491 *val = 0;
1493 else if (maxmin == minmax) /* o1 and o2 are equal. */
1495 /* This probably should never happen as we'd have
1496 folded the thing during fully constant value folding. */
1497 *mask = 0;
1498 *val = (code == LE_EXPR ? 1 : 0);
1500 else
1502 /* We know the result of a comparison is always one or zero. */
1503 *mask = 1;
1504 *val = 0;
1506 break;
1509 default:;
1513 /* Return the propagation value when applying the operation CODE to
1514 the value RHS yielding type TYPE. */
1516 static ccp_prop_value_t
1517 bit_value_unop (enum tree_code code, tree type, tree rhs)
1519 ccp_prop_value_t rval = get_value_for_expr (rhs, true);
1520 widest_int value, mask;
1521 ccp_prop_value_t val;
1523 if (rval.lattice_val == UNDEFINED)
1524 return rval;
1526 gcc_assert ((rval.lattice_val == CONSTANT
1527 && TREE_CODE (rval.value) == INTEGER_CST)
1528 || wi::sext (rval.mask, TYPE_PRECISION (TREE_TYPE (rhs))) == -1);
1529 bit_value_unop_1 (code, type, &value, &mask,
1530 TREE_TYPE (rhs), value_to_wide_int (rval), rval.mask);
1531 if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
1533 val.lattice_val = CONSTANT;
1534 val.mask = mask;
1535 /* ??? Delay building trees here. */
1536 val.value = wide_int_to_tree (type, value);
1538 else
1540 val.lattice_val = VARYING;
1541 val.value = NULL_TREE;
1542 val.mask = -1;
1544 return val;
1547 /* Return the propagation value when applying the operation CODE to
1548 the values RHS1 and RHS2 yielding type TYPE. */
1550 static ccp_prop_value_t
1551 bit_value_binop (enum tree_code code, tree type, tree rhs1, tree rhs2)
1553 ccp_prop_value_t r1val = get_value_for_expr (rhs1, true);
1554 ccp_prop_value_t r2val = get_value_for_expr (rhs2, true);
1555 widest_int value, mask;
1556 ccp_prop_value_t val;
1558 if (r1val.lattice_val == UNDEFINED
1559 || r2val.lattice_val == UNDEFINED)
1561 val.lattice_val = VARYING;
1562 val.value = NULL_TREE;
1563 val.mask = -1;
1564 return val;
1567 gcc_assert ((r1val.lattice_val == CONSTANT
1568 && TREE_CODE (r1val.value) == INTEGER_CST)
1569 || wi::sext (r1val.mask,
1570 TYPE_PRECISION (TREE_TYPE (rhs1))) == -1);
1571 gcc_assert ((r2val.lattice_val == CONSTANT
1572 && TREE_CODE (r2val.value) == INTEGER_CST)
1573 || wi::sext (r2val.mask,
1574 TYPE_PRECISION (TREE_TYPE (rhs2))) == -1);
1575 bit_value_binop_1 (code, type, &value, &mask,
1576 TREE_TYPE (rhs1), value_to_wide_int (r1val), r1val.mask,
1577 TREE_TYPE (rhs2), value_to_wide_int (r2val), r2val.mask);
1578 if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
1580 val.lattice_val = CONSTANT;
1581 val.mask = mask;
1582 /* ??? Delay building trees here. */
1583 val.value = wide_int_to_tree (type, value);
1585 else
1587 val.lattice_val = VARYING;
1588 val.value = NULL_TREE;
1589 val.mask = -1;
1591 return val;
1594 /* Return the propagation value for __builtin_assume_aligned
1595 and functions with assume_aligned or alloc_aligned attribute.
1596 For __builtin_assume_aligned, ATTR is NULL_TREE,
1597 for assume_aligned attribute ATTR is non-NULL and ALLOC_ALIGNED
1598 is false, for alloc_aligned attribute ATTR is non-NULL and
1599 ALLOC_ALIGNED is true. */
1601 static ccp_prop_value_t
1602 bit_value_assume_aligned (gimple *stmt, tree attr, ccp_prop_value_t ptrval,
1603 bool alloc_aligned)
1605 tree align, misalign = NULL_TREE, type;
1606 unsigned HOST_WIDE_INT aligni, misaligni = 0;
1607 ccp_prop_value_t alignval;
1608 widest_int value, mask;
1609 ccp_prop_value_t val;
1611 if (attr == NULL_TREE)
1613 tree ptr = gimple_call_arg (stmt, 0);
1614 type = TREE_TYPE (ptr);
1615 ptrval = get_value_for_expr (ptr, true);
1617 else
1619 tree lhs = gimple_call_lhs (stmt);
1620 type = TREE_TYPE (lhs);
1623 if (ptrval.lattice_val == UNDEFINED)
1624 return ptrval;
1625 gcc_assert ((ptrval.lattice_val == CONSTANT
1626 && TREE_CODE (ptrval.value) == INTEGER_CST)
1627 || wi::sext (ptrval.mask, TYPE_PRECISION (type)) == -1);
1628 if (attr == NULL_TREE)
1630 /* Get aligni and misaligni from __builtin_assume_aligned. */
1631 align = gimple_call_arg (stmt, 1);
1632 if (!tree_fits_uhwi_p (align))
1633 return ptrval;
1634 aligni = tree_to_uhwi (align);
1635 if (gimple_call_num_args (stmt) > 2)
1637 misalign = gimple_call_arg (stmt, 2);
1638 if (!tree_fits_uhwi_p (misalign))
1639 return ptrval;
1640 misaligni = tree_to_uhwi (misalign);
1643 else
1645 /* Get aligni and misaligni from assume_aligned or
1646 alloc_align attributes. */
1647 if (TREE_VALUE (attr) == NULL_TREE)
1648 return ptrval;
1649 attr = TREE_VALUE (attr);
1650 align = TREE_VALUE (attr);
1651 if (!tree_fits_uhwi_p (align))
1652 return ptrval;
1653 aligni = tree_to_uhwi (align);
1654 if (alloc_aligned)
1656 if (aligni == 0 || aligni > gimple_call_num_args (stmt))
1657 return ptrval;
1658 align = gimple_call_arg (stmt, aligni - 1);
1659 if (!tree_fits_uhwi_p (align))
1660 return ptrval;
1661 aligni = tree_to_uhwi (align);
1663 else if (TREE_CHAIN (attr) && TREE_VALUE (TREE_CHAIN (attr)))
1665 misalign = TREE_VALUE (TREE_CHAIN (attr));
1666 if (!tree_fits_uhwi_p (misalign))
1667 return ptrval;
1668 misaligni = tree_to_uhwi (misalign);
1671 if (aligni <= 1 || (aligni & (aligni - 1)) != 0 || misaligni >= aligni)
1672 return ptrval;
1674 align = build_int_cst_type (type, -aligni);
1675 alignval = get_value_for_expr (align, true);
1676 bit_value_binop_1 (BIT_AND_EXPR, type, &value, &mask,
1677 type, value_to_wide_int (ptrval), ptrval.mask,
1678 type, value_to_wide_int (alignval), alignval.mask);
1679 if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
1681 val.lattice_val = CONSTANT;
1682 val.mask = mask;
1683 gcc_assert ((mask.to_uhwi () & (aligni - 1)) == 0);
1684 gcc_assert ((value.to_uhwi () & (aligni - 1)) == 0);
1685 value |= misaligni;
1686 /* ??? Delay building trees here. */
1687 val.value = wide_int_to_tree (type, value);
1689 else
1691 val.lattice_val = VARYING;
1692 val.value = NULL_TREE;
1693 val.mask = -1;
1695 return val;
1698 /* Evaluate statement STMT.
1699 Valid only for assignments, calls, conditionals, and switches. */
1701 static ccp_prop_value_t
1702 evaluate_stmt (gimple *stmt)
1704 ccp_prop_value_t val;
1705 tree simplified = NULL_TREE;
1706 ccp_lattice_t likelyvalue = likely_value (stmt);
1707 bool is_constant = false;
1708 unsigned int align;
1710 if (dump_file && (dump_flags & TDF_DETAILS))
1712 fprintf (dump_file, "which is likely ");
1713 switch (likelyvalue)
1715 case CONSTANT:
1716 fprintf (dump_file, "CONSTANT");
1717 break;
1718 case UNDEFINED:
1719 fprintf (dump_file, "UNDEFINED");
1720 break;
1721 case VARYING:
1722 fprintf (dump_file, "VARYING");
1723 break;
1724 default:;
1726 fprintf (dump_file, "\n");
1729 /* If the statement is likely to have a CONSTANT result, then try
1730 to fold the statement to determine the constant value. */
1731 /* FIXME. This is the only place that we call ccp_fold.
1732 Since likely_value never returns CONSTANT for calls, we will
1733 not attempt to fold them, including builtins that may profit. */
1734 if (likelyvalue == CONSTANT)
1736 fold_defer_overflow_warnings ();
1737 simplified = ccp_fold (stmt);
1738 if (simplified && TREE_CODE (simplified) == SSA_NAME)
1740 val = *get_value (simplified);
1741 if (val.lattice_val != VARYING)
1743 fold_undefer_overflow_warnings (true, stmt, 0);
1744 return val;
1747 is_constant = simplified && is_gimple_min_invariant (simplified);
1748 fold_undefer_overflow_warnings (is_constant, stmt, 0);
1749 if (is_constant)
1751 /* The statement produced a constant value. */
1752 val.lattice_val = CONSTANT;
1753 val.value = simplified;
1754 val.mask = 0;
1755 return val;
1758 /* If the statement is likely to have a VARYING result, then do not
1759 bother folding the statement. */
1760 else if (likelyvalue == VARYING)
1762 enum gimple_code code = gimple_code (stmt);
1763 if (code == GIMPLE_ASSIGN)
1765 enum tree_code subcode = gimple_assign_rhs_code (stmt);
1767 /* Other cases cannot satisfy is_gimple_min_invariant
1768 without folding. */
1769 if (get_gimple_rhs_class (subcode) == GIMPLE_SINGLE_RHS)
1770 simplified = gimple_assign_rhs1 (stmt);
1772 else if (code == GIMPLE_SWITCH)
1773 simplified = gimple_switch_index (as_a <gswitch *> (stmt));
1774 else
1775 /* These cannot satisfy is_gimple_min_invariant without folding. */
1776 gcc_assert (code == GIMPLE_CALL || code == GIMPLE_COND);
1777 is_constant = simplified && is_gimple_min_invariant (simplified);
1778 if (is_constant)
1780 /* The statement produced a constant value. */
1781 val.lattice_val = CONSTANT;
1782 val.value = simplified;
1783 val.mask = 0;
1786 /* If the statement result is likely UNDEFINED, make it so. */
1787 else if (likelyvalue == UNDEFINED)
1789 val.lattice_val = UNDEFINED;
1790 val.value = NULL_TREE;
1791 val.mask = 0;
1792 return val;
1795 /* Resort to simplification for bitwise tracking. */
1796 if (flag_tree_bit_ccp
1797 && (likelyvalue == CONSTANT || is_gimple_call (stmt)
1798 || (gimple_assign_single_p (stmt)
1799 && gimple_assign_rhs_code (stmt) == ADDR_EXPR))
1800 && !is_constant)
1802 enum gimple_code code = gimple_code (stmt);
1803 val.lattice_val = VARYING;
1804 val.value = NULL_TREE;
1805 val.mask = -1;
1806 if (code == GIMPLE_ASSIGN)
1808 enum tree_code subcode = gimple_assign_rhs_code (stmt);
1809 tree rhs1 = gimple_assign_rhs1 (stmt);
1810 tree lhs = gimple_assign_lhs (stmt);
1811 if ((INTEGRAL_TYPE_P (TREE_TYPE (lhs))
1812 || POINTER_TYPE_P (TREE_TYPE (lhs)))
1813 && (INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
1814 || POINTER_TYPE_P (TREE_TYPE (rhs1))))
1815 switch (get_gimple_rhs_class (subcode))
1817 case GIMPLE_SINGLE_RHS:
1818 val = get_value_for_expr (rhs1, true);
1819 break;
1821 case GIMPLE_UNARY_RHS:
1822 val = bit_value_unop (subcode, TREE_TYPE (lhs), rhs1);
1823 break;
1825 case GIMPLE_BINARY_RHS:
1826 val = bit_value_binop (subcode, TREE_TYPE (lhs), rhs1,
1827 gimple_assign_rhs2 (stmt));
1828 break;
1830 default:;
1833 else if (code == GIMPLE_COND)
1835 enum tree_code code = gimple_cond_code (stmt);
1836 tree rhs1 = gimple_cond_lhs (stmt);
1837 tree rhs2 = gimple_cond_rhs (stmt);
1838 if (INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
1839 || POINTER_TYPE_P (TREE_TYPE (rhs1)))
1840 val = bit_value_binop (code, TREE_TYPE (rhs1), rhs1, rhs2);
1842 else if (gimple_call_builtin_p (stmt, BUILT_IN_NORMAL))
1844 tree fndecl = gimple_call_fndecl (stmt);
1845 switch (DECL_FUNCTION_CODE (fndecl))
1847 case BUILT_IN_MALLOC:
1848 case BUILT_IN_REALLOC:
1849 case BUILT_IN_CALLOC:
1850 case BUILT_IN_STRDUP:
1851 case BUILT_IN_STRNDUP:
1852 val.lattice_val = CONSTANT;
1853 val.value = build_int_cst (TREE_TYPE (gimple_get_lhs (stmt)), 0);
1854 val.mask = ~((HOST_WIDE_INT) MALLOC_ABI_ALIGNMENT
1855 / BITS_PER_UNIT - 1);
1856 break;
1858 case BUILT_IN_ALLOCA:
1859 case BUILT_IN_ALLOCA_WITH_ALIGN:
1860 align = (DECL_FUNCTION_CODE (fndecl) == BUILT_IN_ALLOCA_WITH_ALIGN
1861 ? TREE_INT_CST_LOW (gimple_call_arg (stmt, 1))
1862 : BIGGEST_ALIGNMENT);
1863 val.lattice_val = CONSTANT;
1864 val.value = build_int_cst (TREE_TYPE (gimple_get_lhs (stmt)), 0);
1865 val.mask = ~((HOST_WIDE_INT) align / BITS_PER_UNIT - 1);
1866 break;
1868 /* These builtins return their first argument, unmodified. */
1869 case BUILT_IN_MEMCPY:
1870 case BUILT_IN_MEMMOVE:
1871 case BUILT_IN_MEMSET:
1872 case BUILT_IN_STRCPY:
1873 case BUILT_IN_STRNCPY:
1874 case BUILT_IN_MEMCPY_CHK:
1875 case BUILT_IN_MEMMOVE_CHK:
1876 case BUILT_IN_MEMSET_CHK:
1877 case BUILT_IN_STRCPY_CHK:
1878 case BUILT_IN_STRNCPY_CHK:
1879 val = get_value_for_expr (gimple_call_arg (stmt, 0), true);
1880 break;
1882 case BUILT_IN_ASSUME_ALIGNED:
1883 val = bit_value_assume_aligned (stmt, NULL_TREE, val, false);
1884 break;
1886 case BUILT_IN_ALIGNED_ALLOC:
1888 tree align = get_constant_value (gimple_call_arg (stmt, 0));
1889 if (align
1890 && tree_fits_uhwi_p (align))
1892 unsigned HOST_WIDE_INT aligni = tree_to_uhwi (align);
1893 if (aligni > 1
1894 /* align must be power-of-two */
1895 && (aligni & (aligni - 1)) == 0)
1897 val.lattice_val = CONSTANT;
1898 val.value = build_int_cst (ptr_type_node, 0);
1899 val.mask = -aligni;
1902 break;
1905 default:;
1908 if (is_gimple_call (stmt) && gimple_call_lhs (stmt))
1910 tree fntype = gimple_call_fntype (stmt);
1911 if (fntype)
1913 tree attrs = lookup_attribute ("assume_aligned",
1914 TYPE_ATTRIBUTES (fntype));
1915 if (attrs)
1916 val = bit_value_assume_aligned (stmt, attrs, val, false);
1917 attrs = lookup_attribute ("alloc_align",
1918 TYPE_ATTRIBUTES (fntype));
1919 if (attrs)
1920 val = bit_value_assume_aligned (stmt, attrs, val, true);
1923 is_constant = (val.lattice_val == CONSTANT);
1926 if (flag_tree_bit_ccp
1927 && ((is_constant && TREE_CODE (val.value) == INTEGER_CST)
1928 || !is_constant)
1929 && gimple_get_lhs (stmt)
1930 && TREE_CODE (gimple_get_lhs (stmt)) == SSA_NAME)
1932 tree lhs = gimple_get_lhs (stmt);
1933 wide_int nonzero_bits = get_nonzero_bits (lhs);
1934 if (nonzero_bits != -1)
1936 if (!is_constant)
1938 val.lattice_val = CONSTANT;
1939 val.value = build_zero_cst (TREE_TYPE (lhs));
1940 val.mask = extend_mask (nonzero_bits);
1941 is_constant = true;
1943 else
1945 if (wi::bit_and_not (val.value, nonzero_bits) != 0)
1946 val.value = wide_int_to_tree (TREE_TYPE (lhs),
1947 nonzero_bits & val.value);
1948 if (nonzero_bits == 0)
1949 val.mask = 0;
1950 else
1951 val.mask = val.mask & extend_mask (nonzero_bits);
1956 /* The statement produced a nonconstant value. */
1957 if (!is_constant)
1959 /* The statement produced a copy. */
1960 if (simplified && TREE_CODE (simplified) == SSA_NAME
1961 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (simplified))
1963 val.lattice_val = CONSTANT;
1964 val.value = simplified;
1965 val.mask = -1;
1967 /* The statement is VARYING. */
1968 else
1970 val.lattice_val = VARYING;
1971 val.value = NULL_TREE;
1972 val.mask = -1;
1976 return val;
1979 typedef hash_table<nofree_ptr_hash<gimple> > gimple_htab;
1981 /* Given a BUILT_IN_STACK_SAVE value SAVED_VAL, insert a clobber of VAR before
1982 each matching BUILT_IN_STACK_RESTORE. Mark visited phis in VISITED. */
1984 static void
1985 insert_clobber_before_stack_restore (tree saved_val, tree var,
1986 gimple_htab **visited)
1988 gimple *stmt;
1989 gassign *clobber_stmt;
1990 tree clobber;
1991 imm_use_iterator iter;
1992 gimple_stmt_iterator i;
1993 gimple **slot;
1995 FOR_EACH_IMM_USE_STMT (stmt, iter, saved_val)
1996 if (gimple_call_builtin_p (stmt, BUILT_IN_STACK_RESTORE))
1998 clobber = build_constructor (TREE_TYPE (var),
1999 NULL);
2000 TREE_THIS_VOLATILE (clobber) = 1;
2001 clobber_stmt = gimple_build_assign (var, clobber);
2003 i = gsi_for_stmt (stmt);
2004 gsi_insert_before (&i, clobber_stmt, GSI_SAME_STMT);
2006 else if (gimple_code (stmt) == GIMPLE_PHI)
2008 if (!*visited)
2009 *visited = new gimple_htab (10);
2011 slot = (*visited)->find_slot (stmt, INSERT);
2012 if (*slot != NULL)
2013 continue;
2015 *slot = stmt;
2016 insert_clobber_before_stack_restore (gimple_phi_result (stmt), var,
2017 visited);
2019 else if (gimple_assign_ssa_name_copy_p (stmt))
2020 insert_clobber_before_stack_restore (gimple_assign_lhs (stmt), var,
2021 visited);
2022 else if (chkp_gimple_call_builtin_p (stmt, BUILT_IN_CHKP_BNDRET))
2023 continue;
2024 else
2025 gcc_assert (is_gimple_debug (stmt));
2028 /* Advance the iterator to the previous non-debug gimple statement in the same
2029 or dominating basic block. */
2031 static inline void
2032 gsi_prev_dom_bb_nondebug (gimple_stmt_iterator *i)
2034 basic_block dom;
2036 gsi_prev_nondebug (i);
2037 while (gsi_end_p (*i))
2039 dom = get_immediate_dominator (CDI_DOMINATORS, i->bb);
2040 if (dom == NULL || dom == ENTRY_BLOCK_PTR_FOR_FN (cfun))
2041 return;
2043 *i = gsi_last_bb (dom);
2047 /* Find a BUILT_IN_STACK_SAVE dominating gsi_stmt (I), and insert
2048 a clobber of VAR before each matching BUILT_IN_STACK_RESTORE.
2050 It is possible that BUILT_IN_STACK_SAVE cannot be find in a dominator when a
2051 previous pass (such as DOM) duplicated it along multiple paths to a BB. In
2052 that case the function gives up without inserting the clobbers. */
2054 static void
2055 insert_clobbers_for_var (gimple_stmt_iterator i, tree var)
2057 gimple *stmt;
2058 tree saved_val;
2059 gimple_htab *visited = NULL;
2061 for (; !gsi_end_p (i); gsi_prev_dom_bb_nondebug (&i))
2063 stmt = gsi_stmt (i);
2065 if (!gimple_call_builtin_p (stmt, BUILT_IN_STACK_SAVE))
2066 continue;
2068 saved_val = gimple_call_lhs (stmt);
2069 if (saved_val == NULL_TREE)
2070 continue;
2072 insert_clobber_before_stack_restore (saved_val, var, &visited);
2073 break;
2076 delete visited;
2079 /* Detects a __builtin_alloca_with_align with constant size argument. Declares
2080 fixed-size array and returns the address, if found, otherwise returns
2081 NULL_TREE. */
2083 static tree
2084 fold_builtin_alloca_with_align (gimple *stmt)
2086 unsigned HOST_WIDE_INT size, threshold, n_elem;
2087 tree lhs, arg, block, var, elem_type, array_type;
2089 /* Get lhs. */
2090 lhs = gimple_call_lhs (stmt);
2091 if (lhs == NULL_TREE)
2092 return NULL_TREE;
2094 /* Detect constant argument. */
2095 arg = get_constant_value (gimple_call_arg (stmt, 0));
2096 if (arg == NULL_TREE
2097 || TREE_CODE (arg) != INTEGER_CST
2098 || !tree_fits_uhwi_p (arg))
2099 return NULL_TREE;
2101 size = tree_to_uhwi (arg);
2103 /* Heuristic: don't fold large allocas. */
2104 threshold = (unsigned HOST_WIDE_INT)PARAM_VALUE (PARAM_LARGE_STACK_FRAME);
2105 /* In case the alloca is located at function entry, it has the same lifetime
2106 as a declared array, so we allow a larger size. */
2107 block = gimple_block (stmt);
2108 if (!(cfun->after_inlining
2109 && block
2110 && TREE_CODE (BLOCK_SUPERCONTEXT (block)) == FUNCTION_DECL))
2111 threshold /= 10;
2112 if (size > threshold)
2113 return NULL_TREE;
2115 /* Declare array. */
2116 elem_type = build_nonstandard_integer_type (BITS_PER_UNIT, 1);
2117 n_elem = size * 8 / BITS_PER_UNIT;
2118 array_type = build_array_type_nelts (elem_type, n_elem);
2119 var = create_tmp_var (array_type);
2120 SET_DECL_ALIGN (var, TREE_INT_CST_LOW (gimple_call_arg (stmt, 1)));
2122 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (lhs);
2123 if (pi != NULL && !pi->pt.anything)
2125 bool singleton_p;
2126 unsigned uid;
2127 singleton_p = pt_solution_singleton_p (&pi->pt, &uid);
2128 gcc_assert (singleton_p);
2129 SET_DECL_PT_UID (var, uid);
2133 /* Fold alloca to the address of the array. */
2134 return fold_convert (TREE_TYPE (lhs), build_fold_addr_expr (var));
2137 /* Fold the stmt at *GSI with CCP specific information that propagating
2138 and regular folding does not catch. */
2140 static bool
2141 ccp_fold_stmt (gimple_stmt_iterator *gsi)
2143 gimple *stmt = gsi_stmt (*gsi);
2145 switch (gimple_code (stmt))
2147 case GIMPLE_COND:
2149 gcond *cond_stmt = as_a <gcond *> (stmt);
2150 ccp_prop_value_t val;
2151 /* Statement evaluation will handle type mismatches in constants
2152 more gracefully than the final propagation. This allows us to
2153 fold more conditionals here. */
2154 val = evaluate_stmt (stmt);
2155 if (val.lattice_val != CONSTANT
2156 || val.mask != 0)
2157 return false;
2159 if (dump_file)
2161 fprintf (dump_file, "Folding predicate ");
2162 print_gimple_expr (dump_file, stmt, 0, 0);
2163 fprintf (dump_file, " to ");
2164 print_generic_expr (dump_file, val.value, 0);
2165 fprintf (dump_file, "\n");
2168 if (integer_zerop (val.value))
2169 gimple_cond_make_false (cond_stmt);
2170 else
2171 gimple_cond_make_true (cond_stmt);
2173 return true;
2176 case GIMPLE_CALL:
2178 tree lhs = gimple_call_lhs (stmt);
2179 int flags = gimple_call_flags (stmt);
2180 tree val;
2181 tree argt;
2182 bool changed = false;
2183 unsigned i;
2185 /* If the call was folded into a constant make sure it goes
2186 away even if we cannot propagate into all uses because of
2187 type issues. */
2188 if (lhs
2189 && TREE_CODE (lhs) == SSA_NAME
2190 && (val = get_constant_value (lhs))
2191 /* Don't optimize away calls that have side-effects. */
2192 && (flags & (ECF_CONST|ECF_PURE)) != 0
2193 && (flags & ECF_LOOPING_CONST_OR_PURE) == 0)
2195 tree new_rhs = unshare_expr (val);
2196 bool res;
2197 if (!useless_type_conversion_p (TREE_TYPE (lhs),
2198 TREE_TYPE (new_rhs)))
2199 new_rhs = fold_convert (TREE_TYPE (lhs), new_rhs);
2200 res = update_call_from_tree (gsi, new_rhs);
2201 gcc_assert (res);
2202 return true;
2205 /* Internal calls provide no argument types, so the extra laxity
2206 for normal calls does not apply. */
2207 if (gimple_call_internal_p (stmt))
2208 return false;
2210 /* The heuristic of fold_builtin_alloca_with_align differs before and
2211 after inlining, so we don't require the arg to be changed into a
2212 constant for folding, but just to be constant. */
2213 if (gimple_call_builtin_p (stmt, BUILT_IN_ALLOCA_WITH_ALIGN))
2215 tree new_rhs = fold_builtin_alloca_with_align (stmt);
2216 if (new_rhs)
2218 bool res = update_call_from_tree (gsi, new_rhs);
2219 tree var = TREE_OPERAND (TREE_OPERAND (new_rhs, 0),0);
2220 gcc_assert (res);
2221 insert_clobbers_for_var (*gsi, var);
2222 return true;
2226 /* Propagate into the call arguments. Compared to replace_uses_in
2227 this can use the argument slot types for type verification
2228 instead of the current argument type. We also can safely
2229 drop qualifiers here as we are dealing with constants anyway. */
2230 argt = TYPE_ARG_TYPES (gimple_call_fntype (stmt));
2231 for (i = 0; i < gimple_call_num_args (stmt) && argt;
2232 ++i, argt = TREE_CHAIN (argt))
2234 tree arg = gimple_call_arg (stmt, i);
2235 if (TREE_CODE (arg) == SSA_NAME
2236 && (val = get_constant_value (arg))
2237 && useless_type_conversion_p
2238 (TYPE_MAIN_VARIANT (TREE_VALUE (argt)),
2239 TYPE_MAIN_VARIANT (TREE_TYPE (val))))
2241 gimple_call_set_arg (stmt, i, unshare_expr (val));
2242 changed = true;
2246 return changed;
2249 case GIMPLE_ASSIGN:
2251 tree lhs = gimple_assign_lhs (stmt);
2252 tree val;
2254 /* If we have a load that turned out to be constant replace it
2255 as we cannot propagate into all uses in all cases. */
2256 if (gimple_assign_single_p (stmt)
2257 && TREE_CODE (lhs) == SSA_NAME
2258 && (val = get_constant_value (lhs)))
2260 tree rhs = unshare_expr (val);
2261 if (!useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (rhs)))
2262 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (lhs), rhs);
2263 gimple_assign_set_rhs_from_tree (gsi, rhs);
2264 return true;
2267 return false;
2270 default:
2271 return false;
2275 /* Visit the assignment statement STMT. Set the value of its LHS to the
2276 value computed by the RHS and store LHS in *OUTPUT_P. If STMT
2277 creates virtual definitions, set the value of each new name to that
2278 of the RHS (if we can derive a constant out of the RHS).
2279 Value-returning call statements also perform an assignment, and
2280 are handled here. */
2282 static enum ssa_prop_result
2283 visit_assignment (gimple *stmt, tree *output_p)
2285 ccp_prop_value_t val;
2286 enum ssa_prop_result retval = SSA_PROP_NOT_INTERESTING;
2288 tree lhs = gimple_get_lhs (stmt);
2289 if (TREE_CODE (lhs) == SSA_NAME)
2291 /* Evaluate the statement, which could be
2292 either a GIMPLE_ASSIGN or a GIMPLE_CALL. */
2293 val = evaluate_stmt (stmt);
2295 /* If STMT is an assignment to an SSA_NAME, we only have one
2296 value to set. */
2297 if (set_lattice_value (lhs, &val))
2299 *output_p = lhs;
2300 if (val.lattice_val == VARYING)
2301 retval = SSA_PROP_VARYING;
2302 else
2303 retval = SSA_PROP_INTERESTING;
2307 return retval;
2311 /* Visit the conditional statement STMT. Return SSA_PROP_INTERESTING
2312 if it can determine which edge will be taken. Otherwise, return
2313 SSA_PROP_VARYING. */
2315 static enum ssa_prop_result
2316 visit_cond_stmt (gimple *stmt, edge *taken_edge_p)
2318 ccp_prop_value_t val;
2319 basic_block block;
2321 block = gimple_bb (stmt);
2322 val = evaluate_stmt (stmt);
2323 if (val.lattice_val != CONSTANT
2324 || val.mask != 0)
2325 return SSA_PROP_VARYING;
2327 /* Find which edge out of the conditional block will be taken and add it
2328 to the worklist. If no single edge can be determined statically,
2329 return SSA_PROP_VARYING to feed all the outgoing edges to the
2330 propagation engine. */
2331 *taken_edge_p = find_taken_edge (block, val.value);
2332 if (*taken_edge_p)
2333 return SSA_PROP_INTERESTING;
2334 else
2335 return SSA_PROP_VARYING;
2339 /* Evaluate statement STMT. If the statement produces an output value and
2340 its evaluation changes the lattice value of its output, return
2341 SSA_PROP_INTERESTING and set *OUTPUT_P to the SSA_NAME holding the
2342 output value.
2344 If STMT is a conditional branch and we can determine its truth
2345 value, set *TAKEN_EDGE_P accordingly. If STMT produces a varying
2346 value, return SSA_PROP_VARYING. */
2348 static enum ssa_prop_result
2349 ccp_visit_stmt (gimple *stmt, edge *taken_edge_p, tree *output_p)
2351 tree def;
2352 ssa_op_iter iter;
2354 if (dump_file && (dump_flags & TDF_DETAILS))
2356 fprintf (dump_file, "\nVisiting statement:\n");
2357 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
2360 switch (gimple_code (stmt))
2362 case GIMPLE_ASSIGN:
2363 /* If the statement is an assignment that produces a single
2364 output value, evaluate its RHS to see if the lattice value of
2365 its output has changed. */
2366 return visit_assignment (stmt, output_p);
2368 case GIMPLE_CALL:
2369 /* A value-returning call also performs an assignment. */
2370 if (gimple_call_lhs (stmt) != NULL_TREE)
2371 return visit_assignment (stmt, output_p);
2372 break;
2374 case GIMPLE_COND:
2375 case GIMPLE_SWITCH:
2376 /* If STMT is a conditional branch, see if we can determine
2377 which branch will be taken. */
2378 /* FIXME. It appears that we should be able to optimize
2379 computed GOTOs here as well. */
2380 return visit_cond_stmt (stmt, taken_edge_p);
2382 default:
2383 break;
2386 /* Any other kind of statement is not interesting for constant
2387 propagation and, therefore, not worth simulating. */
2388 if (dump_file && (dump_flags & TDF_DETAILS))
2389 fprintf (dump_file, "No interesting values produced. Marked VARYING.\n");
2391 /* Definitions made by statements other than assignments to
2392 SSA_NAMEs represent unknown modifications to their outputs.
2393 Mark them VARYING. */
2394 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
2395 set_value_varying (def);
2397 return SSA_PROP_VARYING;
2401 /* Main entry point for SSA Conditional Constant Propagation. If NONZERO_P,
2402 record nonzero bits. */
2404 static unsigned int
2405 do_ssa_ccp (bool nonzero_p)
2407 unsigned int todo = 0;
2408 calculate_dominance_info (CDI_DOMINATORS);
2410 ccp_initialize ();
2411 ssa_propagate (ccp_visit_stmt, ccp_visit_phi_node);
2412 if (ccp_finalize (nonzero_p))
2414 todo = (TODO_cleanup_cfg | TODO_update_ssa);
2416 /* ccp_finalize does not preserve loop-closed ssa. */
2417 loops_state_clear (LOOP_CLOSED_SSA);
2420 free_dominance_info (CDI_DOMINATORS);
2421 return todo;
2425 namespace {
2427 const pass_data pass_data_ccp =
2429 GIMPLE_PASS, /* type */
2430 "ccp", /* name */
2431 OPTGROUP_NONE, /* optinfo_flags */
2432 TV_TREE_CCP, /* tv_id */
2433 ( PROP_cfg | PROP_ssa ), /* properties_required */
2434 0, /* properties_provided */
2435 0, /* properties_destroyed */
2436 0, /* todo_flags_start */
2437 TODO_update_address_taken, /* todo_flags_finish */
2440 class pass_ccp : public gimple_opt_pass
2442 public:
2443 pass_ccp (gcc::context *ctxt)
2444 : gimple_opt_pass (pass_data_ccp, ctxt), nonzero_p (false)
2447 /* opt_pass methods: */
2448 opt_pass * clone () { return new pass_ccp (m_ctxt); }
2449 void set_pass_param (unsigned int n, bool param)
2451 gcc_assert (n == 0);
2452 nonzero_p = param;
2454 virtual bool gate (function *) { return flag_tree_ccp != 0; }
2455 virtual unsigned int execute (function *) { return do_ssa_ccp (nonzero_p); }
2457 private:
2458 /* Determines whether the pass instance records nonzero bits. */
2459 bool nonzero_p;
2460 }; // class pass_ccp
2462 } // anon namespace
2464 gimple_opt_pass *
2465 make_pass_ccp (gcc::context *ctxt)
2467 return new pass_ccp (ctxt);
2472 /* Try to optimize out __builtin_stack_restore. Optimize it out
2473 if there is another __builtin_stack_restore in the same basic
2474 block and no calls or ASM_EXPRs are in between, or if this block's
2475 only outgoing edge is to EXIT_BLOCK and there are no calls or
2476 ASM_EXPRs after this __builtin_stack_restore. */
2478 static tree
2479 optimize_stack_restore (gimple_stmt_iterator i)
2481 tree callee;
2482 gimple *stmt;
2484 basic_block bb = gsi_bb (i);
2485 gimple *call = gsi_stmt (i);
2487 if (gimple_code (call) != GIMPLE_CALL
2488 || gimple_call_num_args (call) != 1
2489 || TREE_CODE (gimple_call_arg (call, 0)) != SSA_NAME
2490 || !POINTER_TYPE_P (TREE_TYPE (gimple_call_arg (call, 0))))
2491 return NULL_TREE;
2493 for (gsi_next (&i); !gsi_end_p (i); gsi_next (&i))
2495 stmt = gsi_stmt (i);
2496 if (gimple_code (stmt) == GIMPLE_ASM)
2497 return NULL_TREE;
2498 if (gimple_code (stmt) != GIMPLE_CALL)
2499 continue;
2501 callee = gimple_call_fndecl (stmt);
2502 if (!callee
2503 || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL
2504 /* All regular builtins are ok, just obviously not alloca. */
2505 || DECL_FUNCTION_CODE (callee) == BUILT_IN_ALLOCA
2506 || DECL_FUNCTION_CODE (callee) == BUILT_IN_ALLOCA_WITH_ALIGN)
2507 return NULL_TREE;
2509 if (DECL_FUNCTION_CODE (callee) == BUILT_IN_STACK_RESTORE)
2510 goto second_stack_restore;
2513 if (!gsi_end_p (i))
2514 return NULL_TREE;
2516 /* Allow one successor of the exit block, or zero successors. */
2517 switch (EDGE_COUNT (bb->succs))
2519 case 0:
2520 break;
2521 case 1:
2522 if (single_succ_edge (bb)->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
2523 return NULL_TREE;
2524 break;
2525 default:
2526 return NULL_TREE;
2528 second_stack_restore:
2530 /* If there's exactly one use, then zap the call to __builtin_stack_save.
2531 If there are multiple uses, then the last one should remove the call.
2532 In any case, whether the call to __builtin_stack_save can be removed
2533 or not is irrelevant to removing the call to __builtin_stack_restore. */
2534 if (has_single_use (gimple_call_arg (call, 0)))
2536 gimple *stack_save = SSA_NAME_DEF_STMT (gimple_call_arg (call, 0));
2537 if (is_gimple_call (stack_save))
2539 callee = gimple_call_fndecl (stack_save);
2540 if (callee
2541 && DECL_BUILT_IN_CLASS (callee) == BUILT_IN_NORMAL
2542 && DECL_FUNCTION_CODE (callee) == BUILT_IN_STACK_SAVE)
2544 gimple_stmt_iterator stack_save_gsi;
2545 tree rhs;
2547 stack_save_gsi = gsi_for_stmt (stack_save);
2548 rhs = build_int_cst (TREE_TYPE (gimple_call_arg (call, 0)), 0);
2549 update_call_from_tree (&stack_save_gsi, rhs);
2554 /* No effect, so the statement will be deleted. */
2555 return integer_zero_node;
2558 /* If va_list type is a simple pointer and nothing special is needed,
2559 optimize __builtin_va_start (&ap, 0) into ap = __builtin_next_arg (0),
2560 __builtin_va_end (&ap) out as NOP and __builtin_va_copy into a simple
2561 pointer assignment. */
2563 static tree
2564 optimize_stdarg_builtin (gimple *call)
2566 tree callee, lhs, rhs, cfun_va_list;
2567 bool va_list_simple_ptr;
2568 location_t loc = gimple_location (call);
2570 if (gimple_code (call) != GIMPLE_CALL)
2571 return NULL_TREE;
2573 callee = gimple_call_fndecl (call);
2575 cfun_va_list = targetm.fn_abi_va_list (callee);
2576 va_list_simple_ptr = POINTER_TYPE_P (cfun_va_list)
2577 && (TREE_TYPE (cfun_va_list) == void_type_node
2578 || TREE_TYPE (cfun_va_list) == char_type_node);
2580 switch (DECL_FUNCTION_CODE (callee))
2582 case BUILT_IN_VA_START:
2583 if (!va_list_simple_ptr
2584 || targetm.expand_builtin_va_start != NULL
2585 || !builtin_decl_explicit_p (BUILT_IN_NEXT_ARG))
2586 return NULL_TREE;
2588 if (gimple_call_num_args (call) != 2)
2589 return NULL_TREE;
2591 lhs = gimple_call_arg (call, 0);
2592 if (!POINTER_TYPE_P (TREE_TYPE (lhs))
2593 || TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (lhs)))
2594 != TYPE_MAIN_VARIANT (cfun_va_list))
2595 return NULL_TREE;
2597 lhs = build_fold_indirect_ref_loc (loc, lhs);
2598 rhs = build_call_expr_loc (loc, builtin_decl_explicit (BUILT_IN_NEXT_ARG),
2599 1, integer_zero_node);
2600 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
2601 return build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, rhs);
2603 case BUILT_IN_VA_COPY:
2604 if (!va_list_simple_ptr)
2605 return NULL_TREE;
2607 if (gimple_call_num_args (call) != 2)
2608 return NULL_TREE;
2610 lhs = gimple_call_arg (call, 0);
2611 if (!POINTER_TYPE_P (TREE_TYPE (lhs))
2612 || TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (lhs)))
2613 != TYPE_MAIN_VARIANT (cfun_va_list))
2614 return NULL_TREE;
2616 lhs = build_fold_indirect_ref_loc (loc, lhs);
2617 rhs = gimple_call_arg (call, 1);
2618 if (TYPE_MAIN_VARIANT (TREE_TYPE (rhs))
2619 != TYPE_MAIN_VARIANT (cfun_va_list))
2620 return NULL_TREE;
2622 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
2623 return build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, rhs);
2625 case BUILT_IN_VA_END:
2626 /* No effect, so the statement will be deleted. */
2627 return integer_zero_node;
2629 default:
2630 gcc_unreachable ();
2634 /* Attemp to make the block of __builtin_unreachable I unreachable by changing
2635 the incoming jumps. Return true if at least one jump was changed. */
2637 static bool
2638 optimize_unreachable (gimple_stmt_iterator i)
2640 basic_block bb = gsi_bb (i);
2641 gimple_stmt_iterator gsi;
2642 gimple *stmt;
2643 edge_iterator ei;
2644 edge e;
2645 bool ret;
2647 if (flag_sanitize & SANITIZE_UNREACHABLE)
2648 return false;
2650 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2652 stmt = gsi_stmt (gsi);
2654 if (is_gimple_debug (stmt))
2655 continue;
2657 if (glabel *label_stmt = dyn_cast <glabel *> (stmt))
2659 /* Verify we do not need to preserve the label. */
2660 if (FORCED_LABEL (gimple_label_label (label_stmt)))
2661 return false;
2663 continue;
2666 /* Only handle the case that __builtin_unreachable is the first statement
2667 in the block. We rely on DCE to remove stmts without side-effects
2668 before __builtin_unreachable. */
2669 if (gsi_stmt (gsi) != gsi_stmt (i))
2670 return false;
2673 ret = false;
2674 FOR_EACH_EDGE (e, ei, bb->preds)
2676 gsi = gsi_last_bb (e->src);
2677 if (gsi_end_p (gsi))
2678 continue;
2680 stmt = gsi_stmt (gsi);
2681 if (gcond *cond_stmt = dyn_cast <gcond *> (stmt))
2683 if (e->flags & EDGE_TRUE_VALUE)
2684 gimple_cond_make_false (cond_stmt);
2685 else if (e->flags & EDGE_FALSE_VALUE)
2686 gimple_cond_make_true (cond_stmt);
2687 else
2688 gcc_unreachable ();
2689 update_stmt (cond_stmt);
2691 else
2693 /* Todo: handle other cases, f.i. switch statement. */
2694 continue;
2697 ret = true;
2700 return ret;
2703 /* Optimize
2704 mask_2 = 1 << cnt_1;
2705 _4 = __atomic_fetch_or_* (ptr_6, mask_2, _3);
2706 _5 = _4 & mask_2;
2708 _4 = ATOMIC_BIT_TEST_AND_SET (ptr_6, cnt_1, 0, _3);
2709 _5 = _4;
2710 If _5 is only used in _5 != 0 or _5 == 0 comparisons, 1
2711 is passed instead of 0, and the builtin just returns a zero
2712 or 1 value instead of the actual bit.
2713 Similarly for __sync_fetch_and_or_* (without the ", _3" part
2714 in there), and/or if mask_2 is a power of 2 constant.
2715 Similarly for xor instead of or, use ATOMIC_BIT_TEST_AND_COMPLEMENT
2716 in that case. And similarly for and instead of or, except that
2717 the second argument to the builtin needs to be one's complement
2718 of the mask instead of mask. */
2720 static void
2721 optimize_atomic_bit_test_and (gimple_stmt_iterator *gsip,
2722 enum internal_fn fn, bool has_model_arg,
2723 bool after)
2725 gimple *call = gsi_stmt (*gsip);
2726 tree lhs = gimple_call_lhs (call);
2727 use_operand_p use_p;
2728 gimple *use_stmt;
2729 tree mask, bit;
2730 optab optab;
2732 if (!flag_inline_atomics
2733 || optimize_debug
2734 || !gimple_call_builtin_p (call, BUILT_IN_NORMAL)
2735 || !lhs
2736 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs)
2737 || !single_imm_use (lhs, &use_p, &use_stmt)
2738 || !is_gimple_assign (use_stmt)
2739 || gimple_assign_rhs_code (use_stmt) != BIT_AND_EXPR
2740 || !gimple_vdef (call))
2741 return;
2743 switch (fn)
2745 case IFN_ATOMIC_BIT_TEST_AND_SET:
2746 optab = atomic_bit_test_and_set_optab;
2747 break;
2748 case IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT:
2749 optab = atomic_bit_test_and_complement_optab;
2750 break;
2751 case IFN_ATOMIC_BIT_TEST_AND_RESET:
2752 optab = atomic_bit_test_and_reset_optab;
2753 break;
2754 default:
2755 return;
2758 if (optab_handler (optab, TYPE_MODE (TREE_TYPE (lhs))) == CODE_FOR_nothing)
2759 return;
2761 mask = gimple_call_arg (call, 1);
2762 tree use_lhs = gimple_assign_lhs (use_stmt);
2763 if (!use_lhs)
2764 return;
2766 if (TREE_CODE (mask) == INTEGER_CST)
2768 if (fn == IFN_ATOMIC_BIT_TEST_AND_RESET)
2769 mask = const_unop (BIT_NOT_EXPR, TREE_TYPE (mask), mask);
2770 mask = fold_convert (TREE_TYPE (lhs), mask);
2771 int ibit = tree_log2 (mask);
2772 if (ibit < 0)
2773 return;
2774 bit = build_int_cst (TREE_TYPE (lhs), ibit);
2776 else if (TREE_CODE (mask) == SSA_NAME)
2778 gimple *g = SSA_NAME_DEF_STMT (mask);
2779 if (fn == IFN_ATOMIC_BIT_TEST_AND_RESET)
2781 if (!is_gimple_assign (g)
2782 || gimple_assign_rhs_code (g) != BIT_NOT_EXPR)
2783 return;
2784 mask = gimple_assign_rhs1 (g);
2785 if (TREE_CODE (mask) != SSA_NAME)
2786 return;
2787 g = SSA_NAME_DEF_STMT (mask);
2789 if (!is_gimple_assign (g)
2790 || gimple_assign_rhs_code (g) != LSHIFT_EXPR
2791 || !integer_onep (gimple_assign_rhs1 (g)))
2792 return;
2793 bit = gimple_assign_rhs2 (g);
2795 else
2796 return;
2798 if (gimple_assign_rhs1 (use_stmt) == lhs)
2800 if (!operand_equal_p (gimple_assign_rhs2 (use_stmt), mask, 0))
2801 return;
2803 else if (gimple_assign_rhs2 (use_stmt) != lhs
2804 || !operand_equal_p (gimple_assign_rhs1 (use_stmt), mask, 0))
2805 return;
2807 bool use_bool = true;
2808 bool has_debug_uses = false;
2809 imm_use_iterator iter;
2810 gimple *g;
2812 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (use_lhs))
2813 use_bool = false;
2814 FOR_EACH_IMM_USE_STMT (g, iter, use_lhs)
2816 enum tree_code code = ERROR_MARK;
2817 tree op0, op1;
2818 if (is_gimple_debug (g))
2820 has_debug_uses = true;
2821 continue;
2823 else if (is_gimple_assign (g))
2824 switch (gimple_assign_rhs_code (g))
2826 case COND_EXPR:
2827 op1 = gimple_assign_rhs1 (g);
2828 code = TREE_CODE (op1);
2829 op0 = TREE_OPERAND (op1, 0);
2830 op1 = TREE_OPERAND (op1, 1);
2831 break;
2832 case EQ_EXPR:
2833 case NE_EXPR:
2834 code = gimple_assign_rhs_code (g);
2835 op0 = gimple_assign_rhs1 (g);
2836 op1 = gimple_assign_rhs2 (g);
2837 break;
2838 default:
2839 break;
2841 else if (gimple_code (g) == GIMPLE_COND)
2843 code = gimple_cond_code (g);
2844 op0 = gimple_cond_lhs (g);
2845 op1 = gimple_cond_rhs (g);
2848 if ((code == EQ_EXPR || code == NE_EXPR)
2849 && op0 == use_lhs
2850 && integer_zerop (op1))
2852 use_operand_p use_p;
2853 int n = 0;
2854 FOR_EACH_IMM_USE_ON_STMT (use_p, iter)
2855 n++;
2856 if (n == 1)
2857 continue;
2860 use_bool = false;
2861 BREAK_FROM_IMM_USE_STMT (iter);
2864 tree new_lhs = make_ssa_name (TREE_TYPE (lhs));
2865 tree flag = build_int_cst (TREE_TYPE (lhs), use_bool);
2866 if (has_model_arg)
2867 g = gimple_build_call_internal (fn, 4, gimple_call_arg (call, 0),
2868 bit, flag, gimple_call_arg (call, 2));
2869 else
2870 g = gimple_build_call_internal (fn, 3, gimple_call_arg (call, 0),
2871 bit, flag);
2872 gimple_call_set_lhs (g, new_lhs);
2873 gimple_set_location (g, gimple_location (call));
2874 gimple_set_vuse (g, gimple_vuse (call));
2875 gimple_set_vdef (g, gimple_vdef (call));
2876 SSA_NAME_DEF_STMT (gimple_vdef (call)) = g;
2877 gimple_stmt_iterator gsi = *gsip;
2878 gsi_insert_after (&gsi, g, GSI_NEW_STMT);
2879 if (after)
2881 /* The internal function returns the value of the specified bit
2882 before the atomic operation. If we are interested in the value
2883 of the specified bit after the atomic operation (makes only sense
2884 for xor, otherwise the bit content is compile time known),
2885 we need to invert the bit. */
2886 g = gimple_build_assign (make_ssa_name (TREE_TYPE (lhs)),
2887 BIT_XOR_EXPR, new_lhs,
2888 use_bool ? build_int_cst (TREE_TYPE (lhs), 1)
2889 : mask);
2890 new_lhs = gimple_assign_lhs (g);
2891 gsi_insert_after (&gsi, g, GSI_NEW_STMT);
2893 if (use_bool && has_debug_uses)
2895 tree temp = make_node (DEBUG_EXPR_DECL);
2896 DECL_ARTIFICIAL (temp) = 1;
2897 TREE_TYPE (temp) = TREE_TYPE (lhs);
2898 DECL_MODE (temp) = TYPE_MODE (TREE_TYPE (lhs));
2899 tree t = build2 (LSHIFT_EXPR, TREE_TYPE (lhs), new_lhs, bit);
2900 g = gimple_build_debug_bind (temp, t, g);
2901 gsi_insert_after (&gsi, g, GSI_NEW_STMT);
2902 FOR_EACH_IMM_USE_STMT (g, iter, use_lhs)
2903 if (is_gimple_debug (g))
2905 use_operand_p use_p;
2906 FOR_EACH_IMM_USE_ON_STMT (use_p, iter)
2907 SET_USE (use_p, temp);
2908 update_stmt (g);
2911 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_lhs)
2912 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (use_lhs);
2913 replace_uses_by (use_lhs, new_lhs);
2914 gsi = gsi_for_stmt (use_stmt);
2915 gsi_remove (&gsi, true);
2916 release_defs (use_stmt);
2917 gsi_remove (gsip, true);
2918 release_ssa_name (lhs);
2921 /* A simple pass that attempts to fold all builtin functions. This pass
2922 is run after we've propagated as many constants as we can. */
2924 namespace {
2926 const pass_data pass_data_fold_builtins =
2928 GIMPLE_PASS, /* type */
2929 "fab", /* name */
2930 OPTGROUP_NONE, /* optinfo_flags */
2931 TV_NONE, /* tv_id */
2932 ( PROP_cfg | PROP_ssa ), /* properties_required */
2933 0, /* properties_provided */
2934 0, /* properties_destroyed */
2935 0, /* todo_flags_start */
2936 TODO_update_ssa, /* todo_flags_finish */
2939 class pass_fold_builtins : public gimple_opt_pass
2941 public:
2942 pass_fold_builtins (gcc::context *ctxt)
2943 : gimple_opt_pass (pass_data_fold_builtins, ctxt)
2946 /* opt_pass methods: */
2947 opt_pass * clone () { return new pass_fold_builtins (m_ctxt); }
2948 virtual unsigned int execute (function *);
2950 }; // class pass_fold_builtins
2952 unsigned int
2953 pass_fold_builtins::execute (function *fun)
2955 bool cfg_changed = false;
2956 basic_block bb;
2957 unsigned int todoflags = 0;
2959 FOR_EACH_BB_FN (bb, fun)
2961 gimple_stmt_iterator i;
2962 for (i = gsi_start_bb (bb); !gsi_end_p (i); )
2964 gimple *stmt, *old_stmt;
2965 tree callee;
2966 enum built_in_function fcode;
2968 stmt = gsi_stmt (i);
2970 if (gimple_code (stmt) != GIMPLE_CALL)
2972 /* Remove all *ssaname_N ={v} {CLOBBER}; stmts,
2973 after the last GIMPLE DSE they aren't needed and might
2974 unnecessarily keep the SSA_NAMEs live. */
2975 if (gimple_clobber_p (stmt))
2977 tree lhs = gimple_assign_lhs (stmt);
2978 if (TREE_CODE (lhs) == MEM_REF
2979 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
2981 unlink_stmt_vdef (stmt);
2982 gsi_remove (&i, true);
2983 release_defs (stmt);
2984 continue;
2987 gsi_next (&i);
2988 continue;
2991 callee = gimple_call_fndecl (stmt);
2992 if (!callee || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL)
2994 gsi_next (&i);
2995 continue;
2998 fcode = DECL_FUNCTION_CODE (callee);
2999 if (fold_stmt (&i))
3001 else
3003 tree result = NULL_TREE;
3004 switch (DECL_FUNCTION_CODE (callee))
3006 case BUILT_IN_CONSTANT_P:
3007 /* Resolve __builtin_constant_p. If it hasn't been
3008 folded to integer_one_node by now, it's fairly
3009 certain that the value simply isn't constant. */
3010 result = integer_zero_node;
3011 break;
3013 case BUILT_IN_ASSUME_ALIGNED:
3014 /* Remove __builtin_assume_aligned. */
3015 result = gimple_call_arg (stmt, 0);
3016 break;
3018 case BUILT_IN_STACK_RESTORE:
3019 result = optimize_stack_restore (i);
3020 if (result)
3021 break;
3022 gsi_next (&i);
3023 continue;
3025 case BUILT_IN_UNREACHABLE:
3026 if (optimize_unreachable (i))
3027 cfg_changed = true;
3028 break;
3030 case BUILT_IN_ATOMIC_FETCH_OR_1:
3031 case BUILT_IN_ATOMIC_FETCH_OR_2:
3032 case BUILT_IN_ATOMIC_FETCH_OR_4:
3033 case BUILT_IN_ATOMIC_FETCH_OR_8:
3034 case BUILT_IN_ATOMIC_FETCH_OR_16:
3035 optimize_atomic_bit_test_and (&i,
3036 IFN_ATOMIC_BIT_TEST_AND_SET,
3037 true, false);
3038 break;
3039 case BUILT_IN_SYNC_FETCH_AND_OR_1:
3040 case BUILT_IN_SYNC_FETCH_AND_OR_2:
3041 case BUILT_IN_SYNC_FETCH_AND_OR_4:
3042 case BUILT_IN_SYNC_FETCH_AND_OR_8:
3043 case BUILT_IN_SYNC_FETCH_AND_OR_16:
3044 optimize_atomic_bit_test_and (&i,
3045 IFN_ATOMIC_BIT_TEST_AND_SET,
3046 false, false);
3047 break;
3049 case BUILT_IN_ATOMIC_FETCH_XOR_1:
3050 case BUILT_IN_ATOMIC_FETCH_XOR_2:
3051 case BUILT_IN_ATOMIC_FETCH_XOR_4:
3052 case BUILT_IN_ATOMIC_FETCH_XOR_8:
3053 case BUILT_IN_ATOMIC_FETCH_XOR_16:
3054 optimize_atomic_bit_test_and
3055 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, true, false);
3056 break;
3057 case BUILT_IN_SYNC_FETCH_AND_XOR_1:
3058 case BUILT_IN_SYNC_FETCH_AND_XOR_2:
3059 case BUILT_IN_SYNC_FETCH_AND_XOR_4:
3060 case BUILT_IN_SYNC_FETCH_AND_XOR_8:
3061 case BUILT_IN_SYNC_FETCH_AND_XOR_16:
3062 optimize_atomic_bit_test_and
3063 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, false, false);
3064 break;
3066 case BUILT_IN_ATOMIC_XOR_FETCH_1:
3067 case BUILT_IN_ATOMIC_XOR_FETCH_2:
3068 case BUILT_IN_ATOMIC_XOR_FETCH_4:
3069 case BUILT_IN_ATOMIC_XOR_FETCH_8:
3070 case BUILT_IN_ATOMIC_XOR_FETCH_16:
3071 optimize_atomic_bit_test_and
3072 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, true, true);
3073 break;
3074 case BUILT_IN_SYNC_XOR_AND_FETCH_1:
3075 case BUILT_IN_SYNC_XOR_AND_FETCH_2:
3076 case BUILT_IN_SYNC_XOR_AND_FETCH_4:
3077 case BUILT_IN_SYNC_XOR_AND_FETCH_8:
3078 case BUILT_IN_SYNC_XOR_AND_FETCH_16:
3079 optimize_atomic_bit_test_and
3080 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, false, true);
3081 break;
3083 case BUILT_IN_ATOMIC_FETCH_AND_1:
3084 case BUILT_IN_ATOMIC_FETCH_AND_2:
3085 case BUILT_IN_ATOMIC_FETCH_AND_4:
3086 case BUILT_IN_ATOMIC_FETCH_AND_8:
3087 case BUILT_IN_ATOMIC_FETCH_AND_16:
3088 optimize_atomic_bit_test_and (&i,
3089 IFN_ATOMIC_BIT_TEST_AND_RESET,
3090 true, false);
3091 break;
3092 case BUILT_IN_SYNC_FETCH_AND_AND_1:
3093 case BUILT_IN_SYNC_FETCH_AND_AND_2:
3094 case BUILT_IN_SYNC_FETCH_AND_AND_4:
3095 case BUILT_IN_SYNC_FETCH_AND_AND_8:
3096 case BUILT_IN_SYNC_FETCH_AND_AND_16:
3097 optimize_atomic_bit_test_and (&i,
3098 IFN_ATOMIC_BIT_TEST_AND_RESET,
3099 false, false);
3100 break;
3102 case BUILT_IN_VA_START:
3103 case BUILT_IN_VA_END:
3104 case BUILT_IN_VA_COPY:
3105 /* These shouldn't be folded before pass_stdarg. */
3106 result = optimize_stdarg_builtin (stmt);
3107 if (result)
3108 break;
3109 /* FALLTHRU */
3111 default:;
3114 if (!result)
3116 gsi_next (&i);
3117 continue;
3120 if (!update_call_from_tree (&i, result))
3121 gimplify_and_update_call_from_tree (&i, result);
3124 todoflags |= TODO_update_address_taken;
3126 if (dump_file && (dump_flags & TDF_DETAILS))
3128 fprintf (dump_file, "Simplified\n ");
3129 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
3132 old_stmt = stmt;
3133 stmt = gsi_stmt (i);
3134 update_stmt (stmt);
3136 if (maybe_clean_or_replace_eh_stmt (old_stmt, stmt)
3137 && gimple_purge_dead_eh_edges (bb))
3138 cfg_changed = true;
3140 if (dump_file && (dump_flags & TDF_DETAILS))
3142 fprintf (dump_file, "to\n ");
3143 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
3144 fprintf (dump_file, "\n");
3147 /* Retry the same statement if it changed into another
3148 builtin, there might be new opportunities now. */
3149 if (gimple_code (stmt) != GIMPLE_CALL)
3151 gsi_next (&i);
3152 continue;
3154 callee = gimple_call_fndecl (stmt);
3155 if (!callee
3156 || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL
3157 || DECL_FUNCTION_CODE (callee) == fcode)
3158 gsi_next (&i);
3162 /* Delete unreachable blocks. */
3163 if (cfg_changed)
3164 todoflags |= TODO_cleanup_cfg;
3166 return todoflags;
3169 } // anon namespace
3171 gimple_opt_pass *
3172 make_pass_fold_builtins (gcc::context *ctxt)
3174 return new pass_fold_builtins (ctxt);