* config/i386/i386.h (TARGET_SUPPORTS_WIDE_INT): New define.
[official-gcc.git] / gcc / tree-ssa-ccp.c
blobebd493d50e78684e48d6bd647339c244464f1573
1 /* Conditional constant propagation pass for the GNU compiler.
2 Copyright (C) 2000-2015 Free Software Foundation, Inc.
3 Adapted from original RTL SSA-CCP by Daniel Berlin <dberlin@dberlin.org>
4 Adapted to GIMPLE trees by Diego Novillo <dnovillo@redhat.com>
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it
9 under the terms of the GNU General Public License as published by the
10 Free Software Foundation; either version 3, or (at your option) any
11 later version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT
14 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 /* Conditional constant propagation (CCP) is based on the SSA
23 propagation engine (tree-ssa-propagate.c). Constant assignments of
24 the form VAR = CST are propagated from the assignments into uses of
25 VAR, which in turn may generate new constants. The simulation uses
26 a four level lattice to keep track of constant values associated
27 with SSA names. Given an SSA name V_i, it may take one of the
28 following values:
30 UNINITIALIZED -> the initial state of the value. This value
31 is replaced with a correct initial value
32 the first time the value is used, so the
33 rest of the pass does not need to care about
34 it. Using this value simplifies initialization
35 of the pass, and prevents us from needlessly
36 scanning statements that are never reached.
38 UNDEFINED -> V_i is a local variable whose definition
39 has not been processed yet. Therefore we
40 don't yet know if its value is a constant
41 or not.
43 CONSTANT -> V_i has been found to hold a constant
44 value C.
46 VARYING -> V_i cannot take a constant value, or if it
47 does, it is not possible to determine it
48 at compile time.
50 The core of SSA-CCP is in ccp_visit_stmt and ccp_visit_phi_node:
52 1- In ccp_visit_stmt, we are interested in assignments whose RHS
53 evaluates into a constant and conditional jumps whose predicate
54 evaluates into a boolean true or false. When an assignment of
55 the form V_i = CONST is found, V_i's lattice value is set to
56 CONSTANT and CONST is associated with it. This causes the
57 propagation engine to add all the SSA edges coming out the
58 assignment into the worklists, so that statements that use V_i
59 can be visited.
61 If the statement is a conditional with a constant predicate, we
62 mark the outgoing edges as executable or not executable
63 depending on the predicate's value. This is then used when
64 visiting PHI nodes to know when a PHI argument can be ignored.
67 2- In ccp_visit_phi_node, if all the PHI arguments evaluate to the
68 same constant C, then the LHS of the PHI is set to C. This
69 evaluation is known as the "meet operation". Since one of the
70 goals of this evaluation is to optimistically return constant
71 values as often as possible, it uses two main short cuts:
73 - If an argument is flowing in through a non-executable edge, it
74 is ignored. This is useful in cases like this:
76 if (PRED)
77 a_9 = 3;
78 else
79 a_10 = 100;
80 a_11 = PHI (a_9, a_10)
82 If PRED is known to always evaluate to false, then we can
83 assume that a_11 will always take its value from a_10, meaning
84 that instead of consider it VARYING (a_9 and a_10 have
85 different values), we can consider it CONSTANT 100.
87 - If an argument has an UNDEFINED value, then it does not affect
88 the outcome of the meet operation. If a variable V_i has an
89 UNDEFINED value, it means that either its defining statement
90 hasn't been visited yet or V_i has no defining statement, in
91 which case the original symbol 'V' is being used
92 uninitialized. Since 'V' is a local variable, the compiler
93 may assume any initial value for it.
96 After propagation, every variable V_i that ends up with a lattice
97 value of CONSTANT will have the associated constant value in the
98 array CONST_VAL[i].VALUE. That is fed into substitute_and_fold for
99 final substitution and folding.
101 This algorithm uses wide-ints at the max precision of the target.
102 This means that, with one uninteresting exception, variables with
103 UNSIGNED types never go to VARYING because the bits above the
104 precision of the type of the variable are always zero. The
105 uninteresting case is a variable of UNSIGNED type that has the
106 maximum precision of the target. Such variables can go to VARYING,
107 but this causes no loss of infomation since these variables will
108 never be extended.
110 References:
112 Constant propagation with conditional branches,
113 Wegman and Zadeck, ACM TOPLAS 13(2):181-210.
115 Building an Optimizing Compiler,
116 Robert Morgan, Butterworth-Heinemann, 1998, Section 8.9.
118 Advanced Compiler Design and Implementation,
119 Steven Muchnick, Morgan Kaufmann, 1997, Section 12.6 */
121 #include "config.h"
122 #include "system.h"
123 #include "coretypes.h"
124 #include "tm.h"
125 #include "hash-set.h"
126 #include "machmode.h"
127 #include "vec.h"
128 #include "double-int.h"
129 #include "input.h"
130 #include "alias.h"
131 #include "symtab.h"
132 #include "wide-int.h"
133 #include "inchash.h"
134 #include "real.h"
135 #include "tree.h"
136 #include "fold-const.h"
137 #include "stor-layout.h"
138 #include "flags.h"
139 #include "tm_p.h"
140 #include "predict.h"
141 #include "hard-reg-set.h"
142 #include "input.h"
143 #include "function.h"
144 #include "dominance.h"
145 #include "cfg.h"
146 #include "basic-block.h"
147 #include "gimple-pretty-print.h"
148 #include "hash-table.h"
149 #include "tree-ssa-alias.h"
150 #include "internal-fn.h"
151 #include "gimple-fold.h"
152 #include "tree-eh.h"
153 #include "gimple-expr.h"
154 #include "is-a.h"
155 #include "gimple.h"
156 #include "gimplify.h"
157 #include "gimple-iterator.h"
158 #include "gimple-ssa.h"
159 #include "tree-cfg.h"
160 #include "tree-phinodes.h"
161 #include "ssa-iterators.h"
162 #include "stringpool.h"
163 #include "tree-ssanames.h"
164 #include "tree-pass.h"
165 #include "tree-ssa-propagate.h"
166 #include "value-prof.h"
167 #include "langhooks.h"
168 #include "target.h"
169 #include "diagnostic-core.h"
170 #include "dbgcnt.h"
171 #include "params.h"
172 #include "wide-int-print.h"
173 #include "builtins.h"
174 #include "tree-chkp.h"
177 /* Possible lattice values. */
178 typedef enum
180 UNINITIALIZED,
181 UNDEFINED,
182 CONSTANT,
183 VARYING
184 } ccp_lattice_t;
186 struct ccp_prop_value_t {
187 /* Lattice value. */
188 ccp_lattice_t lattice_val;
190 /* Propagated value. */
191 tree value;
193 /* Mask that applies to the propagated value during CCP. For X
194 with a CONSTANT lattice value X & ~mask == value & ~mask. The
195 zero bits in the mask cover constant values. The ones mean no
196 information. */
197 widest_int mask;
200 /* Array of propagated constant values. After propagation,
201 CONST_VAL[I].VALUE holds the constant value for SSA_NAME(I). If
202 the constant is held in an SSA name representing a memory store
203 (i.e., a VDEF), CONST_VAL[I].MEM_REF will contain the actual
204 memory reference used to store (i.e., the LHS of the assignment
205 doing the store). */
206 static ccp_prop_value_t *const_val;
207 static unsigned n_const_val;
209 static void canonicalize_value (ccp_prop_value_t *);
210 static bool ccp_fold_stmt (gimple_stmt_iterator *);
211 static void ccp_lattice_meet (ccp_prop_value_t *, ccp_prop_value_t *);
213 /* Dump constant propagation value VAL to file OUTF prefixed by PREFIX. */
215 static void
216 dump_lattice_value (FILE *outf, const char *prefix, ccp_prop_value_t val)
218 switch (val.lattice_val)
220 case UNINITIALIZED:
221 fprintf (outf, "%sUNINITIALIZED", prefix);
222 break;
223 case UNDEFINED:
224 fprintf (outf, "%sUNDEFINED", prefix);
225 break;
226 case VARYING:
227 fprintf (outf, "%sVARYING", prefix);
228 break;
229 case CONSTANT:
230 if (TREE_CODE (val.value) != INTEGER_CST
231 || val.mask == 0)
233 fprintf (outf, "%sCONSTANT ", prefix);
234 print_generic_expr (outf, val.value, dump_flags);
236 else
238 widest_int cval = wi::bit_and_not (wi::to_widest (val.value),
239 val.mask);
240 fprintf (outf, "%sCONSTANT ", prefix);
241 print_hex (cval, outf);
242 fprintf (outf, " (");
243 print_hex (val.mask, outf);
244 fprintf (outf, ")");
246 break;
247 default:
248 gcc_unreachable ();
253 /* Print lattice value VAL to stderr. */
255 void debug_lattice_value (ccp_prop_value_t val);
257 DEBUG_FUNCTION void
258 debug_lattice_value (ccp_prop_value_t val)
260 dump_lattice_value (stderr, "", val);
261 fprintf (stderr, "\n");
264 /* Extend NONZERO_BITS to a full mask, with the upper bits being set. */
266 static widest_int
267 extend_mask (const wide_int &nonzero_bits)
269 return (wi::mask <widest_int> (wi::get_precision (nonzero_bits), true)
270 | widest_int::from (nonzero_bits, UNSIGNED));
273 /* Compute a default value for variable VAR and store it in the
274 CONST_VAL array. The following rules are used to get default
275 values:
277 1- Global and static variables that are declared constant are
278 considered CONSTANT.
280 2- Any other value is considered UNDEFINED. This is useful when
281 considering PHI nodes. PHI arguments that are undefined do not
282 change the constant value of the PHI node, which allows for more
283 constants to be propagated.
285 3- Variables defined by statements other than assignments and PHI
286 nodes are considered VARYING.
288 4- Initial values of variables that are not GIMPLE registers are
289 considered VARYING. */
291 static ccp_prop_value_t
292 get_default_value (tree var)
294 ccp_prop_value_t val = { UNINITIALIZED, NULL_TREE, 0 };
295 gimple stmt;
297 stmt = SSA_NAME_DEF_STMT (var);
299 if (gimple_nop_p (stmt))
301 /* Variables defined by an empty statement are those used
302 before being initialized. If VAR is a local variable, we
303 can assume initially that it is UNDEFINED, otherwise we must
304 consider it VARYING. */
305 if (!virtual_operand_p (var)
306 && TREE_CODE (SSA_NAME_VAR (var)) == VAR_DECL)
307 val.lattice_val = UNDEFINED;
308 else
310 val.lattice_val = VARYING;
311 val.mask = -1;
312 if (flag_tree_bit_ccp)
314 wide_int nonzero_bits = get_nonzero_bits (var);
315 if (nonzero_bits != -1)
317 val.lattice_val = CONSTANT;
318 val.value = build_zero_cst (TREE_TYPE (var));
319 val.mask = extend_mask (nonzero_bits);
324 else if (is_gimple_assign (stmt))
326 tree cst;
327 if (gimple_assign_single_p (stmt)
328 && DECL_P (gimple_assign_rhs1 (stmt))
329 && (cst = get_symbol_constant_value (gimple_assign_rhs1 (stmt))))
331 val.lattice_val = CONSTANT;
332 val.value = cst;
334 else
336 /* Any other variable defined by an assignment is considered
337 UNDEFINED. */
338 val.lattice_val = UNDEFINED;
341 else if ((is_gimple_call (stmt)
342 && gimple_call_lhs (stmt) != NULL_TREE)
343 || gimple_code (stmt) == GIMPLE_PHI)
345 /* A variable defined by a call or a PHI node is considered
346 UNDEFINED. */
347 val.lattice_val = UNDEFINED;
349 else
351 /* Otherwise, VAR will never take on a constant value. */
352 val.lattice_val = VARYING;
353 val.mask = -1;
356 return val;
360 /* Get the constant value associated with variable VAR. */
362 static inline ccp_prop_value_t *
363 get_value (tree var)
365 ccp_prop_value_t *val;
367 if (const_val == NULL
368 || SSA_NAME_VERSION (var) >= n_const_val)
369 return NULL;
371 val = &const_val[SSA_NAME_VERSION (var)];
372 if (val->lattice_val == UNINITIALIZED)
373 *val = get_default_value (var);
375 canonicalize_value (val);
377 return val;
380 /* Return the constant tree value associated with VAR. */
382 static inline tree
383 get_constant_value (tree var)
385 ccp_prop_value_t *val;
386 if (TREE_CODE (var) != SSA_NAME)
388 if (is_gimple_min_invariant (var))
389 return var;
390 return NULL_TREE;
392 val = get_value (var);
393 if (val
394 && val->lattice_val == CONSTANT
395 && (TREE_CODE (val->value) != INTEGER_CST
396 || val->mask == 0))
397 return val->value;
398 return NULL_TREE;
401 /* Sets the value associated with VAR to VARYING. */
403 static inline void
404 set_value_varying (tree var)
406 ccp_prop_value_t *val = &const_val[SSA_NAME_VERSION (var)];
408 val->lattice_val = VARYING;
409 val->value = NULL_TREE;
410 val->mask = -1;
413 /* For integer constants, make sure to drop TREE_OVERFLOW. */
415 static void
416 canonicalize_value (ccp_prop_value_t *val)
418 if (val->lattice_val != CONSTANT)
419 return;
421 if (TREE_OVERFLOW_P (val->value))
422 val->value = drop_tree_overflow (val->value);
425 /* Return whether the lattice transition is valid. */
427 static bool
428 valid_lattice_transition (ccp_prop_value_t old_val, ccp_prop_value_t new_val)
430 /* Lattice transitions must always be monotonically increasing in
431 value. */
432 if (old_val.lattice_val < new_val.lattice_val)
433 return true;
435 if (old_val.lattice_val != new_val.lattice_val)
436 return false;
438 if (!old_val.value && !new_val.value)
439 return true;
441 /* Now both lattice values are CONSTANT. */
443 /* Allow arbitrary copy changes as we might look through PHI <a_1, ...>
444 when only a single copy edge is executable. */
445 if (TREE_CODE (old_val.value) == SSA_NAME
446 && TREE_CODE (new_val.value) == SSA_NAME)
447 return true;
449 /* Allow transitioning from a constant to a copy. */
450 if (is_gimple_min_invariant (old_val.value)
451 && TREE_CODE (new_val.value) == SSA_NAME)
452 return true;
454 /* Allow transitioning from PHI <&x, not executable> == &x
455 to PHI <&x, &y> == common alignment. */
456 if (TREE_CODE (old_val.value) != INTEGER_CST
457 && TREE_CODE (new_val.value) == INTEGER_CST)
458 return true;
460 /* Bit-lattices have to agree in the still valid bits. */
461 if (TREE_CODE (old_val.value) == INTEGER_CST
462 && TREE_CODE (new_val.value) == INTEGER_CST)
463 return (wi::bit_and_not (wi::to_widest (old_val.value), new_val.mask)
464 == wi::bit_and_not (wi::to_widest (new_val.value), new_val.mask));
466 /* Otherwise constant values have to agree. */
467 if (operand_equal_p (old_val.value, new_val.value, 0))
468 return true;
470 /* At least the kinds and types should agree now. */
471 if (TREE_CODE (old_val.value) != TREE_CODE (new_val.value)
472 || !types_compatible_p (TREE_TYPE (old_val.value),
473 TREE_TYPE (new_val.value)))
474 return false;
476 /* For floats and !HONOR_NANS allow transitions from (partial) NaN
477 to non-NaN. */
478 tree type = TREE_TYPE (new_val.value);
479 if (SCALAR_FLOAT_TYPE_P (type)
480 && !HONOR_NANS (type))
482 if (REAL_VALUE_ISNAN (TREE_REAL_CST (old_val.value)))
483 return true;
485 else if (VECTOR_FLOAT_TYPE_P (type)
486 && !HONOR_NANS (type))
488 for (unsigned i = 0; i < VECTOR_CST_NELTS (old_val.value); ++i)
489 if (!REAL_VALUE_ISNAN
490 (TREE_REAL_CST (VECTOR_CST_ELT (old_val.value, i)))
491 && !operand_equal_p (VECTOR_CST_ELT (old_val.value, i),
492 VECTOR_CST_ELT (new_val.value, i), 0))
493 return false;
494 return true;
496 else if (COMPLEX_FLOAT_TYPE_P (type)
497 && !HONOR_NANS (type))
499 if (!REAL_VALUE_ISNAN (TREE_REAL_CST (TREE_REALPART (old_val.value)))
500 && !operand_equal_p (TREE_REALPART (old_val.value),
501 TREE_REALPART (new_val.value), 0))
502 return false;
503 if (!REAL_VALUE_ISNAN (TREE_REAL_CST (TREE_IMAGPART (old_val.value)))
504 && !operand_equal_p (TREE_IMAGPART (old_val.value),
505 TREE_IMAGPART (new_val.value), 0))
506 return false;
507 return true;
509 return false;
512 /* Set the value for variable VAR to NEW_VAL. Return true if the new
513 value is different from VAR's previous value. */
515 static bool
516 set_lattice_value (tree var, ccp_prop_value_t *new_val)
518 /* We can deal with old UNINITIALIZED values just fine here. */
519 ccp_prop_value_t *old_val = &const_val[SSA_NAME_VERSION (var)];
521 canonicalize_value (new_val);
523 /* We have to be careful to not go up the bitwise lattice
524 represented by the mask. Instead of dropping to VARYING
525 use the meet operator to retain a conservative value.
526 Missed optimizations like PR65851 makes this necessary.
527 It also ensures we converge to a stable lattice solution. */
528 if (new_val->lattice_val == CONSTANT
529 && old_val->lattice_val == CONSTANT
530 && TREE_CODE (new_val->value) != SSA_NAME)
531 ccp_lattice_meet (new_val, old_val);
533 gcc_checking_assert (valid_lattice_transition (*old_val, *new_val));
535 /* If *OLD_VAL and NEW_VAL are the same, return false to inform the
536 caller that this was a non-transition. */
537 if (old_val->lattice_val != new_val->lattice_val
538 || (new_val->lattice_val == CONSTANT
539 && (TREE_CODE (new_val->value) != TREE_CODE (old_val->value)
540 || (TREE_CODE (new_val->value) == INTEGER_CST
541 && (new_val->mask != old_val->mask
542 || (wi::bit_and_not (wi::to_widest (old_val->value),
543 new_val->mask)
544 != wi::bit_and_not (wi::to_widest (new_val->value),
545 new_val->mask))))
546 || (TREE_CODE (new_val->value) != INTEGER_CST
547 && !operand_equal_p (new_val->value, old_val->value, 0)))))
549 /* ??? We would like to delay creation of INTEGER_CSTs from
550 partially constants here. */
552 if (dump_file && (dump_flags & TDF_DETAILS))
554 dump_lattice_value (dump_file, "Lattice value changed to ", *new_val);
555 fprintf (dump_file, ". Adding SSA edges to worklist.\n");
558 *old_val = *new_val;
560 gcc_assert (new_val->lattice_val != UNINITIALIZED);
561 return true;
564 return false;
567 static ccp_prop_value_t get_value_for_expr (tree, bool);
568 static ccp_prop_value_t bit_value_binop (enum tree_code, tree, tree, tree);
569 static void bit_value_binop_1 (enum tree_code, tree, widest_int *, widest_int *,
570 tree, const widest_int &, const widest_int &,
571 tree, const widest_int &, const widest_int &);
573 /* Return a widest_int that can be used for bitwise simplifications
574 from VAL. */
576 static widest_int
577 value_to_wide_int (ccp_prop_value_t val)
579 if (val.value
580 && TREE_CODE (val.value) == INTEGER_CST)
581 return wi::to_widest (val.value);
583 return 0;
586 /* Return the value for the address expression EXPR based on alignment
587 information. */
589 static ccp_prop_value_t
590 get_value_from_alignment (tree expr)
592 tree type = TREE_TYPE (expr);
593 ccp_prop_value_t val;
594 unsigned HOST_WIDE_INT bitpos;
595 unsigned int align;
597 gcc_assert (TREE_CODE (expr) == ADDR_EXPR);
599 get_pointer_alignment_1 (expr, &align, &bitpos);
600 val.mask = (POINTER_TYPE_P (type) || TYPE_UNSIGNED (type)
601 ? wi::mask <widest_int> (TYPE_PRECISION (type), false)
602 : -1).and_not (align / BITS_PER_UNIT - 1);
603 val.lattice_val
604 = wi::sext (val.mask, TYPE_PRECISION (type)) == -1 ? VARYING : CONSTANT;
605 if (val.lattice_val == CONSTANT)
606 val.value = build_int_cstu (type, bitpos / BITS_PER_UNIT);
607 else
608 val.value = NULL_TREE;
610 return val;
613 /* Return the value for the tree operand EXPR. If FOR_BITS_P is true
614 return constant bits extracted from alignment information for
615 invariant addresses. */
617 static ccp_prop_value_t
618 get_value_for_expr (tree expr, bool for_bits_p)
620 ccp_prop_value_t val;
622 if (TREE_CODE (expr) == SSA_NAME)
624 val = *get_value (expr);
625 if (for_bits_p
626 && val.lattice_val == CONSTANT
627 && TREE_CODE (val.value) == ADDR_EXPR)
628 val = get_value_from_alignment (val.value);
629 /* Fall back to a copy value. */
630 if (!for_bits_p
631 && val.lattice_val == VARYING
632 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (expr))
634 val.lattice_val = CONSTANT;
635 val.value = expr;
636 val.mask = -1;
639 else if (is_gimple_min_invariant (expr)
640 && (!for_bits_p || TREE_CODE (expr) != ADDR_EXPR))
642 val.lattice_val = CONSTANT;
643 val.value = expr;
644 val.mask = 0;
645 canonicalize_value (&val);
647 else if (TREE_CODE (expr) == ADDR_EXPR)
648 val = get_value_from_alignment (expr);
649 else
651 val.lattice_val = VARYING;
652 val.mask = -1;
653 val.value = NULL_TREE;
655 return val;
658 /* Return the likely CCP lattice value for STMT.
660 If STMT has no operands, then return CONSTANT.
662 Else if undefinedness of operands of STMT cause its value to be
663 undefined, then return UNDEFINED.
665 Else if any operands of STMT are constants, then return CONSTANT.
667 Else return VARYING. */
669 static ccp_lattice_t
670 likely_value (gimple stmt)
672 bool has_constant_operand, has_undefined_operand, all_undefined_operands;
673 bool has_nsa_operand;
674 tree use;
675 ssa_op_iter iter;
676 unsigned i;
678 enum gimple_code code = gimple_code (stmt);
680 /* This function appears to be called only for assignments, calls,
681 conditionals, and switches, due to the logic in visit_stmt. */
682 gcc_assert (code == GIMPLE_ASSIGN
683 || code == GIMPLE_CALL
684 || code == GIMPLE_COND
685 || code == GIMPLE_SWITCH);
687 /* If the statement has volatile operands, it won't fold to a
688 constant value. */
689 if (gimple_has_volatile_ops (stmt))
690 return VARYING;
692 /* Arrive here for more complex cases. */
693 has_constant_operand = false;
694 has_undefined_operand = false;
695 all_undefined_operands = true;
696 has_nsa_operand = false;
697 FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
699 ccp_prop_value_t *val = get_value (use);
701 if (val->lattice_val == UNDEFINED)
702 has_undefined_operand = true;
703 else
704 all_undefined_operands = false;
706 if (val->lattice_val == CONSTANT)
707 has_constant_operand = true;
709 if (SSA_NAME_IS_DEFAULT_DEF (use)
710 || !prop_simulate_again_p (SSA_NAME_DEF_STMT (use)))
711 has_nsa_operand = true;
714 /* There may be constants in regular rhs operands. For calls we
715 have to ignore lhs, fndecl and static chain, otherwise only
716 the lhs. */
717 for (i = (is_gimple_call (stmt) ? 2 : 0) + gimple_has_lhs (stmt);
718 i < gimple_num_ops (stmt); ++i)
720 tree op = gimple_op (stmt, i);
721 if (!op || TREE_CODE (op) == SSA_NAME)
722 continue;
723 if (is_gimple_min_invariant (op))
724 has_constant_operand = true;
727 if (has_constant_operand)
728 all_undefined_operands = false;
730 if (has_undefined_operand
731 && code == GIMPLE_CALL
732 && gimple_call_internal_p (stmt))
733 switch (gimple_call_internal_fn (stmt))
735 /* These 3 builtins use the first argument just as a magic
736 way how to find out a decl uid. */
737 case IFN_GOMP_SIMD_LANE:
738 case IFN_GOMP_SIMD_VF:
739 case IFN_GOMP_SIMD_LAST_LANE:
740 has_undefined_operand = false;
741 break;
742 default:
743 break;
746 /* If the operation combines operands like COMPLEX_EXPR make sure to
747 not mark the result UNDEFINED if only one part of the result is
748 undefined. */
749 if (has_undefined_operand && all_undefined_operands)
750 return UNDEFINED;
751 else if (code == GIMPLE_ASSIGN && has_undefined_operand)
753 switch (gimple_assign_rhs_code (stmt))
755 /* Unary operators are handled with all_undefined_operands. */
756 case PLUS_EXPR:
757 case MINUS_EXPR:
758 case POINTER_PLUS_EXPR:
759 /* Not MIN_EXPR, MAX_EXPR. One VARYING operand may be selected.
760 Not bitwise operators, one VARYING operand may specify the
761 result completely. Not logical operators for the same reason.
762 Not COMPLEX_EXPR as one VARYING operand makes the result partly
763 not UNDEFINED. Not *DIV_EXPR, comparisons and shifts because
764 the undefined operand may be promoted. */
765 return UNDEFINED;
767 case ADDR_EXPR:
768 /* If any part of an address is UNDEFINED, like the index
769 of an ARRAY_EXPR, then treat the result as UNDEFINED. */
770 return UNDEFINED;
772 default:
776 /* If there was an UNDEFINED operand but the result may be not UNDEFINED
777 fall back to CONSTANT. During iteration UNDEFINED may still drop
778 to CONSTANT. */
779 if (has_undefined_operand)
780 return CONSTANT;
782 /* We do not consider virtual operands here -- load from read-only
783 memory may have only VARYING virtual operands, but still be
784 constant. Also we can combine the stmt with definitions from
785 operands whose definitions are not simulated again. */
786 if (has_constant_operand
787 || has_nsa_operand
788 || gimple_references_memory_p (stmt))
789 return CONSTANT;
791 return VARYING;
794 /* Returns true if STMT cannot be constant. */
796 static bool
797 surely_varying_stmt_p (gimple stmt)
799 /* If the statement has operands that we cannot handle, it cannot be
800 constant. */
801 if (gimple_has_volatile_ops (stmt))
802 return true;
804 /* If it is a call and does not return a value or is not a
805 builtin and not an indirect call or a call to function with
806 assume_aligned/alloc_align attribute, it is varying. */
807 if (is_gimple_call (stmt))
809 tree fndecl, fntype = gimple_call_fntype (stmt);
810 if (!gimple_call_lhs (stmt)
811 || ((fndecl = gimple_call_fndecl (stmt)) != NULL_TREE
812 && !DECL_BUILT_IN (fndecl)
813 && !lookup_attribute ("assume_aligned",
814 TYPE_ATTRIBUTES (fntype))
815 && !lookup_attribute ("alloc_align",
816 TYPE_ATTRIBUTES (fntype))))
817 return true;
820 /* Any other store operation is not interesting. */
821 else if (gimple_vdef (stmt))
822 return true;
824 /* Anything other than assignments and conditional jumps are not
825 interesting for CCP. */
826 if (gimple_code (stmt) != GIMPLE_ASSIGN
827 && gimple_code (stmt) != GIMPLE_COND
828 && gimple_code (stmt) != GIMPLE_SWITCH
829 && gimple_code (stmt) != GIMPLE_CALL)
830 return true;
832 return false;
835 /* Initialize local data structures for CCP. */
837 static void
838 ccp_initialize (void)
840 basic_block bb;
842 n_const_val = num_ssa_names;
843 const_val = XCNEWVEC (ccp_prop_value_t, n_const_val);
845 /* Initialize simulation flags for PHI nodes and statements. */
846 FOR_EACH_BB_FN (bb, cfun)
848 gimple_stmt_iterator i;
850 for (i = gsi_start_bb (bb); !gsi_end_p (i); gsi_next (&i))
852 gimple stmt = gsi_stmt (i);
853 bool is_varying;
855 /* If the statement is a control insn, then we do not
856 want to avoid simulating the statement once. Failure
857 to do so means that those edges will never get added. */
858 if (stmt_ends_bb_p (stmt))
859 is_varying = false;
860 else
861 is_varying = surely_varying_stmt_p (stmt);
863 if (is_varying)
865 tree def;
866 ssa_op_iter iter;
868 /* If the statement will not produce a constant, mark
869 all its outputs VARYING. */
870 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
871 set_value_varying (def);
873 prop_set_simulate_again (stmt, !is_varying);
877 /* Now process PHI nodes. We never clear the simulate_again flag on
878 phi nodes, since we do not know which edges are executable yet,
879 except for phi nodes for virtual operands when we do not do store ccp. */
880 FOR_EACH_BB_FN (bb, cfun)
882 gphi_iterator i;
884 for (i = gsi_start_phis (bb); !gsi_end_p (i); gsi_next (&i))
886 gphi *phi = i.phi ();
888 if (virtual_operand_p (gimple_phi_result (phi)))
889 prop_set_simulate_again (phi, false);
890 else
891 prop_set_simulate_again (phi, true);
896 /* Debug count support. Reset the values of ssa names
897 VARYING when the total number ssa names analyzed is
898 beyond the debug count specified. */
900 static void
901 do_dbg_cnt (void)
903 unsigned i;
904 for (i = 0; i < num_ssa_names; i++)
906 if (!dbg_cnt (ccp))
908 const_val[i].lattice_val = VARYING;
909 const_val[i].mask = -1;
910 const_val[i].value = NULL_TREE;
916 /* Do final substitution of propagated values, cleanup the flowgraph and
917 free allocated storage.
919 Return TRUE when something was optimized. */
921 static bool
922 ccp_finalize (void)
924 bool something_changed;
925 unsigned i;
927 do_dbg_cnt ();
929 /* Derive alignment and misalignment information from partially
930 constant pointers in the lattice or nonzero bits from partially
931 constant integers. */
932 for (i = 1; i < num_ssa_names; ++i)
934 tree name = ssa_name (i);
935 ccp_prop_value_t *val;
936 unsigned int tem, align;
938 if (!name
939 || (!POINTER_TYPE_P (TREE_TYPE (name))
940 && (!INTEGRAL_TYPE_P (TREE_TYPE (name))
941 /* Don't record nonzero bits before IPA to avoid
942 using too much memory. */
943 || first_pass_instance)))
944 continue;
946 val = get_value (name);
947 if (val->lattice_val != CONSTANT
948 || TREE_CODE (val->value) != INTEGER_CST)
949 continue;
951 if (POINTER_TYPE_P (TREE_TYPE (name)))
953 /* Trailing mask bits specify the alignment, trailing value
954 bits the misalignment. */
955 tem = val->mask.to_uhwi ();
956 align = (tem & -tem);
957 if (align > 1)
958 set_ptr_info_alignment (get_ptr_info (name), align,
959 (TREE_INT_CST_LOW (val->value)
960 & (align - 1)));
962 else
964 unsigned int precision = TYPE_PRECISION (TREE_TYPE (val->value));
965 wide_int nonzero_bits = wide_int::from (val->mask, precision,
966 UNSIGNED) | val->value;
967 nonzero_bits &= get_nonzero_bits (name);
968 set_nonzero_bits (name, nonzero_bits);
972 /* Perform substitutions based on the known constant values. */
973 something_changed = substitute_and_fold (get_constant_value,
974 ccp_fold_stmt, true);
976 free (const_val);
977 const_val = NULL;
978 return something_changed;;
982 /* Compute the meet operator between *VAL1 and *VAL2. Store the result
983 in VAL1.
985 any M UNDEFINED = any
986 any M VARYING = VARYING
987 Ci M Cj = Ci if (i == j)
988 Ci M Cj = VARYING if (i != j)
991 static void
992 ccp_lattice_meet (ccp_prop_value_t *val1, ccp_prop_value_t *val2)
994 if (val1->lattice_val == UNDEFINED
995 /* For UNDEFINED M SSA we can't always SSA because its definition
996 may not dominate the PHI node. Doing optimistic copy propagation
997 also causes a lot of gcc.dg/uninit-pred*.c FAILs. */
998 && (val2->lattice_val != CONSTANT
999 || TREE_CODE (val2->value) != SSA_NAME))
1001 /* UNDEFINED M any = any */
1002 *val1 = *val2;
1004 else if (val2->lattice_val == UNDEFINED
1005 /* See above. */
1006 && (val1->lattice_val != CONSTANT
1007 || TREE_CODE (val1->value) != SSA_NAME))
1009 /* any M UNDEFINED = any
1010 Nothing to do. VAL1 already contains the value we want. */
1013 else if (val1->lattice_val == VARYING
1014 || val2->lattice_val == VARYING)
1016 /* any M VARYING = VARYING. */
1017 val1->lattice_val = VARYING;
1018 val1->mask = -1;
1019 val1->value = NULL_TREE;
1021 else if (val1->lattice_val == CONSTANT
1022 && val2->lattice_val == CONSTANT
1023 && TREE_CODE (val1->value) == INTEGER_CST
1024 && TREE_CODE (val2->value) == INTEGER_CST)
1026 /* Ci M Cj = Ci if (i == j)
1027 Ci M Cj = VARYING if (i != j)
1029 For INTEGER_CSTs mask unequal bits. If no equal bits remain,
1030 drop to varying. */
1031 val1->mask = (val1->mask | val2->mask
1032 | (wi::to_widest (val1->value)
1033 ^ wi::to_widest (val2->value)));
1034 if (wi::sext (val1->mask, TYPE_PRECISION (TREE_TYPE (val1->value))) == -1)
1036 val1->lattice_val = VARYING;
1037 val1->value = NULL_TREE;
1040 else if (val1->lattice_val == CONSTANT
1041 && val2->lattice_val == CONSTANT
1042 && operand_equal_p (val1->value, val2->value, 0))
1044 /* Ci M Cj = Ci if (i == j)
1045 Ci M Cj = VARYING if (i != j)
1047 VAL1 already contains the value we want for equivalent values. */
1049 else if (val1->lattice_val == CONSTANT
1050 && val2->lattice_val == CONSTANT
1051 && (TREE_CODE (val1->value) == ADDR_EXPR
1052 || TREE_CODE (val2->value) == ADDR_EXPR))
1054 /* When not equal addresses are involved try meeting for
1055 alignment. */
1056 ccp_prop_value_t tem = *val2;
1057 if (TREE_CODE (val1->value) == ADDR_EXPR)
1058 *val1 = get_value_for_expr (val1->value, true);
1059 if (TREE_CODE (val2->value) == ADDR_EXPR)
1060 tem = get_value_for_expr (val2->value, true);
1061 ccp_lattice_meet (val1, &tem);
1063 else
1065 /* Any other combination is VARYING. */
1066 val1->lattice_val = VARYING;
1067 val1->mask = -1;
1068 val1->value = NULL_TREE;
1073 /* Loop through the PHI_NODE's parameters for BLOCK and compare their
1074 lattice values to determine PHI_NODE's lattice value. The value of a
1075 PHI node is determined calling ccp_lattice_meet with all the arguments
1076 of the PHI node that are incoming via executable edges. */
1078 static enum ssa_prop_result
1079 ccp_visit_phi_node (gphi *phi)
1081 unsigned i;
1082 ccp_prop_value_t new_val;
1084 if (dump_file && (dump_flags & TDF_DETAILS))
1086 fprintf (dump_file, "\nVisiting PHI node: ");
1087 print_gimple_stmt (dump_file, phi, 0, dump_flags);
1090 new_val.lattice_val = UNDEFINED;
1091 new_val.value = NULL_TREE;
1092 new_val.mask = 0;
1094 bool first = true;
1095 for (i = 0; i < gimple_phi_num_args (phi); i++)
1097 /* Compute the meet operator over all the PHI arguments flowing
1098 through executable edges. */
1099 edge e = gimple_phi_arg_edge (phi, i);
1101 if (dump_file && (dump_flags & TDF_DETAILS))
1103 fprintf (dump_file,
1104 "\n Argument #%d (%d -> %d %sexecutable)\n",
1105 i, e->src->index, e->dest->index,
1106 (e->flags & EDGE_EXECUTABLE) ? "" : "not ");
1109 /* If the incoming edge is executable, Compute the meet operator for
1110 the existing value of the PHI node and the current PHI argument. */
1111 if (e->flags & EDGE_EXECUTABLE)
1113 tree arg = gimple_phi_arg (phi, i)->def;
1114 ccp_prop_value_t arg_val = get_value_for_expr (arg, false);
1116 if (first)
1118 new_val = arg_val;
1119 first = false;
1121 else
1122 ccp_lattice_meet (&new_val, &arg_val);
1124 if (dump_file && (dump_flags & TDF_DETAILS))
1126 fprintf (dump_file, "\t");
1127 print_generic_expr (dump_file, arg, dump_flags);
1128 dump_lattice_value (dump_file, "\tValue: ", arg_val);
1129 fprintf (dump_file, "\n");
1132 if (new_val.lattice_val == VARYING)
1133 break;
1137 if (dump_file && (dump_flags & TDF_DETAILS))
1139 dump_lattice_value (dump_file, "\n PHI node value: ", new_val);
1140 fprintf (dump_file, "\n\n");
1143 /* Make the transition to the new value. */
1144 if (set_lattice_value (gimple_phi_result (phi), &new_val))
1146 if (new_val.lattice_val == VARYING)
1147 return SSA_PROP_VARYING;
1148 else
1149 return SSA_PROP_INTERESTING;
1151 else
1152 return SSA_PROP_NOT_INTERESTING;
1155 /* Return the constant value for OP or OP otherwise. */
1157 static tree
1158 valueize_op (tree op)
1160 if (TREE_CODE (op) == SSA_NAME)
1162 tree tem = get_constant_value (op);
1163 if (tem)
1164 return tem;
1166 return op;
1169 /* Return the constant value for OP, but signal to not follow SSA
1170 edges if the definition may be simulated again. */
1172 static tree
1173 valueize_op_1 (tree op)
1175 if (TREE_CODE (op) == SSA_NAME)
1177 /* If the definition may be simulated again we cannot follow
1178 this SSA edge as the SSA propagator does not necessarily
1179 re-visit the use. */
1180 gimple def_stmt = SSA_NAME_DEF_STMT (op);
1181 if (!gimple_nop_p (def_stmt)
1182 && prop_simulate_again_p (def_stmt))
1183 return NULL_TREE;
1184 tree tem = get_constant_value (op);
1185 if (tem)
1186 return tem;
1188 return op;
1191 /* CCP specific front-end to the non-destructive constant folding
1192 routines.
1194 Attempt to simplify the RHS of STMT knowing that one or more
1195 operands are constants.
1197 If simplification is possible, return the simplified RHS,
1198 otherwise return the original RHS or NULL_TREE. */
1200 static tree
1201 ccp_fold (gimple stmt)
1203 location_t loc = gimple_location (stmt);
1204 switch (gimple_code (stmt))
1206 case GIMPLE_COND:
1208 /* Handle comparison operators that can appear in GIMPLE form. */
1209 tree op0 = valueize_op (gimple_cond_lhs (stmt));
1210 tree op1 = valueize_op (gimple_cond_rhs (stmt));
1211 enum tree_code code = gimple_cond_code (stmt);
1212 return fold_binary_loc (loc, code, boolean_type_node, op0, op1);
1215 case GIMPLE_SWITCH:
1217 /* Return the constant switch index. */
1218 return valueize_op (gimple_switch_index (as_a <gswitch *> (stmt)));
1221 case GIMPLE_ASSIGN:
1222 case GIMPLE_CALL:
1223 return gimple_fold_stmt_to_constant_1 (stmt,
1224 valueize_op, valueize_op_1);
1226 default:
1227 gcc_unreachable ();
1231 /* Apply the operation CODE in type TYPE to the value, mask pair
1232 RVAL and RMASK representing a value of type RTYPE and set
1233 the value, mask pair *VAL and *MASK to the result. */
1235 static void
1236 bit_value_unop_1 (enum tree_code code, tree type,
1237 widest_int *val, widest_int *mask,
1238 tree rtype, const widest_int &rval, const widest_int &rmask)
1240 switch (code)
1242 case BIT_NOT_EXPR:
1243 *mask = rmask;
1244 *val = ~rval;
1245 break;
1247 case NEGATE_EXPR:
1249 widest_int temv, temm;
1250 /* Return ~rval + 1. */
1251 bit_value_unop_1 (BIT_NOT_EXPR, type, &temv, &temm, type, rval, rmask);
1252 bit_value_binop_1 (PLUS_EXPR, type, val, mask,
1253 type, temv, temm, type, 1, 0);
1254 break;
1257 CASE_CONVERT:
1259 signop sgn;
1261 /* First extend mask and value according to the original type. */
1262 sgn = TYPE_SIGN (rtype);
1263 *mask = wi::ext (rmask, TYPE_PRECISION (rtype), sgn);
1264 *val = wi::ext (rval, TYPE_PRECISION (rtype), sgn);
1266 /* Then extend mask and value according to the target type. */
1267 sgn = TYPE_SIGN (type);
1268 *mask = wi::ext (*mask, TYPE_PRECISION (type), sgn);
1269 *val = wi::ext (*val, TYPE_PRECISION (type), sgn);
1270 break;
1273 default:
1274 *mask = -1;
1275 break;
1279 /* Apply the operation CODE in type TYPE to the value, mask pairs
1280 R1VAL, R1MASK and R2VAL, R2MASK representing a values of type R1TYPE
1281 and R2TYPE and set the value, mask pair *VAL and *MASK to the result. */
1283 static void
1284 bit_value_binop_1 (enum tree_code code, tree type,
1285 widest_int *val, widest_int *mask,
1286 tree r1type, const widest_int &r1val,
1287 const widest_int &r1mask, tree r2type,
1288 const widest_int &r2val, const widest_int &r2mask)
1290 signop sgn = TYPE_SIGN (type);
1291 int width = TYPE_PRECISION (type);
1292 bool swap_p = false;
1294 /* Assume we'll get a constant result. Use an initial non varying
1295 value, we fall back to varying in the end if necessary. */
1296 *mask = -1;
1298 switch (code)
1300 case BIT_AND_EXPR:
1301 /* The mask is constant where there is a known not
1302 set bit, (m1 | m2) & ((v1 | m1) & (v2 | m2)) */
1303 *mask = (r1mask | r2mask) & (r1val | r1mask) & (r2val | r2mask);
1304 *val = r1val & r2val;
1305 break;
1307 case BIT_IOR_EXPR:
1308 /* The mask is constant where there is a known
1309 set bit, (m1 | m2) & ~((v1 & ~m1) | (v2 & ~m2)). */
1310 *mask = (r1mask | r2mask)
1311 .and_not (r1val.and_not (r1mask) | r2val.and_not (r2mask));
1312 *val = r1val | r2val;
1313 break;
1315 case BIT_XOR_EXPR:
1316 /* m1 | m2 */
1317 *mask = r1mask | r2mask;
1318 *val = r1val ^ r2val;
1319 break;
1321 case LROTATE_EXPR:
1322 case RROTATE_EXPR:
1323 if (r2mask == 0)
1325 widest_int shift = r2val;
1326 if (shift == 0)
1328 *mask = r1mask;
1329 *val = r1val;
1331 else
1333 if (wi::neg_p (shift))
1335 shift = -shift;
1336 if (code == RROTATE_EXPR)
1337 code = LROTATE_EXPR;
1338 else
1339 code = RROTATE_EXPR;
1341 if (code == RROTATE_EXPR)
1343 *mask = wi::rrotate (r1mask, shift, width);
1344 *val = wi::rrotate (r1val, shift, width);
1346 else
1348 *mask = wi::lrotate (r1mask, shift, width);
1349 *val = wi::lrotate (r1val, shift, width);
1353 break;
1355 case LSHIFT_EXPR:
1356 case RSHIFT_EXPR:
1357 /* ??? We can handle partially known shift counts if we know
1358 its sign. That way we can tell that (x << (y | 8)) & 255
1359 is zero. */
1360 if (r2mask == 0)
1362 widest_int shift = r2val;
1363 if (shift == 0)
1365 *mask = r1mask;
1366 *val = r1val;
1368 else
1370 if (wi::neg_p (shift))
1372 shift = -shift;
1373 if (code == RSHIFT_EXPR)
1374 code = LSHIFT_EXPR;
1375 else
1376 code = RSHIFT_EXPR;
1378 if (code == RSHIFT_EXPR)
1380 *mask = wi::rshift (wi::ext (r1mask, width, sgn), shift, sgn);
1381 *val = wi::rshift (wi::ext (r1val, width, sgn), shift, sgn);
1383 else
1385 *mask = wi::ext (wi::lshift (r1mask, shift), width, sgn);
1386 *val = wi::ext (wi::lshift (r1val, shift), width, sgn);
1390 break;
1392 case PLUS_EXPR:
1393 case POINTER_PLUS_EXPR:
1395 /* Do the addition with unknown bits set to zero, to give carry-ins of
1396 zero wherever possible. */
1397 widest_int lo = r1val.and_not (r1mask) + r2val.and_not (r2mask);
1398 lo = wi::ext (lo, width, sgn);
1399 /* Do the addition with unknown bits set to one, to give carry-ins of
1400 one wherever possible. */
1401 widest_int hi = (r1val | r1mask) + (r2val | r2mask);
1402 hi = wi::ext (hi, width, sgn);
1403 /* Each bit in the result is known if (a) the corresponding bits in
1404 both inputs are known, and (b) the carry-in to that bit position
1405 is known. We can check condition (b) by seeing if we got the same
1406 result with minimised carries as with maximised carries. */
1407 *mask = r1mask | r2mask | (lo ^ hi);
1408 *mask = wi::ext (*mask, width, sgn);
1409 /* It shouldn't matter whether we choose lo or hi here. */
1410 *val = lo;
1411 break;
1414 case MINUS_EXPR:
1416 widest_int temv, temm;
1417 bit_value_unop_1 (NEGATE_EXPR, r2type, &temv, &temm,
1418 r2type, r2val, r2mask);
1419 bit_value_binop_1 (PLUS_EXPR, type, val, mask,
1420 r1type, r1val, r1mask,
1421 r2type, temv, temm);
1422 break;
1425 case MULT_EXPR:
1427 /* Just track trailing zeros in both operands and transfer
1428 them to the other. */
1429 int r1tz = wi::ctz (r1val | r1mask);
1430 int r2tz = wi::ctz (r2val | r2mask);
1431 if (r1tz + r2tz >= width)
1433 *mask = 0;
1434 *val = 0;
1436 else if (r1tz + r2tz > 0)
1438 *mask = wi::ext (wi::mask <widest_int> (r1tz + r2tz, true),
1439 width, sgn);
1440 *val = 0;
1442 break;
1445 case EQ_EXPR:
1446 case NE_EXPR:
1448 widest_int m = r1mask | r2mask;
1449 if (r1val.and_not (m) != r2val.and_not (m))
1451 *mask = 0;
1452 *val = ((code == EQ_EXPR) ? 0 : 1);
1454 else
1456 /* We know the result of a comparison is always one or zero. */
1457 *mask = 1;
1458 *val = 0;
1460 break;
1463 case GE_EXPR:
1464 case GT_EXPR:
1465 swap_p = true;
1466 code = swap_tree_comparison (code);
1467 /* Fall through. */
1468 case LT_EXPR:
1469 case LE_EXPR:
1471 int minmax, maxmin;
1473 const widest_int &o1val = swap_p ? r2val : r1val;
1474 const widest_int &o1mask = swap_p ? r2mask : r1mask;
1475 const widest_int &o2val = swap_p ? r1val : r2val;
1476 const widest_int &o2mask = swap_p ? r1mask : r2mask;
1478 /* If the most significant bits are not known we know nothing. */
1479 if (wi::neg_p (o1mask) || wi::neg_p (o2mask))
1480 break;
1482 /* For comparisons the signedness is in the comparison operands. */
1483 sgn = TYPE_SIGN (r1type);
1485 /* If we know the most significant bits we know the values
1486 value ranges by means of treating varying bits as zero
1487 or one. Do a cross comparison of the max/min pairs. */
1488 maxmin = wi::cmp (o1val | o1mask, o2val.and_not (o2mask), sgn);
1489 minmax = wi::cmp (o1val.and_not (o1mask), o2val | o2mask, sgn);
1490 if (maxmin < 0) /* o1 is less than o2. */
1492 *mask = 0;
1493 *val = 1;
1495 else if (minmax > 0) /* o1 is not less or equal to o2. */
1497 *mask = 0;
1498 *val = 0;
1500 else if (maxmin == minmax) /* o1 and o2 are equal. */
1502 /* This probably should never happen as we'd have
1503 folded the thing during fully constant value folding. */
1504 *mask = 0;
1505 *val = (code == LE_EXPR ? 1 : 0);
1507 else
1509 /* We know the result of a comparison is always one or zero. */
1510 *mask = 1;
1511 *val = 0;
1513 break;
1516 default:;
1520 /* Return the propagation value when applying the operation CODE to
1521 the value RHS yielding type TYPE. */
1523 static ccp_prop_value_t
1524 bit_value_unop (enum tree_code code, tree type, tree rhs)
1526 ccp_prop_value_t rval = get_value_for_expr (rhs, true);
1527 widest_int value, mask;
1528 ccp_prop_value_t val;
1530 if (rval.lattice_val == UNDEFINED)
1531 return rval;
1533 gcc_assert ((rval.lattice_val == CONSTANT
1534 && TREE_CODE (rval.value) == INTEGER_CST)
1535 || wi::sext (rval.mask, TYPE_PRECISION (TREE_TYPE (rhs))) == -1);
1536 bit_value_unop_1 (code, type, &value, &mask,
1537 TREE_TYPE (rhs), value_to_wide_int (rval), rval.mask);
1538 if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
1540 val.lattice_val = CONSTANT;
1541 val.mask = mask;
1542 /* ??? Delay building trees here. */
1543 val.value = wide_int_to_tree (type, value);
1545 else
1547 val.lattice_val = VARYING;
1548 val.value = NULL_TREE;
1549 val.mask = -1;
1551 return val;
1554 /* Return the propagation value when applying the operation CODE to
1555 the values RHS1 and RHS2 yielding type TYPE. */
1557 static ccp_prop_value_t
1558 bit_value_binop (enum tree_code code, tree type, tree rhs1, tree rhs2)
1560 ccp_prop_value_t r1val = get_value_for_expr (rhs1, true);
1561 ccp_prop_value_t r2val = get_value_for_expr (rhs2, true);
1562 widest_int value, mask;
1563 ccp_prop_value_t val;
1565 if (r1val.lattice_val == UNDEFINED
1566 || r2val.lattice_val == UNDEFINED)
1568 val.lattice_val = VARYING;
1569 val.value = NULL_TREE;
1570 val.mask = -1;
1571 return val;
1574 gcc_assert ((r1val.lattice_val == CONSTANT
1575 && TREE_CODE (r1val.value) == INTEGER_CST)
1576 || wi::sext (r1val.mask,
1577 TYPE_PRECISION (TREE_TYPE (rhs1))) == -1);
1578 gcc_assert ((r2val.lattice_val == CONSTANT
1579 && TREE_CODE (r2val.value) == INTEGER_CST)
1580 || wi::sext (r2val.mask,
1581 TYPE_PRECISION (TREE_TYPE (rhs2))) == -1);
1582 bit_value_binop_1 (code, type, &value, &mask,
1583 TREE_TYPE (rhs1), value_to_wide_int (r1val), r1val.mask,
1584 TREE_TYPE (rhs2), value_to_wide_int (r2val), r2val.mask);
1585 if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
1587 val.lattice_val = CONSTANT;
1588 val.mask = mask;
1589 /* ??? Delay building trees here. */
1590 val.value = wide_int_to_tree (type, value);
1592 else
1594 val.lattice_val = VARYING;
1595 val.value = NULL_TREE;
1596 val.mask = -1;
1598 return val;
1601 /* Return the propagation value for __builtin_assume_aligned
1602 and functions with assume_aligned or alloc_aligned attribute.
1603 For __builtin_assume_aligned, ATTR is NULL_TREE,
1604 for assume_aligned attribute ATTR is non-NULL and ALLOC_ALIGNED
1605 is false, for alloc_aligned attribute ATTR is non-NULL and
1606 ALLOC_ALIGNED is true. */
1608 static ccp_prop_value_t
1609 bit_value_assume_aligned (gimple stmt, tree attr, ccp_prop_value_t ptrval,
1610 bool alloc_aligned)
1612 tree align, misalign = NULL_TREE, type;
1613 unsigned HOST_WIDE_INT aligni, misaligni = 0;
1614 ccp_prop_value_t alignval;
1615 widest_int value, mask;
1616 ccp_prop_value_t val;
1618 if (attr == NULL_TREE)
1620 tree ptr = gimple_call_arg (stmt, 0);
1621 type = TREE_TYPE (ptr);
1622 ptrval = get_value_for_expr (ptr, true);
1624 else
1626 tree lhs = gimple_call_lhs (stmt);
1627 type = TREE_TYPE (lhs);
1630 if (ptrval.lattice_val == UNDEFINED)
1631 return ptrval;
1632 gcc_assert ((ptrval.lattice_val == CONSTANT
1633 && TREE_CODE (ptrval.value) == INTEGER_CST)
1634 || wi::sext (ptrval.mask, TYPE_PRECISION (type)) == -1);
1635 if (attr == NULL_TREE)
1637 /* Get aligni and misaligni from __builtin_assume_aligned. */
1638 align = gimple_call_arg (stmt, 1);
1639 if (!tree_fits_uhwi_p (align))
1640 return ptrval;
1641 aligni = tree_to_uhwi (align);
1642 if (gimple_call_num_args (stmt) > 2)
1644 misalign = gimple_call_arg (stmt, 2);
1645 if (!tree_fits_uhwi_p (misalign))
1646 return ptrval;
1647 misaligni = tree_to_uhwi (misalign);
1650 else
1652 /* Get aligni and misaligni from assume_aligned or
1653 alloc_align attributes. */
1654 if (TREE_VALUE (attr) == NULL_TREE)
1655 return ptrval;
1656 attr = TREE_VALUE (attr);
1657 align = TREE_VALUE (attr);
1658 if (!tree_fits_uhwi_p (align))
1659 return ptrval;
1660 aligni = tree_to_uhwi (align);
1661 if (alloc_aligned)
1663 if (aligni == 0 || aligni > gimple_call_num_args (stmt))
1664 return ptrval;
1665 align = gimple_call_arg (stmt, aligni - 1);
1666 if (!tree_fits_uhwi_p (align))
1667 return ptrval;
1668 aligni = tree_to_uhwi (align);
1670 else if (TREE_CHAIN (attr) && TREE_VALUE (TREE_CHAIN (attr)))
1672 misalign = TREE_VALUE (TREE_CHAIN (attr));
1673 if (!tree_fits_uhwi_p (misalign))
1674 return ptrval;
1675 misaligni = tree_to_uhwi (misalign);
1678 if (aligni <= 1 || (aligni & (aligni - 1)) != 0 || misaligni >= aligni)
1679 return ptrval;
1681 align = build_int_cst_type (type, -aligni);
1682 alignval = get_value_for_expr (align, true);
1683 bit_value_binop_1 (BIT_AND_EXPR, type, &value, &mask,
1684 type, value_to_wide_int (ptrval), ptrval.mask,
1685 type, value_to_wide_int (alignval), alignval.mask);
1686 if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
1688 val.lattice_val = CONSTANT;
1689 val.mask = mask;
1690 gcc_assert ((mask.to_uhwi () & (aligni - 1)) == 0);
1691 gcc_assert ((value.to_uhwi () & (aligni - 1)) == 0);
1692 value |= misaligni;
1693 /* ??? Delay building trees here. */
1694 val.value = wide_int_to_tree (type, value);
1696 else
1698 val.lattice_val = VARYING;
1699 val.value = NULL_TREE;
1700 val.mask = -1;
1702 return val;
1705 /* Evaluate statement STMT.
1706 Valid only for assignments, calls, conditionals, and switches. */
1708 static ccp_prop_value_t
1709 evaluate_stmt (gimple stmt)
1711 ccp_prop_value_t val;
1712 tree simplified = NULL_TREE;
1713 ccp_lattice_t likelyvalue = likely_value (stmt);
1714 bool is_constant = false;
1715 unsigned int align;
1717 if (dump_file && (dump_flags & TDF_DETAILS))
1719 fprintf (dump_file, "which is likely ");
1720 switch (likelyvalue)
1722 case CONSTANT:
1723 fprintf (dump_file, "CONSTANT");
1724 break;
1725 case UNDEFINED:
1726 fprintf (dump_file, "UNDEFINED");
1727 break;
1728 case VARYING:
1729 fprintf (dump_file, "VARYING");
1730 break;
1731 default:;
1733 fprintf (dump_file, "\n");
1736 /* If the statement is likely to have a CONSTANT result, then try
1737 to fold the statement to determine the constant value. */
1738 /* FIXME. This is the only place that we call ccp_fold.
1739 Since likely_value never returns CONSTANT for calls, we will
1740 not attempt to fold them, including builtins that may profit. */
1741 if (likelyvalue == CONSTANT)
1743 fold_defer_overflow_warnings ();
1744 simplified = ccp_fold (stmt);
1745 if (simplified && TREE_CODE (simplified) == SSA_NAME)
1747 val = *get_value (simplified);
1748 if (val.lattice_val != VARYING)
1750 fold_undefer_overflow_warnings (true, stmt, 0);
1751 return val;
1754 is_constant = simplified && is_gimple_min_invariant (simplified);
1755 fold_undefer_overflow_warnings (is_constant, stmt, 0);
1756 if (is_constant)
1758 /* The statement produced a constant value. */
1759 val.lattice_val = CONSTANT;
1760 val.value = simplified;
1761 val.mask = 0;
1762 return val;
1765 /* If the statement is likely to have a VARYING result, then do not
1766 bother folding the statement. */
1767 else if (likelyvalue == VARYING)
1769 enum gimple_code code = gimple_code (stmt);
1770 if (code == GIMPLE_ASSIGN)
1772 enum tree_code subcode = gimple_assign_rhs_code (stmt);
1774 /* Other cases cannot satisfy is_gimple_min_invariant
1775 without folding. */
1776 if (get_gimple_rhs_class (subcode) == GIMPLE_SINGLE_RHS)
1777 simplified = gimple_assign_rhs1 (stmt);
1779 else if (code == GIMPLE_SWITCH)
1780 simplified = gimple_switch_index (as_a <gswitch *> (stmt));
1781 else
1782 /* These cannot satisfy is_gimple_min_invariant without folding. */
1783 gcc_assert (code == GIMPLE_CALL || code == GIMPLE_COND);
1784 is_constant = simplified && is_gimple_min_invariant (simplified);
1785 if (is_constant)
1787 /* The statement produced a constant value. */
1788 val.lattice_val = CONSTANT;
1789 val.value = simplified;
1790 val.mask = 0;
1793 /* If the statement result is likely UNDEFINED, make it so. */
1794 else if (likelyvalue == UNDEFINED)
1796 val.lattice_val = UNDEFINED;
1797 val.value = NULL_TREE;
1798 val.mask = 0;
1799 return val;
1802 /* Resort to simplification for bitwise tracking. */
1803 if (flag_tree_bit_ccp
1804 && (likelyvalue == CONSTANT || is_gimple_call (stmt)
1805 || (gimple_assign_single_p (stmt)
1806 && gimple_assign_rhs_code (stmt) == ADDR_EXPR))
1807 && !is_constant)
1809 enum gimple_code code = gimple_code (stmt);
1810 val.lattice_val = VARYING;
1811 val.value = NULL_TREE;
1812 val.mask = -1;
1813 if (code == GIMPLE_ASSIGN)
1815 enum tree_code subcode = gimple_assign_rhs_code (stmt);
1816 tree rhs1 = gimple_assign_rhs1 (stmt);
1817 tree lhs = gimple_assign_lhs (stmt);
1818 if ((INTEGRAL_TYPE_P (TREE_TYPE (lhs))
1819 || POINTER_TYPE_P (TREE_TYPE (lhs)))
1820 && (INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
1821 || POINTER_TYPE_P (TREE_TYPE (rhs1))))
1822 switch (get_gimple_rhs_class (subcode))
1824 case GIMPLE_SINGLE_RHS:
1825 val = get_value_for_expr (rhs1, true);
1826 break;
1828 case GIMPLE_UNARY_RHS:
1829 val = bit_value_unop (subcode, TREE_TYPE (lhs), rhs1);
1830 break;
1832 case GIMPLE_BINARY_RHS:
1833 val = bit_value_binop (subcode, TREE_TYPE (lhs), rhs1,
1834 gimple_assign_rhs2 (stmt));
1835 break;
1837 default:;
1840 else if (code == GIMPLE_COND)
1842 enum tree_code code = gimple_cond_code (stmt);
1843 tree rhs1 = gimple_cond_lhs (stmt);
1844 tree rhs2 = gimple_cond_rhs (stmt);
1845 if (INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
1846 || POINTER_TYPE_P (TREE_TYPE (rhs1)))
1847 val = bit_value_binop (code, TREE_TYPE (rhs1), rhs1, rhs2);
1849 else if (gimple_call_builtin_p (stmt, BUILT_IN_NORMAL))
1851 tree fndecl = gimple_call_fndecl (stmt);
1852 switch (DECL_FUNCTION_CODE (fndecl))
1854 case BUILT_IN_MALLOC:
1855 case BUILT_IN_REALLOC:
1856 case BUILT_IN_CALLOC:
1857 case BUILT_IN_STRDUP:
1858 case BUILT_IN_STRNDUP:
1859 val.lattice_val = CONSTANT;
1860 val.value = build_int_cst (TREE_TYPE (gimple_get_lhs (stmt)), 0);
1861 val.mask = ~((HOST_WIDE_INT) MALLOC_ABI_ALIGNMENT
1862 / BITS_PER_UNIT - 1);
1863 break;
1865 case BUILT_IN_ALLOCA:
1866 case BUILT_IN_ALLOCA_WITH_ALIGN:
1867 align = (DECL_FUNCTION_CODE (fndecl) == BUILT_IN_ALLOCA_WITH_ALIGN
1868 ? TREE_INT_CST_LOW (gimple_call_arg (stmt, 1))
1869 : BIGGEST_ALIGNMENT);
1870 val.lattice_val = CONSTANT;
1871 val.value = build_int_cst (TREE_TYPE (gimple_get_lhs (stmt)), 0);
1872 val.mask = ~((HOST_WIDE_INT) align / BITS_PER_UNIT - 1);
1873 break;
1875 /* These builtins return their first argument, unmodified. */
1876 case BUILT_IN_MEMCPY:
1877 case BUILT_IN_MEMMOVE:
1878 case BUILT_IN_MEMSET:
1879 case BUILT_IN_STRCPY:
1880 case BUILT_IN_STRNCPY:
1881 case BUILT_IN_MEMCPY_CHK:
1882 case BUILT_IN_MEMMOVE_CHK:
1883 case BUILT_IN_MEMSET_CHK:
1884 case BUILT_IN_STRCPY_CHK:
1885 case BUILT_IN_STRNCPY_CHK:
1886 val = get_value_for_expr (gimple_call_arg (stmt, 0), true);
1887 break;
1889 case BUILT_IN_ASSUME_ALIGNED:
1890 val = bit_value_assume_aligned (stmt, NULL_TREE, val, false);
1891 break;
1893 case BUILT_IN_ALIGNED_ALLOC:
1895 tree align = get_constant_value (gimple_call_arg (stmt, 0));
1896 if (align
1897 && tree_fits_uhwi_p (align))
1899 unsigned HOST_WIDE_INT aligni = tree_to_uhwi (align);
1900 if (aligni > 1
1901 /* align must be power-of-two */
1902 && (aligni & (aligni - 1)) == 0)
1904 val.lattice_val = CONSTANT;
1905 val.value = build_int_cst (ptr_type_node, 0);
1906 val.mask = -aligni;
1909 break;
1912 default:;
1915 if (is_gimple_call (stmt) && gimple_call_lhs (stmt))
1917 tree fntype = gimple_call_fntype (stmt);
1918 if (fntype)
1920 tree attrs = lookup_attribute ("assume_aligned",
1921 TYPE_ATTRIBUTES (fntype));
1922 if (attrs)
1923 val = bit_value_assume_aligned (stmt, attrs, val, false);
1924 attrs = lookup_attribute ("alloc_align",
1925 TYPE_ATTRIBUTES (fntype));
1926 if (attrs)
1927 val = bit_value_assume_aligned (stmt, attrs, val, true);
1930 is_constant = (val.lattice_val == CONSTANT);
1933 if (flag_tree_bit_ccp
1934 && ((is_constant && TREE_CODE (val.value) == INTEGER_CST)
1935 || !is_constant)
1936 && gimple_get_lhs (stmt)
1937 && TREE_CODE (gimple_get_lhs (stmt)) == SSA_NAME)
1939 tree lhs = gimple_get_lhs (stmt);
1940 wide_int nonzero_bits = get_nonzero_bits (lhs);
1941 if (nonzero_bits != -1)
1943 if (!is_constant)
1945 val.lattice_val = CONSTANT;
1946 val.value = build_zero_cst (TREE_TYPE (lhs));
1947 val.mask = extend_mask (nonzero_bits);
1948 is_constant = true;
1950 else
1952 if (wi::bit_and_not (val.value, nonzero_bits) != 0)
1953 val.value = wide_int_to_tree (TREE_TYPE (lhs),
1954 nonzero_bits & val.value);
1955 if (nonzero_bits == 0)
1956 val.mask = 0;
1957 else
1958 val.mask = val.mask & extend_mask (nonzero_bits);
1963 /* The statement produced a nonconstant value. */
1964 if (!is_constant)
1966 /* The statement produced a copy. */
1967 if (simplified && TREE_CODE (simplified) == SSA_NAME
1968 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (simplified))
1970 val.lattice_val = CONSTANT;
1971 val.value = simplified;
1972 val.mask = -1;
1974 /* The statement is VARYING. */
1975 else
1977 val.lattice_val = VARYING;
1978 val.value = NULL_TREE;
1979 val.mask = -1;
1983 return val;
1986 typedef hash_table<pointer_hash<gimple_statement_base> > gimple_htab;
1988 /* Given a BUILT_IN_STACK_SAVE value SAVED_VAL, insert a clobber of VAR before
1989 each matching BUILT_IN_STACK_RESTORE. Mark visited phis in VISITED. */
1991 static void
1992 insert_clobber_before_stack_restore (tree saved_val, tree var,
1993 gimple_htab **visited)
1995 gimple stmt;
1996 gassign *clobber_stmt;
1997 tree clobber;
1998 imm_use_iterator iter;
1999 gimple_stmt_iterator i;
2000 gimple *slot;
2002 FOR_EACH_IMM_USE_STMT (stmt, iter, saved_val)
2003 if (gimple_call_builtin_p (stmt, BUILT_IN_STACK_RESTORE))
2005 clobber = build_constructor (TREE_TYPE (var),
2006 NULL);
2007 TREE_THIS_VOLATILE (clobber) = 1;
2008 clobber_stmt = gimple_build_assign (var, clobber);
2010 i = gsi_for_stmt (stmt);
2011 gsi_insert_before (&i, clobber_stmt, GSI_SAME_STMT);
2013 else if (gimple_code (stmt) == GIMPLE_PHI)
2015 if (!*visited)
2016 *visited = new gimple_htab (10);
2018 slot = (*visited)->find_slot (stmt, INSERT);
2019 if (*slot != NULL)
2020 continue;
2022 *slot = stmt;
2023 insert_clobber_before_stack_restore (gimple_phi_result (stmt), var,
2024 visited);
2026 else if (gimple_assign_ssa_name_copy_p (stmt))
2027 insert_clobber_before_stack_restore (gimple_assign_lhs (stmt), var,
2028 visited);
2029 else if (chkp_gimple_call_builtin_p (stmt, BUILT_IN_CHKP_BNDRET))
2030 continue;
2031 else
2032 gcc_assert (is_gimple_debug (stmt));
2035 /* Advance the iterator to the previous non-debug gimple statement in the same
2036 or dominating basic block. */
2038 static inline void
2039 gsi_prev_dom_bb_nondebug (gimple_stmt_iterator *i)
2041 basic_block dom;
2043 gsi_prev_nondebug (i);
2044 while (gsi_end_p (*i))
2046 dom = get_immediate_dominator (CDI_DOMINATORS, i->bb);
2047 if (dom == NULL || dom == ENTRY_BLOCK_PTR_FOR_FN (cfun))
2048 return;
2050 *i = gsi_last_bb (dom);
2054 /* Find a BUILT_IN_STACK_SAVE dominating gsi_stmt (I), and insert
2055 a clobber of VAR before each matching BUILT_IN_STACK_RESTORE.
2057 It is possible that BUILT_IN_STACK_SAVE cannot be find in a dominator when a
2058 previous pass (such as DOM) duplicated it along multiple paths to a BB. In
2059 that case the function gives up without inserting the clobbers. */
2061 static void
2062 insert_clobbers_for_var (gimple_stmt_iterator i, tree var)
2064 gimple stmt;
2065 tree saved_val;
2066 gimple_htab *visited = NULL;
2068 for (; !gsi_end_p (i); gsi_prev_dom_bb_nondebug (&i))
2070 stmt = gsi_stmt (i);
2072 if (!gimple_call_builtin_p (stmt, BUILT_IN_STACK_SAVE))
2073 continue;
2075 saved_val = gimple_call_lhs (stmt);
2076 if (saved_val == NULL_TREE)
2077 continue;
2079 insert_clobber_before_stack_restore (saved_val, var, &visited);
2080 break;
2083 delete visited;
2086 /* Detects a __builtin_alloca_with_align with constant size argument. Declares
2087 fixed-size array and returns the address, if found, otherwise returns
2088 NULL_TREE. */
2090 static tree
2091 fold_builtin_alloca_with_align (gimple stmt)
2093 unsigned HOST_WIDE_INT size, threshold, n_elem;
2094 tree lhs, arg, block, var, elem_type, array_type;
2096 /* Get lhs. */
2097 lhs = gimple_call_lhs (stmt);
2098 if (lhs == NULL_TREE)
2099 return NULL_TREE;
2101 /* Detect constant argument. */
2102 arg = get_constant_value (gimple_call_arg (stmt, 0));
2103 if (arg == NULL_TREE
2104 || TREE_CODE (arg) != INTEGER_CST
2105 || !tree_fits_uhwi_p (arg))
2106 return NULL_TREE;
2108 size = tree_to_uhwi (arg);
2110 /* Heuristic: don't fold large allocas. */
2111 threshold = (unsigned HOST_WIDE_INT)PARAM_VALUE (PARAM_LARGE_STACK_FRAME);
2112 /* In case the alloca is located at function entry, it has the same lifetime
2113 as a declared array, so we allow a larger size. */
2114 block = gimple_block (stmt);
2115 if (!(cfun->after_inlining
2116 && TREE_CODE (BLOCK_SUPERCONTEXT (block)) == FUNCTION_DECL))
2117 threshold /= 10;
2118 if (size > threshold)
2119 return NULL_TREE;
2121 /* Declare array. */
2122 elem_type = build_nonstandard_integer_type (BITS_PER_UNIT, 1);
2123 n_elem = size * 8 / BITS_PER_UNIT;
2124 array_type = build_array_type_nelts (elem_type, n_elem);
2125 var = create_tmp_var (array_type);
2126 DECL_ALIGN (var) = TREE_INT_CST_LOW (gimple_call_arg (stmt, 1));
2128 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (lhs);
2129 if (pi != NULL && !pi->pt.anything)
2131 bool singleton_p;
2132 unsigned uid;
2133 singleton_p = pt_solution_singleton_p (&pi->pt, &uid);
2134 gcc_assert (singleton_p);
2135 SET_DECL_PT_UID (var, uid);
2139 /* Fold alloca to the address of the array. */
2140 return fold_convert (TREE_TYPE (lhs), build_fold_addr_expr (var));
2143 /* Fold the stmt at *GSI with CCP specific information that propagating
2144 and regular folding does not catch. */
2146 static bool
2147 ccp_fold_stmt (gimple_stmt_iterator *gsi)
2149 gimple stmt = gsi_stmt (*gsi);
2151 switch (gimple_code (stmt))
2153 case GIMPLE_COND:
2155 gcond *cond_stmt = as_a <gcond *> (stmt);
2156 ccp_prop_value_t val;
2157 /* Statement evaluation will handle type mismatches in constants
2158 more gracefully than the final propagation. This allows us to
2159 fold more conditionals here. */
2160 val = evaluate_stmt (stmt);
2161 if (val.lattice_val != CONSTANT
2162 || val.mask != 0)
2163 return false;
2165 if (dump_file)
2167 fprintf (dump_file, "Folding predicate ");
2168 print_gimple_expr (dump_file, stmt, 0, 0);
2169 fprintf (dump_file, " to ");
2170 print_generic_expr (dump_file, val.value, 0);
2171 fprintf (dump_file, "\n");
2174 if (integer_zerop (val.value))
2175 gimple_cond_make_false (cond_stmt);
2176 else
2177 gimple_cond_make_true (cond_stmt);
2179 return true;
2182 case GIMPLE_CALL:
2184 tree lhs = gimple_call_lhs (stmt);
2185 int flags = gimple_call_flags (stmt);
2186 tree val;
2187 tree argt;
2188 bool changed = false;
2189 unsigned i;
2191 /* If the call was folded into a constant make sure it goes
2192 away even if we cannot propagate into all uses because of
2193 type issues. */
2194 if (lhs
2195 && TREE_CODE (lhs) == SSA_NAME
2196 && (val = get_constant_value (lhs))
2197 /* Don't optimize away calls that have side-effects. */
2198 && (flags & (ECF_CONST|ECF_PURE)) != 0
2199 && (flags & ECF_LOOPING_CONST_OR_PURE) == 0)
2201 tree new_rhs = unshare_expr (val);
2202 bool res;
2203 if (!useless_type_conversion_p (TREE_TYPE (lhs),
2204 TREE_TYPE (new_rhs)))
2205 new_rhs = fold_convert (TREE_TYPE (lhs), new_rhs);
2206 res = update_call_from_tree (gsi, new_rhs);
2207 gcc_assert (res);
2208 return true;
2211 /* Internal calls provide no argument types, so the extra laxity
2212 for normal calls does not apply. */
2213 if (gimple_call_internal_p (stmt))
2214 return false;
2216 /* The heuristic of fold_builtin_alloca_with_align differs before and
2217 after inlining, so we don't require the arg to be changed into a
2218 constant for folding, but just to be constant. */
2219 if (gimple_call_builtin_p (stmt, BUILT_IN_ALLOCA_WITH_ALIGN))
2221 tree new_rhs = fold_builtin_alloca_with_align (stmt);
2222 if (new_rhs)
2224 bool res = update_call_from_tree (gsi, new_rhs);
2225 tree var = TREE_OPERAND (TREE_OPERAND (new_rhs, 0),0);
2226 gcc_assert (res);
2227 insert_clobbers_for_var (*gsi, var);
2228 return true;
2232 /* Propagate into the call arguments. Compared to replace_uses_in
2233 this can use the argument slot types for type verification
2234 instead of the current argument type. We also can safely
2235 drop qualifiers here as we are dealing with constants anyway. */
2236 argt = TYPE_ARG_TYPES (gimple_call_fntype (stmt));
2237 for (i = 0; i < gimple_call_num_args (stmt) && argt;
2238 ++i, argt = TREE_CHAIN (argt))
2240 tree arg = gimple_call_arg (stmt, i);
2241 if (TREE_CODE (arg) == SSA_NAME
2242 && (val = get_constant_value (arg))
2243 && useless_type_conversion_p
2244 (TYPE_MAIN_VARIANT (TREE_VALUE (argt)),
2245 TYPE_MAIN_VARIANT (TREE_TYPE (val))))
2247 gimple_call_set_arg (stmt, i, unshare_expr (val));
2248 changed = true;
2252 return changed;
2255 case GIMPLE_ASSIGN:
2257 tree lhs = gimple_assign_lhs (stmt);
2258 tree val;
2260 /* If we have a load that turned out to be constant replace it
2261 as we cannot propagate into all uses in all cases. */
2262 if (gimple_assign_single_p (stmt)
2263 && TREE_CODE (lhs) == SSA_NAME
2264 && (val = get_constant_value (lhs)))
2266 tree rhs = unshare_expr (val);
2267 if (!useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (rhs)))
2268 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (lhs), rhs);
2269 gimple_assign_set_rhs_from_tree (gsi, rhs);
2270 return true;
2273 return false;
2276 default:
2277 return false;
2281 /* Visit the assignment statement STMT. Set the value of its LHS to the
2282 value computed by the RHS and store LHS in *OUTPUT_P. If STMT
2283 creates virtual definitions, set the value of each new name to that
2284 of the RHS (if we can derive a constant out of the RHS).
2285 Value-returning call statements also perform an assignment, and
2286 are handled here. */
2288 static enum ssa_prop_result
2289 visit_assignment (gimple stmt, tree *output_p)
2291 ccp_prop_value_t val;
2292 enum ssa_prop_result retval = SSA_PROP_NOT_INTERESTING;
2294 tree lhs = gimple_get_lhs (stmt);
2295 if (TREE_CODE (lhs) == SSA_NAME)
2297 /* Evaluate the statement, which could be
2298 either a GIMPLE_ASSIGN or a GIMPLE_CALL. */
2299 val = evaluate_stmt (stmt);
2301 /* If STMT is an assignment to an SSA_NAME, we only have one
2302 value to set. */
2303 if (set_lattice_value (lhs, &val))
2305 *output_p = lhs;
2306 if (val.lattice_val == VARYING)
2307 retval = SSA_PROP_VARYING;
2308 else
2309 retval = SSA_PROP_INTERESTING;
2313 return retval;
2317 /* Visit the conditional statement STMT. Return SSA_PROP_INTERESTING
2318 if it can determine which edge will be taken. Otherwise, return
2319 SSA_PROP_VARYING. */
2321 static enum ssa_prop_result
2322 visit_cond_stmt (gimple stmt, edge *taken_edge_p)
2324 ccp_prop_value_t val;
2325 basic_block block;
2327 block = gimple_bb (stmt);
2328 val = evaluate_stmt (stmt);
2329 if (val.lattice_val != CONSTANT
2330 || val.mask != 0)
2331 return SSA_PROP_VARYING;
2333 /* Find which edge out of the conditional block will be taken and add it
2334 to the worklist. If no single edge can be determined statically,
2335 return SSA_PROP_VARYING to feed all the outgoing edges to the
2336 propagation engine. */
2337 *taken_edge_p = find_taken_edge (block, val.value);
2338 if (*taken_edge_p)
2339 return SSA_PROP_INTERESTING;
2340 else
2341 return SSA_PROP_VARYING;
2345 /* Evaluate statement STMT. If the statement produces an output value and
2346 its evaluation changes the lattice value of its output, return
2347 SSA_PROP_INTERESTING and set *OUTPUT_P to the SSA_NAME holding the
2348 output value.
2350 If STMT is a conditional branch and we can determine its truth
2351 value, set *TAKEN_EDGE_P accordingly. If STMT produces a varying
2352 value, return SSA_PROP_VARYING. */
2354 static enum ssa_prop_result
2355 ccp_visit_stmt (gimple stmt, edge *taken_edge_p, tree *output_p)
2357 tree def;
2358 ssa_op_iter iter;
2360 if (dump_file && (dump_flags & TDF_DETAILS))
2362 fprintf (dump_file, "\nVisiting statement:\n");
2363 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
2366 switch (gimple_code (stmt))
2368 case GIMPLE_ASSIGN:
2369 /* If the statement is an assignment that produces a single
2370 output value, evaluate its RHS to see if the lattice value of
2371 its output has changed. */
2372 return visit_assignment (stmt, output_p);
2374 case GIMPLE_CALL:
2375 /* A value-returning call also performs an assignment. */
2376 if (gimple_call_lhs (stmt) != NULL_TREE)
2377 return visit_assignment (stmt, output_p);
2378 break;
2380 case GIMPLE_COND:
2381 case GIMPLE_SWITCH:
2382 /* If STMT is a conditional branch, see if we can determine
2383 which branch will be taken. */
2384 /* FIXME. It appears that we should be able to optimize
2385 computed GOTOs here as well. */
2386 return visit_cond_stmt (stmt, taken_edge_p);
2388 default:
2389 break;
2392 /* Any other kind of statement is not interesting for constant
2393 propagation and, therefore, not worth simulating. */
2394 if (dump_file && (dump_flags & TDF_DETAILS))
2395 fprintf (dump_file, "No interesting values produced. Marked VARYING.\n");
2397 /* Definitions made by statements other than assignments to
2398 SSA_NAMEs represent unknown modifications to their outputs.
2399 Mark them VARYING. */
2400 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
2401 set_value_varying (def);
2403 return SSA_PROP_VARYING;
2407 /* Main entry point for SSA Conditional Constant Propagation. */
2409 static unsigned int
2410 do_ssa_ccp (void)
2412 unsigned int todo = 0;
2413 calculate_dominance_info (CDI_DOMINATORS);
2414 ccp_initialize ();
2415 ssa_propagate (ccp_visit_stmt, ccp_visit_phi_node);
2416 if (ccp_finalize ())
2417 todo = (TODO_cleanup_cfg | TODO_update_ssa);
2418 free_dominance_info (CDI_DOMINATORS);
2419 return todo;
2423 namespace {
2425 const pass_data pass_data_ccp =
2427 GIMPLE_PASS, /* type */
2428 "ccp", /* name */
2429 OPTGROUP_NONE, /* optinfo_flags */
2430 TV_TREE_CCP, /* tv_id */
2431 ( PROP_cfg | PROP_ssa ), /* properties_required */
2432 0, /* properties_provided */
2433 0, /* properties_destroyed */
2434 0, /* todo_flags_start */
2435 TODO_update_address_taken, /* todo_flags_finish */
2438 class pass_ccp : public gimple_opt_pass
2440 public:
2441 pass_ccp (gcc::context *ctxt)
2442 : gimple_opt_pass (pass_data_ccp, ctxt)
2445 /* opt_pass methods: */
2446 opt_pass * clone () { return new pass_ccp (m_ctxt); }
2447 virtual bool gate (function *) { return flag_tree_ccp != 0; }
2448 virtual unsigned int execute (function *) { return do_ssa_ccp (); }
2450 }; // class pass_ccp
2452 } // anon namespace
2454 gimple_opt_pass *
2455 make_pass_ccp (gcc::context *ctxt)
2457 return new pass_ccp (ctxt);
2462 /* Try to optimize out __builtin_stack_restore. Optimize it out
2463 if there is another __builtin_stack_restore in the same basic
2464 block and no calls or ASM_EXPRs are in between, or if this block's
2465 only outgoing edge is to EXIT_BLOCK and there are no calls or
2466 ASM_EXPRs after this __builtin_stack_restore. */
2468 static tree
2469 optimize_stack_restore (gimple_stmt_iterator i)
2471 tree callee;
2472 gimple stmt;
2474 basic_block bb = gsi_bb (i);
2475 gimple call = gsi_stmt (i);
2477 if (gimple_code (call) != GIMPLE_CALL
2478 || gimple_call_num_args (call) != 1
2479 || TREE_CODE (gimple_call_arg (call, 0)) != SSA_NAME
2480 || !POINTER_TYPE_P (TREE_TYPE (gimple_call_arg (call, 0))))
2481 return NULL_TREE;
2483 for (gsi_next (&i); !gsi_end_p (i); gsi_next (&i))
2485 stmt = gsi_stmt (i);
2486 if (gimple_code (stmt) == GIMPLE_ASM)
2487 return NULL_TREE;
2488 if (gimple_code (stmt) != GIMPLE_CALL)
2489 continue;
2491 callee = gimple_call_fndecl (stmt);
2492 if (!callee
2493 || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL
2494 /* All regular builtins are ok, just obviously not alloca. */
2495 || DECL_FUNCTION_CODE (callee) == BUILT_IN_ALLOCA
2496 || DECL_FUNCTION_CODE (callee) == BUILT_IN_ALLOCA_WITH_ALIGN)
2497 return NULL_TREE;
2499 if (DECL_FUNCTION_CODE (callee) == BUILT_IN_STACK_RESTORE)
2500 goto second_stack_restore;
2503 if (!gsi_end_p (i))
2504 return NULL_TREE;
2506 /* Allow one successor of the exit block, or zero successors. */
2507 switch (EDGE_COUNT (bb->succs))
2509 case 0:
2510 break;
2511 case 1:
2512 if (single_succ_edge (bb)->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
2513 return NULL_TREE;
2514 break;
2515 default:
2516 return NULL_TREE;
2518 second_stack_restore:
2520 /* If there's exactly one use, then zap the call to __builtin_stack_save.
2521 If there are multiple uses, then the last one should remove the call.
2522 In any case, whether the call to __builtin_stack_save can be removed
2523 or not is irrelevant to removing the call to __builtin_stack_restore. */
2524 if (has_single_use (gimple_call_arg (call, 0)))
2526 gimple stack_save = SSA_NAME_DEF_STMT (gimple_call_arg (call, 0));
2527 if (is_gimple_call (stack_save))
2529 callee = gimple_call_fndecl (stack_save);
2530 if (callee
2531 && DECL_BUILT_IN_CLASS (callee) == BUILT_IN_NORMAL
2532 && DECL_FUNCTION_CODE (callee) == BUILT_IN_STACK_SAVE)
2534 gimple_stmt_iterator stack_save_gsi;
2535 tree rhs;
2537 stack_save_gsi = gsi_for_stmt (stack_save);
2538 rhs = build_int_cst (TREE_TYPE (gimple_call_arg (call, 0)), 0);
2539 update_call_from_tree (&stack_save_gsi, rhs);
2544 /* No effect, so the statement will be deleted. */
2545 return integer_zero_node;
2548 /* If va_list type is a simple pointer and nothing special is needed,
2549 optimize __builtin_va_start (&ap, 0) into ap = __builtin_next_arg (0),
2550 __builtin_va_end (&ap) out as NOP and __builtin_va_copy into a simple
2551 pointer assignment. */
2553 static tree
2554 optimize_stdarg_builtin (gimple call)
2556 tree callee, lhs, rhs, cfun_va_list;
2557 bool va_list_simple_ptr;
2558 location_t loc = gimple_location (call);
2560 if (gimple_code (call) != GIMPLE_CALL)
2561 return NULL_TREE;
2563 callee = gimple_call_fndecl (call);
2565 cfun_va_list = targetm.fn_abi_va_list (callee);
2566 va_list_simple_ptr = POINTER_TYPE_P (cfun_va_list)
2567 && (TREE_TYPE (cfun_va_list) == void_type_node
2568 || TREE_TYPE (cfun_va_list) == char_type_node);
2570 switch (DECL_FUNCTION_CODE (callee))
2572 case BUILT_IN_VA_START:
2573 if (!va_list_simple_ptr
2574 || targetm.expand_builtin_va_start != NULL
2575 || !builtin_decl_explicit_p (BUILT_IN_NEXT_ARG))
2576 return NULL_TREE;
2578 if (gimple_call_num_args (call) != 2)
2579 return NULL_TREE;
2581 lhs = gimple_call_arg (call, 0);
2582 if (!POINTER_TYPE_P (TREE_TYPE (lhs))
2583 || TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (lhs)))
2584 != TYPE_MAIN_VARIANT (cfun_va_list))
2585 return NULL_TREE;
2587 lhs = build_fold_indirect_ref_loc (loc, lhs);
2588 rhs = build_call_expr_loc (loc, builtin_decl_explicit (BUILT_IN_NEXT_ARG),
2589 1, integer_zero_node);
2590 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
2591 return build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, rhs);
2593 case BUILT_IN_VA_COPY:
2594 if (!va_list_simple_ptr)
2595 return NULL_TREE;
2597 if (gimple_call_num_args (call) != 2)
2598 return NULL_TREE;
2600 lhs = gimple_call_arg (call, 0);
2601 if (!POINTER_TYPE_P (TREE_TYPE (lhs))
2602 || TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (lhs)))
2603 != TYPE_MAIN_VARIANT (cfun_va_list))
2604 return NULL_TREE;
2606 lhs = build_fold_indirect_ref_loc (loc, lhs);
2607 rhs = gimple_call_arg (call, 1);
2608 if (TYPE_MAIN_VARIANT (TREE_TYPE (rhs))
2609 != TYPE_MAIN_VARIANT (cfun_va_list))
2610 return NULL_TREE;
2612 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
2613 return build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, rhs);
2615 case BUILT_IN_VA_END:
2616 /* No effect, so the statement will be deleted. */
2617 return integer_zero_node;
2619 default:
2620 gcc_unreachable ();
2624 /* Attemp to make the block of __builtin_unreachable I unreachable by changing
2625 the incoming jumps. Return true if at least one jump was changed. */
2627 static bool
2628 optimize_unreachable (gimple_stmt_iterator i)
2630 basic_block bb = gsi_bb (i);
2631 gimple_stmt_iterator gsi;
2632 gimple stmt;
2633 edge_iterator ei;
2634 edge e;
2635 bool ret;
2637 if (flag_sanitize & SANITIZE_UNREACHABLE)
2638 return false;
2640 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2642 stmt = gsi_stmt (gsi);
2644 if (is_gimple_debug (stmt))
2645 continue;
2647 if (glabel *label_stmt = dyn_cast <glabel *> (stmt))
2649 /* Verify we do not need to preserve the label. */
2650 if (FORCED_LABEL (gimple_label_label (label_stmt)))
2651 return false;
2653 continue;
2656 /* Only handle the case that __builtin_unreachable is the first statement
2657 in the block. We rely on DCE to remove stmts without side-effects
2658 before __builtin_unreachable. */
2659 if (gsi_stmt (gsi) != gsi_stmt (i))
2660 return false;
2663 ret = false;
2664 FOR_EACH_EDGE (e, ei, bb->preds)
2666 gsi = gsi_last_bb (e->src);
2667 if (gsi_end_p (gsi))
2668 continue;
2670 stmt = gsi_stmt (gsi);
2671 if (gcond *cond_stmt = dyn_cast <gcond *> (stmt))
2673 if (e->flags & EDGE_TRUE_VALUE)
2674 gimple_cond_make_false (cond_stmt);
2675 else if (e->flags & EDGE_FALSE_VALUE)
2676 gimple_cond_make_true (cond_stmt);
2677 else
2678 gcc_unreachable ();
2679 update_stmt (cond_stmt);
2681 else
2683 /* Todo: handle other cases, f.i. switch statement. */
2684 continue;
2687 ret = true;
2690 return ret;
2693 /* A simple pass that attempts to fold all builtin functions. This pass
2694 is run after we've propagated as many constants as we can. */
2696 namespace {
2698 const pass_data pass_data_fold_builtins =
2700 GIMPLE_PASS, /* type */
2701 "fab", /* name */
2702 OPTGROUP_NONE, /* optinfo_flags */
2703 TV_NONE, /* tv_id */
2704 ( PROP_cfg | PROP_ssa ), /* properties_required */
2705 0, /* properties_provided */
2706 0, /* properties_destroyed */
2707 0, /* todo_flags_start */
2708 TODO_update_ssa, /* todo_flags_finish */
2711 class pass_fold_builtins : public gimple_opt_pass
2713 public:
2714 pass_fold_builtins (gcc::context *ctxt)
2715 : gimple_opt_pass (pass_data_fold_builtins, ctxt)
2718 /* opt_pass methods: */
2719 opt_pass * clone () { return new pass_fold_builtins (m_ctxt); }
2720 virtual unsigned int execute (function *);
2722 }; // class pass_fold_builtins
2724 unsigned int
2725 pass_fold_builtins::execute (function *fun)
2727 bool cfg_changed = false;
2728 basic_block bb;
2729 unsigned int todoflags = 0;
2731 FOR_EACH_BB_FN (bb, fun)
2733 gimple_stmt_iterator i;
2734 for (i = gsi_start_bb (bb); !gsi_end_p (i); )
2736 gimple stmt, old_stmt;
2737 tree callee;
2738 enum built_in_function fcode;
2740 stmt = gsi_stmt (i);
2742 if (gimple_code (stmt) != GIMPLE_CALL)
2744 /* Remove all *ssaname_N ={v} {CLOBBER}; stmts,
2745 after the last GIMPLE DSE they aren't needed and might
2746 unnecessarily keep the SSA_NAMEs live. */
2747 if (gimple_clobber_p (stmt))
2749 tree lhs = gimple_assign_lhs (stmt);
2750 if (TREE_CODE (lhs) == MEM_REF
2751 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
2753 unlink_stmt_vdef (stmt);
2754 gsi_remove (&i, true);
2755 release_defs (stmt);
2756 continue;
2759 gsi_next (&i);
2760 continue;
2763 callee = gimple_call_fndecl (stmt);
2764 if (!callee || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL)
2766 gsi_next (&i);
2767 continue;
2770 fcode = DECL_FUNCTION_CODE (callee);
2771 if (fold_stmt (&i))
2773 else
2775 tree result = NULL_TREE;
2776 switch (DECL_FUNCTION_CODE (callee))
2778 case BUILT_IN_CONSTANT_P:
2779 /* Resolve __builtin_constant_p. If it hasn't been
2780 folded to integer_one_node by now, it's fairly
2781 certain that the value simply isn't constant. */
2782 result = integer_zero_node;
2783 break;
2785 case BUILT_IN_ASSUME_ALIGNED:
2786 /* Remove __builtin_assume_aligned. */
2787 result = gimple_call_arg (stmt, 0);
2788 break;
2790 case BUILT_IN_STACK_RESTORE:
2791 result = optimize_stack_restore (i);
2792 if (result)
2793 break;
2794 gsi_next (&i);
2795 continue;
2797 case BUILT_IN_UNREACHABLE:
2798 if (optimize_unreachable (i))
2799 cfg_changed = true;
2800 break;
2802 case BUILT_IN_VA_START:
2803 case BUILT_IN_VA_END:
2804 case BUILT_IN_VA_COPY:
2805 /* These shouldn't be folded before pass_stdarg. */
2806 result = optimize_stdarg_builtin (stmt);
2807 if (result)
2808 break;
2809 /* FALLTHRU */
2811 default:;
2814 if (!result)
2816 gsi_next (&i);
2817 continue;
2820 if (!update_call_from_tree (&i, result))
2821 gimplify_and_update_call_from_tree (&i, result);
2824 todoflags |= TODO_update_address_taken;
2826 if (dump_file && (dump_flags & TDF_DETAILS))
2828 fprintf (dump_file, "Simplified\n ");
2829 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
2832 old_stmt = stmt;
2833 stmt = gsi_stmt (i);
2834 update_stmt (stmt);
2836 if (maybe_clean_or_replace_eh_stmt (old_stmt, stmt)
2837 && gimple_purge_dead_eh_edges (bb))
2838 cfg_changed = true;
2840 if (dump_file && (dump_flags & TDF_DETAILS))
2842 fprintf (dump_file, "to\n ");
2843 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
2844 fprintf (dump_file, "\n");
2847 /* Retry the same statement if it changed into another
2848 builtin, there might be new opportunities now. */
2849 if (gimple_code (stmt) != GIMPLE_CALL)
2851 gsi_next (&i);
2852 continue;
2854 callee = gimple_call_fndecl (stmt);
2855 if (!callee
2856 || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL
2857 || DECL_FUNCTION_CODE (callee) == fcode)
2858 gsi_next (&i);
2862 /* Delete unreachable blocks. */
2863 if (cfg_changed)
2864 todoflags |= TODO_cleanup_cfg;
2866 return todoflags;
2869 } // anon namespace
2871 gimple_opt_pass *
2872 make_pass_fold_builtins (gcc::context *ctxt)
2874 return new pass_fold_builtins (ctxt);