/* Conditional constant propagation pass for the GNU compiler.
   Copyright (C) 2000-2016 Free Software Foundation, Inc.
   Adapted from original RTL SSA-CCP by Daniel Berlin <dberlin@dberlin.org>
   Adapted to GIMPLE trees by Diego Novillo <dnovillo@redhat.com>

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation; either version 3, or (at your option) any
later version.

GCC is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */

/* Conditional constant propagation (CCP) is based on the SSA
   propagation engine (tree-ssa-propagate.c).  Constant assignments of
   the form VAR = CST are propagated from the assignments into uses of
   VAR, which in turn may generate new constants.  The simulation uses
   a four level lattice to keep track of constant values associated
   with SSA names.  Given an SSA name V_i, it may take one of the
   following values:

	UNINITIALIZED   ->  the initial state of the value.  This value
			    is replaced with a correct initial value
			    the first time the value is used, so the
			    rest of the pass does not need to care about
			    it.  Using this value simplifies initialization
			    of the pass, and prevents us from needlessly
			    scanning statements that are never reached.

	UNDEFINED       ->  V_i is a local variable whose definition
			    has not been processed yet.  Therefore we
			    don't yet know if its value is a constant
			    or not.

	CONSTANT        ->  V_i has been found to hold a constant
			    value C.

	VARYING         ->  V_i cannot take a constant value, or if it
			    does, it is not possible to determine it
			    at compile time.
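
   As an illustration (a hypothetical GIMPLE fragment, not taken from
   any testcase), propagation would assign lattice values as follows:

	x_1 = 4;           <- x_1 becomes CONSTANT 4
	y_2 = x_1 + 1;     <- y_2 becomes CONSTANT 5
	z_3 = y_2 * w_4;   <- w_4 is unknown, so z_3 becomes VARYING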

   The core of SSA-CCP is in ccp_visit_stmt and ccp_visit_phi_node:

   1- In ccp_visit_stmt, we are interested in assignments whose RHS
      evaluates into a constant and conditional jumps whose predicate
      evaluates into a boolean true or false.  When an assignment of
      the form V_i = CONST is found, V_i's lattice value is set to
      CONSTANT and CONST is associated with it.  This causes the
      propagation engine to add all the SSA edges coming out of the
      assignment into the worklists, so that statements that use V_i
      can be visited.

      If the statement is a conditional with a constant predicate, we
      mark the outgoing edges as executable or not executable
      depending on the predicate's value.  This is then used when
      visiting PHI nodes to know when a PHI argument can be ignored.


   2- In ccp_visit_phi_node, if all the PHI arguments evaluate to the
      same constant C, then the LHS of the PHI is set to C.  This
      evaluation is known as the "meet operation".  Since one of the
      goals of this evaluation is to optimistically return constant
      values as often as possible, it uses two main shortcuts:

      - If an argument is flowing in through a non-executable edge, it
        is ignored.  This is useful in cases like this:

			if (PRED)
			  a_9 = 3;
			else
			  a_10 = 100;
			a_11 = PHI (a_9, a_10)

	If PRED is known to always evaluate to false, then we can
	assume that a_11 will always take its value from a_10, meaning
	that instead of considering it VARYING (a_9 and a_10 have
	different values), we can consider it CONSTANT 100.

      - If an argument has an UNDEFINED value, then it does not affect
	the outcome of the meet operation.  If a variable V_i has an
	UNDEFINED value, it means that either its defining statement
	hasn't been visited yet or V_i has no defining statement, in
	which case the original symbol 'V' is being used
	uninitialized.  Since 'V' is a local variable, the compiler
	may assume any initial value for it.
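
	As a sketch of this second shortcut (again a hypothetical
	fragment, for exposition only):

			if (PRED)
			  b_5 = 7;
			b_6 = PHI (b_5, b_7(D))

	Here b_7(D) is the default definition of the uninitialized
	local 'b', so its value is UNDEFINED and the meet ignores it;
	b_6 can optimistically be considered CONSTANT 7.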

   After propagation, every variable V_i that ends up with a lattice
   value of CONSTANT will have the associated constant value in the
   array CONST_VAL[i].VALUE.  That is fed into substitute_and_fold for
   final substitution and folding.

   This algorithm uses wide-ints at the max precision of the target.
   This means that, with one uninteresting exception, variables with
   UNSIGNED types never go to VARYING because the bits above the
   precision of the type of the variable are always zero.  The
   uninteresting case is a variable of UNSIGNED type that has the
   maximum precision of the target.  Such variables can go to VARYING,
   but this causes no loss of information since these variables will
   never be extended.

   References:

     Constant propagation with conditional branches,
     Wegman and Zadeck, ACM TOPLAS 13(2):181-210.

     Building an Optimizing Compiler,
     Robert Morgan, Butterworth-Heinemann, 1998, Section 8.9.

     Advanced Compiler Design and Implementation,
     Steven Muchnick, Morgan Kaufmann, 1997, Section 12.6  */
121 #include "config.h"
122 #include "system.h"
123 #include "coretypes.h"
124 #include "backend.h"
125 #include "target.h"
126 #include "tree.h"
127 #include "gimple.h"
128 #include "tree-pass.h"
129 #include "ssa.h"
130 #include "gimple-pretty-print.h"
131 #include "fold-const.h"
132 #include "gimple-fold.h"
133 #include "tree-eh.h"
134 #include "gimplify.h"
135 #include "gimple-iterator.h"
136 #include "tree-cfg.h"
137 #include "tree-ssa-propagate.h"
138 #include "dbgcnt.h"
139 #include "params.h"
140 #include "builtins.h"
141 #include "tree-chkp.h"
142 #include "cfgloop.h"
143 #include "stor-layout.h"
144 #include "optabs-query.h"
145 #include "tree-ssa-ccp.h"

/* Possible lattice values.  */
typedef enum
{
  UNINITIALIZED,
  UNDEFINED,
  CONSTANT,
  VARYING
} ccp_lattice_t;

struct ccp_prop_value_t {
  /* Lattice value.  */
  ccp_lattice_t lattice_val;

  /* Propagated value.  */
  tree value;

  /* Mask that applies to the propagated value during CCP.  For X
     with a CONSTANT lattice value X & ~mask == value & ~mask.  The
     zero bits in the mask cover constant values.  The ones mean no
     information.  */
  widest_int mask;
};
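
/* For example (purely illustrative): a CONSTANT lattice value with
   value == 4 and mask == 3 describes an X whose two low bits are
   unknown and whose higher bits are all known to be zero, i.e. X is
   one of 4, 5, 6 or 7.  A mask of zero means the value is fully
   known.  */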

/* Array of propagated constant values.  After propagation,
   CONST_VAL[I].VALUE holds the constant value for SSA_NAME(I).  If
   the constant is held in an SSA name representing a memory store
   (i.e., a VDEF), CONST_VAL[I].MEM_REF will contain the actual
   memory reference used to store (i.e., the LHS of the assignment
   doing the store).  */
static ccp_prop_value_t *const_val;
static unsigned n_const_val;

static void canonicalize_value (ccp_prop_value_t *);
static bool ccp_fold_stmt (gimple_stmt_iterator *);
static void ccp_lattice_meet (ccp_prop_value_t *, ccp_prop_value_t *);

/* Dump constant propagation value VAL to file OUTF prefixed by PREFIX.  */

static void
dump_lattice_value (FILE *outf, const char *prefix, ccp_prop_value_t val)
{
  switch (val.lattice_val)
    {
    case UNINITIALIZED:
      fprintf (outf, "%sUNINITIALIZED", prefix);
      break;
    case UNDEFINED:
      fprintf (outf, "%sUNDEFINED", prefix);
      break;
    case VARYING:
      fprintf (outf, "%sVARYING", prefix);
      break;
    case CONSTANT:
      if (TREE_CODE (val.value) != INTEGER_CST
	  || val.mask == 0)
	{
	  fprintf (outf, "%sCONSTANT ", prefix);
	  print_generic_expr (outf, val.value, dump_flags);
	}
      else
	{
	  widest_int cval = wi::bit_and_not (wi::to_widest (val.value),
					     val.mask);
	  fprintf (outf, "%sCONSTANT ", prefix);
	  print_hex (cval, outf);
	  fprintf (outf, " (");
	  print_hex (val.mask, outf);
	  fprintf (outf, ")");
	}
      break;
    default:
      gcc_unreachable ();
    }
}

/* Print lattice value VAL to stderr.  */

void debug_lattice_value (ccp_prop_value_t val);

DEBUG_FUNCTION void
debug_lattice_value (ccp_prop_value_t val)
{
  dump_lattice_value (stderr, "", val);
  fprintf (stderr, "\n");
}

/* Extend NONZERO_BITS to a full mask, based on sgn.  */

static widest_int
extend_mask (const wide_int &nonzero_bits, signop sgn)
{
  return widest_int::from (nonzero_bits, sgn);
}

/* Compute a default value for variable VAR and store it in the
   CONST_VAL array.  The following rules are used to get default
   values:

   1- Global and static variables that are declared constant are
      considered CONSTANT.

   2- Any other value is considered UNDEFINED.  This is useful when
      considering PHI nodes.  PHI arguments that are undefined do not
      change the constant value of the PHI node, which allows for more
      constants to be propagated.

   3- Variables defined by statements other than assignments and PHI
      nodes are considered VARYING.

   4- Initial values of variables that are not GIMPLE registers are
      considered VARYING.  */

static ccp_prop_value_t
get_default_value (tree var)
{
  ccp_prop_value_t val = { UNINITIALIZED, NULL_TREE, 0 };
  gimple *stmt;

  stmt = SSA_NAME_DEF_STMT (var);

  if (gimple_nop_p (stmt))
    {
      /* Variables defined by an empty statement are those used
	 before being initialized.  If VAR is a local variable, we
	 can assume initially that it is UNDEFINED, otherwise we must
	 consider it VARYING.  */
      if (!virtual_operand_p (var)
	  && SSA_NAME_VAR (var)
	  && TREE_CODE (SSA_NAME_VAR (var)) == VAR_DECL)
	val.lattice_val = UNDEFINED;
      else
	{
	  val.lattice_val = VARYING;
	  val.mask = -1;
	  if (flag_tree_bit_ccp)
	    {
	      wide_int nonzero_bits = get_nonzero_bits (var);
	      if (nonzero_bits != -1)
		{
		  val.lattice_val = CONSTANT;
		  val.value = build_zero_cst (TREE_TYPE (var));
		  val.mask = extend_mask (nonzero_bits,
					  TYPE_SIGN (TREE_TYPE (var)));
		}
	    }
	}
    }
  else if (is_gimple_assign (stmt))
    {
      tree cst;
      if (gimple_assign_single_p (stmt)
	  && DECL_P (gimple_assign_rhs1 (stmt))
	  && (cst = get_symbol_constant_value (gimple_assign_rhs1 (stmt))))
	{
	  val.lattice_val = CONSTANT;
	  val.value = cst;
	}
      else
	{
	  /* Any other variable defined by an assignment is considered
	     UNDEFINED.  */
	  val.lattice_val = UNDEFINED;
	}
    }
  else if ((is_gimple_call (stmt)
	    && gimple_call_lhs (stmt) != NULL_TREE)
	   || gimple_code (stmt) == GIMPLE_PHI)
    {
      /* A variable defined by a call or a PHI node is considered
	 UNDEFINED.  */
      val.lattice_val = UNDEFINED;
    }
  else
    {
      /* Otherwise, VAR will never take on a constant value.  */
      val.lattice_val = VARYING;
      val.mask = -1;
    }

  return val;
}

/* Get the constant value associated with variable VAR.  */

static inline ccp_prop_value_t *
get_value (tree var)
{
  ccp_prop_value_t *val;

  if (const_val == NULL
      || SSA_NAME_VERSION (var) >= n_const_val)
    return NULL;

  val = &const_val[SSA_NAME_VERSION (var)];
  if (val->lattice_val == UNINITIALIZED)
    *val = get_default_value (var);

  canonicalize_value (val);

  return val;
}

/* Return the constant tree value associated with VAR.  */

static inline tree
get_constant_value (tree var)
{
  ccp_prop_value_t *val;
  if (TREE_CODE (var) != SSA_NAME)
    {
      if (is_gimple_min_invariant (var))
	return var;
      return NULL_TREE;
    }
  val = get_value (var);
  if (val
      && val->lattice_val == CONSTANT
      && (TREE_CODE (val->value) != INTEGER_CST
	  || val->mask == 0))
    return val->value;
  return NULL_TREE;
}

/* Sets the value associated with VAR to VARYING.  */

static inline void
set_value_varying (tree var)
{
  ccp_prop_value_t *val = &const_val[SSA_NAME_VERSION (var)];

  val->lattice_val = VARYING;
  val->value = NULL_TREE;
  val->mask = -1;
}

/* For integer constants, make sure to drop TREE_OVERFLOW.  */

static void
canonicalize_value (ccp_prop_value_t *val)
{
  if (val->lattice_val != CONSTANT)
    return;

  if (TREE_OVERFLOW_P (val->value))
    val->value = drop_tree_overflow (val->value);
}

/* Return whether the lattice transition is valid.  */

static bool
valid_lattice_transition (ccp_prop_value_t old_val, ccp_prop_value_t new_val)
{
  /* Lattice transitions must always be monotonically increasing in
     value.  */
  if (old_val.lattice_val < new_val.lattice_val)
    return true;

  if (old_val.lattice_val != new_val.lattice_val)
    return false;

  if (!old_val.value && !new_val.value)
    return true;

  /* Now both lattice values are CONSTANT.  */

  /* Allow arbitrary copy changes as we might look through PHI <a_1, ...>
     when only a single copy edge is executable.  */
  if (TREE_CODE (old_val.value) == SSA_NAME
      && TREE_CODE (new_val.value) == SSA_NAME)
    return true;

  /* Allow transitioning from a constant to a copy.  */
  if (is_gimple_min_invariant (old_val.value)
      && TREE_CODE (new_val.value) == SSA_NAME)
    return true;

  /* Allow transitioning from PHI <&x, not executable> == &x
     to PHI <&x, &y> == common alignment.  */
  if (TREE_CODE (old_val.value) != INTEGER_CST
      && TREE_CODE (new_val.value) == INTEGER_CST)
    return true;

  /* Bit-lattices have to agree in the still valid bits.  */
  if (TREE_CODE (old_val.value) == INTEGER_CST
      && TREE_CODE (new_val.value) == INTEGER_CST)
    return (wi::bit_and_not (wi::to_widest (old_val.value), new_val.mask)
	    == wi::bit_and_not (wi::to_widest (new_val.value), new_val.mask));

  /* Otherwise constant values have to agree.  */
  if (operand_equal_p (old_val.value, new_val.value, 0))
    return true;

  /* At least the kinds and types should agree now.  */
  if (TREE_CODE (old_val.value) != TREE_CODE (new_val.value)
      || !types_compatible_p (TREE_TYPE (old_val.value),
			      TREE_TYPE (new_val.value)))
    return false;

  /* For floats and !HONOR_NANS allow transitions from (partial) NaN
     to non-NaN.  */
  tree type = TREE_TYPE (new_val.value);
  if (SCALAR_FLOAT_TYPE_P (type)
      && !HONOR_NANS (type))
    {
      if (REAL_VALUE_ISNAN (TREE_REAL_CST (old_val.value)))
	return true;
    }
  else if (VECTOR_FLOAT_TYPE_P (type)
	   && !HONOR_NANS (type))
    {
      for (unsigned i = 0; i < VECTOR_CST_NELTS (old_val.value); ++i)
	if (!REAL_VALUE_ISNAN
	       (TREE_REAL_CST (VECTOR_CST_ELT (old_val.value, i)))
	    && !operand_equal_p (VECTOR_CST_ELT (old_val.value, i),
				 VECTOR_CST_ELT (new_val.value, i), 0))
	  return false;
      return true;
    }
  else if (COMPLEX_FLOAT_TYPE_P (type)
	   && !HONOR_NANS (type))
    {
      if (!REAL_VALUE_ISNAN (TREE_REAL_CST (TREE_REALPART (old_val.value)))
	  && !operand_equal_p (TREE_REALPART (old_val.value),
			       TREE_REALPART (new_val.value), 0))
	return false;
      if (!REAL_VALUE_ISNAN (TREE_REAL_CST (TREE_IMAGPART (old_val.value)))
	  && !operand_equal_p (TREE_IMAGPART (old_val.value),
			       TREE_IMAGPART (new_val.value), 0))
	return false;
      return true;
    }
  return false;
}

/* Set the value for variable VAR to NEW_VAL.  Return true if the new
   value is different from VAR's previous value.  */

static bool
set_lattice_value (tree var, ccp_prop_value_t *new_val)
{
  /* We can deal with old UNINITIALIZED values just fine here.  */
  ccp_prop_value_t *old_val = &const_val[SSA_NAME_VERSION (var)];

  canonicalize_value (new_val);

  /* We have to be careful to not go up the bitwise lattice
     represented by the mask.  Instead of dropping to VARYING
     use the meet operator to retain a conservative value.
     Missed optimizations like PR65851 make this necessary.
     It also ensures we converge to a stable lattice solution.  */
  if (new_val->lattice_val == CONSTANT
      && old_val->lattice_val == CONSTANT
      && TREE_CODE (new_val->value) != SSA_NAME)
    ccp_lattice_meet (new_val, old_val);

  gcc_checking_assert (valid_lattice_transition (*old_val, *new_val));

  /* If *OLD_VAL and NEW_VAL are the same, return false to inform the
     caller that this was a non-transition.  */
  if (old_val->lattice_val != new_val->lattice_val
      || (new_val->lattice_val == CONSTANT
	  && (TREE_CODE (new_val->value) != TREE_CODE (old_val->value)
	      || (TREE_CODE (new_val->value) == INTEGER_CST
		  && (new_val->mask != old_val->mask
		      || (wi::bit_and_not (wi::to_widest (old_val->value),
					   new_val->mask)
			  != wi::bit_and_not (wi::to_widest (new_val->value),
					      new_val->mask))))
	      || (TREE_CODE (new_val->value) != INTEGER_CST
		  && !operand_equal_p (new_val->value, old_val->value, 0)))))
    {
      /* ??? We would like to delay creation of INTEGER_CSTs from
	 partially constant values here.  */

      if (dump_file && (dump_flags & TDF_DETAILS))
	{
	  dump_lattice_value (dump_file, "Lattice value changed to ",
			      *new_val);
	  fprintf (dump_file, ".  Adding SSA edges to worklist.\n");
	}

      *old_val = *new_val;

      gcc_assert (new_val->lattice_val != UNINITIALIZED);
      return true;
    }

  return false;
}

static ccp_prop_value_t get_value_for_expr (tree, bool);
static ccp_prop_value_t bit_value_binop (enum tree_code, tree, tree, tree);
void bit_value_binop (enum tree_code, signop, int, widest_int *, widest_int *,
		      signop, int, const widest_int &, const widest_int &,
		      signop, int, const widest_int &, const widest_int &);

/* Return a widest_int that can be used for bitwise simplifications
   from VAL.  */

static widest_int
value_to_wide_int (ccp_prop_value_t val)
{
  if (val.value
      && TREE_CODE (val.value) == INTEGER_CST)
    return wi::to_widest (val.value);

  return 0;
}

/* Return the value for the address expression EXPR based on alignment
   information.  */
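
/* For instance (illustrative only): if EXPR is &a for a variable 'a'
   with 16-byte alignment, the result below is CONSTANT with value 0
   and a mask whose low four bits are clear: the low four bits of the
   address are known to be zero, while the bits above them, up to the
   pointer precision, are unknown.  */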

static ccp_prop_value_t
get_value_from_alignment (tree expr)
{
  tree type = TREE_TYPE (expr);
  ccp_prop_value_t val;
  unsigned HOST_WIDE_INT bitpos;
  unsigned int align;

  gcc_assert (TREE_CODE (expr) == ADDR_EXPR);

  get_pointer_alignment_1 (expr, &align, &bitpos);
  val.mask = (POINTER_TYPE_P (type) || TYPE_UNSIGNED (type)
	      ? wi::mask <widest_int> (TYPE_PRECISION (type), false)
	      : -1).and_not (align / BITS_PER_UNIT - 1);
  val.lattice_val
    = wi::sext (val.mask, TYPE_PRECISION (type)) == -1 ? VARYING : CONSTANT;
  if (val.lattice_val == CONSTANT)
    val.value = build_int_cstu (type, bitpos / BITS_PER_UNIT);
  else
    val.value = NULL_TREE;

  return val;
}

/* Return the value for the tree operand EXPR.  If FOR_BITS_P is true
   return constant bits extracted from alignment information for
   invariant addresses.  */

static ccp_prop_value_t
get_value_for_expr (tree expr, bool for_bits_p)
{
  ccp_prop_value_t val;

  if (TREE_CODE (expr) == SSA_NAME)
    {
      ccp_prop_value_t *val_ = get_value (expr);
      if (val_)
	val = *val_;
      else
	{
	  val.lattice_val = VARYING;
	  val.value = NULL_TREE;
	  val.mask = -1;
	}
      if (for_bits_p
	  && val.lattice_val == CONSTANT
	  && TREE_CODE (val.value) == ADDR_EXPR)
	val = get_value_from_alignment (val.value);
      /* Fall back to a copy value.  */
      if (!for_bits_p
	  && val.lattice_val == VARYING
	  && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (expr))
	{
	  val.lattice_val = CONSTANT;
	  val.value = expr;
	  val.mask = -1;
	}
    }
  else if (is_gimple_min_invariant (expr)
	   && (!for_bits_p || TREE_CODE (expr) != ADDR_EXPR))
    {
      val.lattice_val = CONSTANT;
      val.value = expr;
      val.mask = 0;
      canonicalize_value (&val);
    }
  else if (TREE_CODE (expr) == ADDR_EXPR)
    val = get_value_from_alignment (expr);
  else
    {
      val.lattice_val = VARYING;
      val.mask = -1;
      val.value = NULL_TREE;
    }

  if (val.lattice_val == VARYING
      && TYPE_UNSIGNED (TREE_TYPE (expr)))
    val.mask = wi::zext (val.mask, TYPE_PRECISION (TREE_TYPE (expr)));

  return val;
}

/* Return the likely CCP lattice value for STMT.

   If STMT has no operands, then return CONSTANT.

   Else if undefinedness of operands of STMT causes its value to be
   undefined, then return UNDEFINED.

   Else if any operands of STMT are constants, then return CONSTANT.

   Else return VARYING.  */

static ccp_lattice_t
likely_value (gimple *stmt)
{
  bool has_constant_operand, has_undefined_operand, all_undefined_operands;
  bool has_nsa_operand;
  tree use;
  ssa_op_iter iter;
  unsigned i;

  enum gimple_code code = gimple_code (stmt);

  /* This function appears to be called only for assignments, calls,
     conditionals, and switches, due to the logic in visit_stmt.  */
  gcc_assert (code == GIMPLE_ASSIGN
	      || code == GIMPLE_CALL
	      || code == GIMPLE_COND
	      || code == GIMPLE_SWITCH);

  /* If the statement has volatile operands, it won't fold to a
     constant value.  */
  if (gimple_has_volatile_ops (stmt))
    return VARYING;

  /* Arrive here for more complex cases.  */
  has_constant_operand = false;
  has_undefined_operand = false;
  all_undefined_operands = true;
  has_nsa_operand = false;
  FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
    {
      ccp_prop_value_t *val = get_value (use);

      if (val && val->lattice_val == UNDEFINED)
	has_undefined_operand = true;
      else
	all_undefined_operands = false;

      if (val && val->lattice_val == CONSTANT)
	has_constant_operand = true;

      if (SSA_NAME_IS_DEFAULT_DEF (use)
	  || !prop_simulate_again_p (SSA_NAME_DEF_STMT (use)))
	has_nsa_operand = true;
    }

  /* There may be constants in regular rhs operands.  For calls we
     have to ignore lhs, fndecl and static chain, otherwise only
     the lhs.  */
  for (i = (is_gimple_call (stmt) ? 2 : 0) + gimple_has_lhs (stmt);
       i < gimple_num_ops (stmt); ++i)
    {
      tree op = gimple_op (stmt, i);
      if (!op || TREE_CODE (op) == SSA_NAME)
	continue;
      if (is_gimple_min_invariant (op))
	has_constant_operand = true;
    }

  if (has_constant_operand)
    all_undefined_operands = false;

  if (has_undefined_operand
      && code == GIMPLE_CALL
      && gimple_call_internal_p (stmt))
    switch (gimple_call_internal_fn (stmt))
      {
	/* These 3 builtins use the first argument just as a magic
	   way how to find out a decl uid.  */
      case IFN_GOMP_SIMD_LANE:
      case IFN_GOMP_SIMD_VF:
      case IFN_GOMP_SIMD_LAST_LANE:
	has_undefined_operand = false;
	break;
      default:
	break;
      }

  /* If the operation combines operands like COMPLEX_EXPR make sure to
     not mark the result UNDEFINED if only one part of the result is
     undefined.  */
  if (has_undefined_operand && all_undefined_operands)
    return UNDEFINED;
  else if (code == GIMPLE_ASSIGN && has_undefined_operand)
    {
      switch (gimple_assign_rhs_code (stmt))
	{
	/* Unary operators are handled with all_undefined_operands.  */
	case PLUS_EXPR:
	case MINUS_EXPR:
	case POINTER_PLUS_EXPR:
	  /* Not MIN_EXPR, MAX_EXPR.  One VARYING operand may be selected.
	     Not bitwise operators, one VARYING operand may specify the
	     result completely.  Not logical operators for the same reason.
	     Not COMPLEX_EXPR as one VARYING operand makes the result partly
	     not UNDEFINED.  Not *DIV_EXPR, comparisons and shifts because
	     the undefined operand may be promoted.  */
	  return UNDEFINED;

	case ADDR_EXPR:
	  /* If any part of an address is UNDEFINED, like the index
	     of an ARRAY_EXPR, then treat the result as UNDEFINED.  */
	  return UNDEFINED;

	default:
	  break;
	}
    }
  /* If there was an UNDEFINED operand but the result may be not UNDEFINED
     fall back to CONSTANT.  During iteration UNDEFINED may still drop
     to CONSTANT.  */
  if (has_undefined_operand)
    return CONSTANT;

  /* We do not consider virtual operands here -- load from read-only
     memory may have only VARYING virtual operands, but still be
     constant.  Also we can combine the stmt with definitions from
     operands whose definitions are not simulated again.  */
  if (has_constant_operand
      || has_nsa_operand
      || gimple_references_memory_p (stmt))
    return CONSTANT;

  return VARYING;
}

/* Returns true if STMT cannot be constant.  */

static bool
surely_varying_stmt_p (gimple *stmt)
{
  /* If the statement has operands that we cannot handle, it cannot be
     constant.  */
  if (gimple_has_volatile_ops (stmt))
    return true;

  /* If it is a call and does not return a value or is not a
     builtin and not an indirect call or a call to a function with
     assume_aligned/alloc_align attribute, it is varying.  */
  if (is_gimple_call (stmt))
    {
      tree fndecl, fntype = gimple_call_fntype (stmt);
      if (!gimple_call_lhs (stmt)
	  || ((fndecl = gimple_call_fndecl (stmt)) != NULL_TREE
	      && !DECL_BUILT_IN (fndecl)
	      && !lookup_attribute ("assume_aligned",
				    TYPE_ATTRIBUTES (fntype))
	      && !lookup_attribute ("alloc_align",
				    TYPE_ATTRIBUTES (fntype))))
	return true;
    }

  /* Any other store operation is not interesting.  */
  else if (gimple_vdef (stmt))
    return true;

  /* Anything other than assignments and conditional jumps is not
     interesting for CCP.  */
  if (gimple_code (stmt) != GIMPLE_ASSIGN
      && gimple_code (stmt) != GIMPLE_COND
      && gimple_code (stmt) != GIMPLE_SWITCH
      && gimple_code (stmt) != GIMPLE_CALL)
    return true;

  return false;
}

/* Initialize local data structures for CCP.  */

static void
ccp_initialize (void)
{
  basic_block bb;

  n_const_val = num_ssa_names;
  const_val = XCNEWVEC (ccp_prop_value_t, n_const_val);

  /* Initialize simulation flags for PHI nodes and statements.  */
  FOR_EACH_BB_FN (bb, cfun)
    {
      gimple_stmt_iterator i;

      for (i = gsi_start_bb (bb); !gsi_end_p (i); gsi_next (&i))
	{
	  gimple *stmt = gsi_stmt (i);
	  bool is_varying;

	  /* If the statement is a control insn, we always want to
	     simulate it at least once; otherwise its outgoing edges
	     would never get added.  */
	  if (stmt_ends_bb_p (stmt))
	    is_varying = false;
	  else
	    is_varying = surely_varying_stmt_p (stmt);

	  if (is_varying)
	    {
	      tree def;
	      ssa_op_iter iter;

	      /* If the statement will not produce a constant, mark
		 all its outputs VARYING.  */
	      FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
		set_value_varying (def);
	    }
	  prop_set_simulate_again (stmt, !is_varying);
	}
    }

  /* Now process PHI nodes.  We never clear the simulate_again flag on
     phi nodes, since we do not know which edges are executable yet,
     except for phi nodes for virtual operands when we do not do store ccp.  */
  FOR_EACH_BB_FN (bb, cfun)
    {
      gphi_iterator i;

      for (i = gsi_start_phis (bb); !gsi_end_p (i); gsi_next (&i))
	{
	  gphi *phi = i.phi ();

	  if (virtual_operand_p (gimple_phi_result (phi)))
	    prop_set_simulate_again (phi, false);
	  else
	    prop_set_simulate_again (phi, true);
	}
    }
}

/* Debug count support.  Reset the values of ssa names
   VARYING when the total number of ssa names analyzed is
   beyond the debug count specified.  */

static void
do_dbg_cnt (void)
{
  unsigned i;
  for (i = 0; i < num_ssa_names; i++)
    {
      if (!dbg_cnt (ccp))
	{
	  const_val[i].lattice_val = VARYING;
	  const_val[i].mask = -1;
	  const_val[i].value = NULL_TREE;
	}
    }
}

/* Do final substitution of propagated values, clean up the flowgraph and
   free allocated storage.  If NONZERO_P, record nonzero bits.

   Return TRUE when something was optimized.  */

static bool
ccp_finalize (bool nonzero_p)
{
  bool something_changed;
  unsigned i;
  tree name;

  do_dbg_cnt ();

  /* Derive alignment and misalignment information from partially
     constant pointers in the lattice or nonzero bits from partially
     constant integers.  */
  FOR_EACH_SSA_NAME (i, name, cfun)
    {
      ccp_prop_value_t *val;
      unsigned int tem, align;

      if (!POINTER_TYPE_P (TREE_TYPE (name))
	  && (!INTEGRAL_TYPE_P (TREE_TYPE (name))
	      /* Don't record nonzero bits before IPA to avoid
		 using too much memory.  */
	      || !nonzero_p))
	continue;

      val = get_value (name);
      if (val->lattice_val != CONSTANT
	  || TREE_CODE (val->value) != INTEGER_CST
	  || val->mask == 0)
	continue;

      if (POINTER_TYPE_P (TREE_TYPE (name)))
	{
	  /* Trailing mask bits specify the alignment, trailing value
	     bits the misalignment.  */
	  tem = val->mask.to_uhwi ();
	  align = least_bit_hwi (tem);
	  if (align > 1)
	    set_ptr_info_alignment (get_ptr_info (name), align,
				    (TREE_INT_CST_LOW (val->value)
				     & (align - 1)));
	}
      else
	{
	  unsigned int precision = TYPE_PRECISION (TREE_TYPE (val->value));
	  wide_int nonzero_bits = wide_int::from (val->mask, precision,
						  UNSIGNED) | val->value;
	  nonzero_bits &= get_nonzero_bits (name);
	  set_nonzero_bits (name, nonzero_bits);
	}
    }

  /* Perform substitutions based on the known constant values.  */
  something_changed = substitute_and_fold (get_constant_value, ccp_fold_stmt);

  free (const_val);
  const_val = NULL;
  return something_changed;
}

/* Compute the meet operator between *VAL1 and *VAL2.  Store the result
   in VAL1.

		any M UNDEFINED = any
		any M VARYING   = VARYING
		Ci  M Cj        = Ci       if (i == j)
		Ci  M Cj        = VARYING  if (i != j)
   */
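
/* A small worked example of the INTEGER_CST case below (numbers chosen
   purely for illustration): meeting CONSTANT 4 (mask 0) with CONSTANT 5
   (mask 0) ors the differing bit into the mask, yielding value 4 with
   mask 1 -- "100 or 101, low bit unknown" -- instead of dropping
   straight to VARYING.  */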

static void
ccp_lattice_meet (ccp_prop_value_t *val1, ccp_prop_value_t *val2)
{
  if (val1->lattice_val == UNDEFINED
      /* For UNDEFINED M SSA we can't always pick the SSA name because
	 its definition may not dominate the PHI node.  Doing optimistic
	 copy propagation also causes a lot of gcc.dg/uninit-pred*.c
	 FAILs.  */
      && (val2->lattice_val != CONSTANT
	  || TREE_CODE (val2->value) != SSA_NAME))
    {
      /* UNDEFINED M any = any   */
      *val1 = *val2;
    }
  else if (val2->lattice_val == UNDEFINED
	   /* See above.  */
	   && (val1->lattice_val != CONSTANT
	       || TREE_CODE (val1->value) != SSA_NAME))
    {
      /* any M UNDEFINED = any
	 Nothing to do.  VAL1 already contains the value we want.  */
      ;
    }
  else if (val1->lattice_val == VARYING
	   || val2->lattice_val == VARYING)
    {
      /* any M VARYING = VARYING.  */
      val1->lattice_val = VARYING;
      val1->mask = -1;
      val1->value = NULL_TREE;
    }
  else if (val1->lattice_val == CONSTANT
	   && val2->lattice_val == CONSTANT
	   && TREE_CODE (val1->value) == INTEGER_CST
	   && TREE_CODE (val2->value) == INTEGER_CST)
    {
      /* Ci M Cj = Ci       if (i == j)
	 Ci M Cj = VARYING  if (i != j)

	 For INTEGER_CSTs mask unequal bits.  If no equal bits remain,
	 drop to varying.  */
      val1->mask = (val1->mask | val2->mask
		    | (wi::to_widest (val1->value)
		       ^ wi::to_widest (val2->value)));
      if (wi::sext (val1->mask,
		    TYPE_PRECISION (TREE_TYPE (val1->value))) == -1)
	{
	  val1->lattice_val = VARYING;
	  val1->value = NULL_TREE;
	}
    }
  else if (val1->lattice_val == CONSTANT
	   && val2->lattice_val == CONSTANT
	   && operand_equal_p (val1->value, val2->value, 0))
    {
      /* Ci M Cj = Ci       if (i == j)
	 Ci M Cj = VARYING  if (i != j)

	 VAL1 already contains the value we want for equivalent values.  */
    }
  else if (val1->lattice_val == CONSTANT
	   && val2->lattice_val == CONSTANT
	   && (TREE_CODE (val1->value) == ADDR_EXPR
	       || TREE_CODE (val2->value) == ADDR_EXPR))
    {
      /* When not equal addresses are involved try meeting for
	 alignment.  */
      ccp_prop_value_t tem = *val2;
      if (TREE_CODE (val1->value) == ADDR_EXPR)
	*val1 = get_value_for_expr (val1->value, true);
      if (TREE_CODE (val2->value) == ADDR_EXPR)
	tem = get_value_for_expr (val2->value, true);
      ccp_lattice_meet (val1, &tem);
    }
  else
    {
      /* Any other combination is VARYING.  */
      val1->lattice_val = VARYING;
      val1->mask = -1;
      val1->value = NULL_TREE;
    }
}

/* Loop through the PHI_NODE's parameters for BLOCK and compare their
   lattice values to determine PHI_NODE's lattice value.  The value of a
   PHI node is determined by calling ccp_lattice_meet on all the arguments
   of the PHI node that are incoming via executable edges.  */

static enum ssa_prop_result
ccp_visit_phi_node (gphi *phi)
{
  unsigned i;
  ccp_prop_value_t new_val;

  if (dump_file && (dump_flags & TDF_DETAILS))
    {
      fprintf (dump_file, "\nVisiting PHI node: ");
      print_gimple_stmt (dump_file, phi, 0, dump_flags);
    }

  new_val.lattice_val = UNDEFINED;
  new_val.value = NULL_TREE;
  new_val.mask = 0;

  bool first = true;
  bool non_exec_edge = false;
  for (i = 0; i < gimple_phi_num_args (phi); i++)
    {
      /* Compute the meet operator over all the PHI arguments flowing
	 through executable edges.  */
      edge e = gimple_phi_arg_edge (phi, i);

      if (dump_file && (dump_flags & TDF_DETAILS))
	{
	  fprintf (dump_file,
		   "\n    Argument #%d (%d -> %d %sexecutable)\n",
		   i, e->src->index, e->dest->index,
		   (e->flags & EDGE_EXECUTABLE) ? "" : "not ");
	}

      /* If the incoming edge is executable, compute the meet operator for
	 the existing value of the PHI node and the current PHI argument.  */
      if (e->flags & EDGE_EXECUTABLE)
	{
	  tree arg = gimple_phi_arg (phi, i)->def;
	  ccp_prop_value_t arg_val = get_value_for_expr (arg, false);

	  if (first)
	    {
	      new_val = arg_val;
	      first = false;
	    }
	  else
	    ccp_lattice_meet (&new_val, &arg_val);

	  if (dump_file && (dump_flags & TDF_DETAILS))
	    {
	      fprintf (dump_file, "\t");
	      print_generic_expr (dump_file, arg, dump_flags);
	      dump_lattice_value (dump_file, "\tValue: ", arg_val);
	      fprintf (dump_file, "\n");
	    }

	  if (new_val.lattice_val == VARYING)
	    break;
	}
      else
	non_exec_edge = true;
    }

  /* In case there were non-executable edges and the value is a copy
     make sure its definition dominates the PHI node.  */
  if (non_exec_edge
      && new_val.lattice_val == CONSTANT
      && TREE_CODE (new_val.value) == SSA_NAME
      && ! SSA_NAME_IS_DEFAULT_DEF (new_val.value)
      && ! dominated_by_p (CDI_DOMINATORS, gimple_bb (phi),
			   gimple_bb (SSA_NAME_DEF_STMT (new_val.value))))
    {
      new_val.lattice_val = VARYING;
      new_val.value = NULL_TREE;
      new_val.mask = -1;
    }

  if (dump_file && (dump_flags & TDF_DETAILS))
    {
      dump_lattice_value (dump_file, "\n    PHI node value: ", new_val);
      fprintf (dump_file, "\n\n");
    }

  /* Make the transition to the new value.  */
  if (set_lattice_value (gimple_phi_result (phi), &new_val))
    {
      if (new_val.lattice_val == VARYING)
	return SSA_PROP_VARYING;
      else
	return SSA_PROP_INTERESTING;
    }
  else
    return SSA_PROP_NOT_INTERESTING;
}

/* Return the constant value for OP or OP otherwise.  */

static tree
valueize_op (tree op)
{
  if (TREE_CODE (op) == SSA_NAME)
    {
      tree tem = get_constant_value (op);
      if (tem)
	return tem;
    }
  return op;
}

/* Return the constant value for OP, but signal to not follow SSA
   edges if the definition may be simulated again.  */

static tree
valueize_op_1 (tree op)
{
  if (TREE_CODE (op) == SSA_NAME)
    {
      /* If the definition may be simulated again we cannot follow
	 this SSA edge as the SSA propagator does not necessarily
	 re-visit the use.  */
      gimple *def_stmt = SSA_NAME_DEF_STMT (op);
      if (!gimple_nop_p (def_stmt)
	  && prop_simulate_again_p (def_stmt))
	return NULL_TREE;
      tree tem = get_constant_value (op);
      if (tem)
	return tem;
    }
  return op;
}

/* CCP specific front-end to the non-destructive constant folding
   routines.

   Attempt to simplify the RHS of STMT knowing that one or more
   operands are constants.

   If simplification is possible, return the simplified RHS,
   otherwise return the original RHS or NULL_TREE.  */

static tree
ccp_fold (gimple *stmt)
{
  location_t loc = gimple_location (stmt);
  switch (gimple_code (stmt))
    {
    case GIMPLE_COND:
      {
	/* Handle comparison operators that can appear in GIMPLE form.  */
	tree op0 = valueize_op (gimple_cond_lhs (stmt));
	tree op1 = valueize_op (gimple_cond_rhs (stmt));
	enum tree_code code = gimple_cond_code (stmt);
	return fold_binary_loc (loc, code, boolean_type_node, op0, op1);
      }

    case GIMPLE_SWITCH:
      {
	/* Return the constant switch index.  */
	return valueize_op (gimple_switch_index (as_a <gswitch *> (stmt)));
      }

    case GIMPLE_ASSIGN:
    case GIMPLE_CALL:
      return gimple_fold_stmt_to_constant_1 (stmt,
					     valueize_op, valueize_op_1);

    default:
      gcc_unreachable ();
    }
}

/* Apply the operation CODE in type TYPE to the value, mask pair
   RVAL and RMASK representing a value of type RTYPE and set
   the value, mask pair *VAL and *MASK to the result.  */

void
bit_value_unop (enum tree_code code, signop type_sgn, int type_precision,
		widest_int *val, widest_int *mask,
		signop rtype_sgn, int rtype_precision,
		const widest_int &rval, const widest_int &rmask)
{
  switch (code)
    {
    case BIT_NOT_EXPR:
      *mask = rmask;
      *val = ~rval;
      break;

    case NEGATE_EXPR:
      {
	widest_int temv, temm;
	/* Return ~rval + 1.  */
	bit_value_unop (BIT_NOT_EXPR, type_sgn, type_precision, &temv, &temm,
			type_sgn, type_precision, rval, rmask);
	bit_value_binop (PLUS_EXPR, type_sgn, type_precision, val, mask,
			 type_sgn, type_precision, temv, temm,
			 type_sgn, type_precision, 1, 0);
	break;
      }

    CASE_CONVERT:
      {
	/* First extend mask and value according to the original type.  */
	*mask = wi::ext (rmask, rtype_precision, rtype_sgn);
	*val = wi::ext (rval, rtype_precision, rtype_sgn);

	/* Then extend mask and value according to the target type.  */
	*mask = wi::ext (*mask, type_precision, type_sgn);
	*val = wi::ext (*val, type_precision, type_sgn);
	break;
      }

    default:
      *mask = -1;
      break;
    }
}

/* Apply the operation CODE in type TYPE to the value, mask pairs
   R1VAL, R1MASK and R2VAL, R2MASK representing values of type R1TYPE
   and R2TYPE and set the value, mask pair *VAL and *MASK to the result.  */

void
bit_value_binop (enum tree_code code, signop sgn, int width,
		 widest_int *val, widest_int *mask,
		 signop r1type_sgn, int r1type_precision,
		 const widest_int &r1val, const widest_int &r1mask,
		 signop r2type_sgn, int r2type_precision,
		 const widest_int &r2val, const widest_int &r2mask)
{
  bool swap_p = false;

  /* Assume we'll get a constant result.  Use an initial non varying
     value, we fall back to varying in the end if necessary.  */
  *mask = -1;

  switch (code)
    {
    case BIT_AND_EXPR:
      /* The mask is constant where there is a known not
	 set bit, (m1 | m2) & ((v1 | m1) & (v2 | m2))  */
      *mask = (r1mask | r2mask) & (r1val | r1mask) & (r2val | r2mask);
      *val = r1val & r2val;
      break;
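
      /* Illustration (not from the sources): for x & 0xf0 with x fully
	 unknown (v1 = 0, m1 = -1) and 0xf0 fully known (v2 = 0xf0,
	 m2 = 0), the formula gives mask = -1 & (0 | -1) & (0xf0 | 0)
	 = 0xf0 and val = 0: the low four bits are known to be zero and
	 only the 0xf0 bits remain unknown.  */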

    case BIT_IOR_EXPR:
      /* The mask is constant where there is a known
	 set bit, (m1 | m2) & ~((v1 & ~m1) | (v2 & ~m2)).  */
      *mask = (r1mask | r2mask)
	      .and_not (r1val.and_not (r1mask) | r2val.and_not (r2mask));
      *val = r1val | r2val;
      break;

    case BIT_XOR_EXPR:
      /* m1 | m2  */
      *mask = r1mask | r2mask;
      *val = r1val ^ r2val;
      break;

    case LROTATE_EXPR:
    case RROTATE_EXPR:
      if (r2mask == 0)
	{
	  widest_int shift = r2val;
	  if (shift == 0)
	    {
	      *mask = r1mask;
	      *val = r1val;
	    }
	  else
	    {
	      if (wi::neg_p (shift))
		{
		  shift = -shift;
		  if (code == RROTATE_EXPR)
		    code = LROTATE_EXPR;
		  else
		    code = RROTATE_EXPR;
		}
	      if (code == RROTATE_EXPR)
		{
		  *mask = wi::rrotate (r1mask, shift, width);
		  *val = wi::rrotate (r1val, shift, width);
		}
	      else
		{
		  *mask = wi::lrotate (r1mask, shift, width);
		  *val = wi::lrotate (r1val, shift, width);
		}
	    }
	}
      break;

    case LSHIFT_EXPR:
    case RSHIFT_EXPR:
      /* ??? We can handle partially known shift counts if we know
	 its sign.  That way we can tell that (x << (y | 8)) & 255
	 is zero.  */
      if (r2mask == 0)
	{
	  widest_int shift = r2val;
	  if (shift == 0)
	    {
	      *mask = r1mask;
	      *val = r1val;
	    }
	  else
	    {
	      if (wi::neg_p (shift))
		{
		  shift = -shift;
		  if (code == RSHIFT_EXPR)
		    code = LSHIFT_EXPR;
		  else
		    code = RSHIFT_EXPR;
		}
	      if (code == RSHIFT_EXPR)
		{
		  *mask = wi::rshift (wi::ext (r1mask, width, sgn), shift, sgn);
		  *val = wi::rshift (wi::ext (r1val, width, sgn), shift, sgn);
		}
	      else
		{
		  *mask = wi::ext (r1mask << shift, width, sgn);
		  *val = wi::ext (r1val << shift, width, sgn);
		}
	    }
	}
      break;

    case PLUS_EXPR:
    case POINTER_PLUS_EXPR:
      {
	/* Do the addition with unknown bits set to zero, to give carry-ins of
	   zero wherever possible.  */
	widest_int lo = r1val.and_not (r1mask) + r2val.and_not (r2mask);
	lo = wi::ext (lo, width, sgn);
	/* Do the addition with unknown bits set to one, to give carry-ins of
	   one wherever possible.  */
	widest_int hi = (r1val | r1mask) + (r2val | r2mask);
	hi = wi::ext (hi, width, sgn);
	/* Each bit in the result is known if (a) the corresponding bits in
	   both inputs are known, and (b) the carry-in to that bit position
	   is known.  We can check condition (b) by seeing if we got the same
	   result with minimised carries as with maximised carries.  */
	*mask = r1mask | r2mask | (lo ^ hi);
	*mask = wi::ext (*mask, width, sgn);
	/* It shouldn't matter whether we choose lo or hi here.  */
	*val = lo;
	break;
      }
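
      /* Worked example (illustrative): adding the constant 1 to an x
	 known to be 0 or 1 (v = 0, m = 1) gives lo = 0 + 1 = 1 and
	 hi = 1 + 1 = 2, so mask = 1 | 0 | (1 ^ 2) = 3 and val = 1.
	 The lattice then records the two low bits as unknown and all
	 higher bits as zero, a conservative superset of the exact
	 result set {1, 2}.  */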

    case MINUS_EXPR:
      {
	widest_int temv, temm;
	bit_value_unop (NEGATE_EXPR, r2type_sgn, r2type_precision,
			&temv, &temm,
			r2type_sgn, r2type_precision, r2val, r2mask);
	bit_value_binop (PLUS_EXPR, sgn, width, val, mask,
			 r1type_sgn, r1type_precision, r1val, r1mask,
			 r2type_sgn, r2type_precision, temv, temm);
	break;
      }

    case MULT_EXPR:
      {
	/* Just track trailing zeros in both operands and transfer
	   them to the other.  */
	int r1tz = wi::ctz (r1val | r1mask);
	int r2tz = wi::ctz (r2val | r2mask);
	if (r1tz + r2tz >= width)
	  {
	    *mask = 0;
	    *val = 0;
	  }
	else if (r1tz + r2tz > 0)
	  {
	    *mask = wi::ext (wi::mask <widest_int> (r1tz + r2tz, true),
			     width, sgn);
	    *val = 0;
	  }
	break;
      }

    case EQ_EXPR:
    case NE_EXPR:
      {
	widest_int m = r1mask | r2mask;
	if (r1val.and_not (m) != r2val.and_not (m))
	  {
	    *mask = 0;
	    *val = ((code == EQ_EXPR) ? 0 : 1);
	  }
	else
	  {
	    /* We know the result of a comparison is always one or zero.  */
	    *mask = 1;
	    *val = 0;
	  }
	break;
      }

    case GE_EXPR:
    case GT_EXPR:
      swap_p = true;
      code = swap_tree_comparison (code);
      /* Fall through.  */
    case LT_EXPR:
    case LE_EXPR:
      {
	int minmax, maxmin;

	const widest_int &o1val = swap_p ? r2val : r1val;
	const widest_int &o1mask = swap_p ? r2mask : r1mask;
	const widest_int &o2val = swap_p ? r1val : r2val;
	const widest_int &o2mask = swap_p ? r1mask : r2mask;

	/* If the most significant bits are not known we know nothing.  */
	if (wi::neg_p (o1mask) || wi::neg_p (o2mask))
	  break;

	/* For comparisons the signedness is in the comparison operands.  */
	sgn = r1type_sgn;

	/* If we know the most significant bits we know the values'
	   ranges by means of treating varying bits as zero
	   or one.  Do a cross comparison of the max/min pairs.  */
	maxmin = wi::cmp (o1val | o1mask, o2val.and_not (o2mask), sgn);
	minmax = wi::cmp (o1val.and_not (o1mask), o2val | o2mask, sgn);
	if (maxmin < 0)  /* o1 is less than o2.  */
	  {
	    *mask = 0;
	    *val = 1;
	  }
	else if (minmax > 0)  /* o1 is not less or equal to o2.  */
	  {
	    *mask = 0;
	    *val = 0;
	  }
	else if (maxmin == minmax)  /* o1 and o2 are equal.  */
	  {
	    /* This probably should never happen as we'd have
	       folded the thing during fully constant value folding.  */
	    *mask = 0;
	    *val = (code == LE_EXPR ? 1 : 0);
	  }
	else
	  {
	    /* We know the result of a comparison is always one or zero.  */
	    *mask = 1;
	    *val = 0;
	  }
	break;
      }

    default:;
    }
}

/* Return the propagation value when applying the operation CODE to
   the value RHS yielding type TYPE.  */

static ccp_prop_value_t
bit_value_unop (enum tree_code code, tree type, tree rhs)
{
  ccp_prop_value_t rval = get_value_for_expr (rhs, true);
  widest_int value, mask;
  ccp_prop_value_t val;

  if (rval.lattice_val == UNDEFINED)
    return rval;

  gcc_assert ((rval.lattice_val == CONSTANT
	       && TREE_CODE (rval.value) == INTEGER_CST)
	      || wi::sext (rval.mask, TYPE_PRECISION (TREE_TYPE (rhs))) == -1);
  bit_value_unop (code, TYPE_SIGN (type), TYPE_PRECISION (type),
		  &value, &mask,
		  TYPE_SIGN (TREE_TYPE (rhs)), TYPE_PRECISION (TREE_TYPE (rhs)),
		  value_to_wide_int (rval), rval.mask);
  if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
    {
      val.lattice_val = CONSTANT;
      val.mask = mask;
      /* ??? Delay building trees here.  */
      val.value = wide_int_to_tree (type, value);
    }
  else
    {
      val.lattice_val = VARYING;
      val.value = NULL_TREE;
      val.mask = -1;
    }
  return val;
}

/* Return the propagation value when applying the operation CODE to
   the values RHS1 and RHS2 yielding type TYPE.  */

static ccp_prop_value_t
bit_value_binop (enum tree_code code, tree type, tree rhs1, tree rhs2)
{
  ccp_prop_value_t r1val = get_value_for_expr (rhs1, true);
  ccp_prop_value_t r2val = get_value_for_expr (rhs2, true);
  widest_int value, mask;
  ccp_prop_value_t val;

  if (r1val.lattice_val == UNDEFINED
      || r2val.lattice_val == UNDEFINED)
    {
      val.lattice_val = VARYING;
      val.value = NULL_TREE;
      val.mask = -1;
      return val;
    }

  gcc_assert ((r1val.lattice_val == CONSTANT
	       && TREE_CODE (r1val.value) == INTEGER_CST)
	      || wi::sext (r1val.mask,
			   TYPE_PRECISION (TREE_TYPE (rhs1))) == -1);
  gcc_assert ((r2val.lattice_val == CONSTANT
	       && TREE_CODE (r2val.value) == INTEGER_CST)
	      || wi::sext (r2val.mask,
			   TYPE_PRECISION (TREE_TYPE (rhs2))) == -1);
  bit_value_binop (code, TYPE_SIGN (type), TYPE_PRECISION (type),
		   &value, &mask,
		   TYPE_SIGN (TREE_TYPE (rhs1)),
		   TYPE_PRECISION (TREE_TYPE (rhs1)),
		   value_to_wide_int (r1val), r1val.mask,
		   TYPE_SIGN (TREE_TYPE (rhs2)),
		   TYPE_PRECISION (TREE_TYPE (rhs2)),
		   value_to_wide_int (r2val), r2val.mask);

  if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
    {
      val.lattice_val = CONSTANT;
      val.mask = mask;
      /* ??? Delay building trees here.  */
      val.value = wide_int_to_tree (type, value);
    }
  else
    {
      val.lattice_val = VARYING;
      val.value = NULL_TREE;
      val.mask = -1;
    }
  return val;
}

/* Return the propagation value for __builtin_assume_aligned
   and functions with assume_aligned or alloc_aligned attribute.
   For __builtin_assume_aligned, ATTR is NULL_TREE,
   for assume_aligned attribute ATTR is non-NULL and ALLOC_ALIGNED
   is false, for alloc_aligned attribute ATTR is non-NULL and
   ALLOC_ALIGNED is true.  */
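
/* For example, a declaration along the lines of (illustrative, with a
   hypothetical function name):

     void *my_alloc (size_t) __attribute__ ((assume_aligned (16, 8)));

   lets the return value be treated as CONSTANT 8 with mask ~15:
   known to be 8 mod 16, with all higher bits unknown.  */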

static ccp_prop_value_t
bit_value_assume_aligned (gimple *stmt, tree attr, ccp_prop_value_t ptrval,
			  bool alloc_aligned)
{
  tree align, misalign = NULL_TREE, type;
  unsigned HOST_WIDE_INT aligni, misaligni = 0;
  ccp_prop_value_t alignval;
  widest_int value, mask;
  ccp_prop_value_t val;

  if (attr == NULL_TREE)
    {
      tree ptr = gimple_call_arg (stmt, 0);
      type = TREE_TYPE (ptr);
      ptrval = get_value_for_expr (ptr, true);
    }
  else
    {
      tree lhs = gimple_call_lhs (stmt);
      type = TREE_TYPE (lhs);
    }

  if (ptrval.lattice_val == UNDEFINED)
    return ptrval;
  gcc_assert ((ptrval.lattice_val == CONSTANT
	       && TREE_CODE (ptrval.value) == INTEGER_CST)
	      || wi::sext (ptrval.mask, TYPE_PRECISION (type)) == -1);
  if (attr == NULL_TREE)
    {
      /* Get aligni and misaligni from __builtin_assume_aligned.  */
      align = gimple_call_arg (stmt, 1);
      if (!tree_fits_uhwi_p (align))
	return ptrval;
      aligni = tree_to_uhwi (align);
      if (gimple_call_num_args (stmt) > 2)
	{
	  misalign = gimple_call_arg (stmt, 2);
	  if (!tree_fits_uhwi_p (misalign))
	    return ptrval;
	  misaligni = tree_to_uhwi (misalign);
	}
    }
  else
    {
      /* Get aligni and misaligni from assume_aligned or
	 alloc_align attributes.  */
      if (TREE_VALUE (attr) == NULL_TREE)
	return ptrval;
      attr = TREE_VALUE (attr);
      align = TREE_VALUE (attr);
      if (!tree_fits_uhwi_p (align))
	return ptrval;
      aligni = tree_to_uhwi (align);
      if (alloc_aligned)
	{
	  if (aligni == 0 || aligni > gimple_call_num_args (stmt))
	    return ptrval;
	  align = gimple_call_arg (stmt, aligni - 1);
	  if (!tree_fits_uhwi_p (align))
	    return ptrval;
	  aligni = tree_to_uhwi (align);
	}
      else if (TREE_CHAIN (attr) && TREE_VALUE (TREE_CHAIN (attr)))
	{
	  misalign = TREE_VALUE (TREE_CHAIN (attr));
	  if (!tree_fits_uhwi_p (misalign))
	    return ptrval;
	  misaligni = tree_to_uhwi (misalign);
	}
    }
  if (aligni <= 1 || (aligni & (aligni - 1)) != 0 || misaligni >= aligni)
    return ptrval;

  align = build_int_cst_type (type, -aligni);
  alignval = get_value_for_expr (align, true);
  bit_value_binop (BIT_AND_EXPR, TYPE_SIGN (type), TYPE_PRECISION (type),
		   &value, &mask,
		   TYPE_SIGN (type), TYPE_PRECISION (type),
		   value_to_wide_int (ptrval), ptrval.mask,
		   TYPE_SIGN (type), TYPE_PRECISION (type),
		   value_to_wide_int (alignval), alignval.mask);

  if (wi::sext (mask, TYPE_PRECISION (type)) != -1)
    {
      val.lattice_val = CONSTANT;
      val.mask = mask;
      gcc_assert ((mask.to_uhwi () & (aligni - 1)) == 0);
      gcc_assert ((value.to_uhwi () & (aligni - 1)) == 0);
      value |= misaligni;
      /* ??? Delay building trees here.  */
      val.value = wide_int_to_tree (type, value);
    }
  else
    {
      val.lattice_val = VARYING;
      val.value = NULL_TREE;
      val.mask = -1;
    }
  return val;
}

/* Evaluate statement STMT.
   Valid only for assignments, calls, conditionals, and switches.  */

static ccp_prop_value_t
evaluate_stmt (gimple *stmt)
{
  ccp_prop_value_t val;
  tree simplified = NULL_TREE;
  ccp_lattice_t likelyvalue = likely_value (stmt);
  bool is_constant = false;
  unsigned int align;

  if (dump_file && (dump_flags & TDF_DETAILS))
    {
      fprintf (dump_file, "which is likely ");
      switch (likelyvalue)
	{
	case CONSTANT:
	  fprintf (dump_file, "CONSTANT");
	  break;
	case UNDEFINED:
	  fprintf (dump_file, "UNDEFINED");
	  break;
	case VARYING:
	  fprintf (dump_file, "VARYING");
	  break;
	default:;
	}
      fprintf (dump_file, "\n");
    }

  /* If the statement is likely to have a CONSTANT result, then try
     to fold the statement to determine the constant value.  */
  /* FIXME.  This is the only place that we call ccp_fold.
     Since likely_value never returns CONSTANT for calls, we will
     not attempt to fold them, including builtins that may profit.  */
  if (likelyvalue == CONSTANT)
    {
      fold_defer_overflow_warnings ();
      simplified = ccp_fold (stmt);
      if (simplified && TREE_CODE (simplified) == SSA_NAME)
	{
	  ccp_prop_value_t *val = get_value (simplified);
	  if (val && val->lattice_val != VARYING)
	    {
	      fold_undefer_overflow_warnings (true, stmt, 0);
	      return *val;
	    }
	}
      is_constant = simplified && is_gimple_min_invariant (simplified);
      fold_undefer_overflow_warnings (is_constant, stmt, 0);
      if (is_constant)
	{
	  /* The statement produced a constant value.  */
	  val.lattice_val = CONSTANT;
	  val.value = simplified;
	  val.mask = 0;
	  return val;
	}
    }
  /* If the statement is likely to have a VARYING result, then do not
     bother folding the statement.  */
  else if (likelyvalue == VARYING)
    {
      enum gimple_code code = gimple_code (stmt);
      if (code == GIMPLE_ASSIGN)
	{
	  enum tree_code subcode = gimple_assign_rhs_code (stmt);

	  /* Other cases cannot satisfy is_gimple_min_invariant
	     without folding.  */
	  if (get_gimple_rhs_class (subcode) == GIMPLE_SINGLE_RHS)
	    simplified = gimple_assign_rhs1 (stmt);
	}
      else if (code == GIMPLE_SWITCH)
	simplified = gimple_switch_index (as_a <gswitch *> (stmt));
      else
	/* These cannot satisfy is_gimple_min_invariant without folding.  */
	gcc_assert (code == GIMPLE_CALL || code == GIMPLE_COND);
      is_constant = simplified && is_gimple_min_invariant (simplified);
      if (is_constant)
	{
	  /* The statement produced a constant value.  */
	  val.lattice_val = CONSTANT;
	  val.value = simplified;
	  val.mask = 0;
	}
    }
  /* If the statement result is likely UNDEFINED, make it so.  */
  else if (likelyvalue == UNDEFINED)
    {
      val.lattice_val = UNDEFINED;
      val.value = NULL_TREE;
      val.mask = 0;
      return val;
    }

  /* Resort to simplification for bitwise tracking.  */
  if (flag_tree_bit_ccp
      && (likelyvalue == CONSTANT || is_gimple_call (stmt)
	  || (gimple_assign_single_p (stmt)
	      && gimple_assign_rhs_code (stmt) == ADDR_EXPR))
      && !is_constant)
    {
      enum gimple_code code = gimple_code (stmt);
      val.lattice_val = VARYING;
      val.value = NULL_TREE;
      val.mask = -1;
      if (code == GIMPLE_ASSIGN)
	{
	  enum tree_code subcode = gimple_assign_rhs_code (stmt);
	  tree rhs1 = gimple_assign_rhs1 (stmt);
	  tree lhs = gimple_assign_lhs (stmt);
	  if ((INTEGRAL_TYPE_P (TREE_TYPE (lhs))
	       || POINTER_TYPE_P (TREE_TYPE (lhs)))
	      && (INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
		  || POINTER_TYPE_P (TREE_TYPE (rhs1))))
	    switch (get_gimple_rhs_class (subcode))
	      {
	      case GIMPLE_SINGLE_RHS:
		val = get_value_for_expr (rhs1, true);
		break;

	      case GIMPLE_UNARY_RHS:
		val = bit_value_unop (subcode, TREE_TYPE (lhs), rhs1);
		break;

	      case GIMPLE_BINARY_RHS:
		val = bit_value_binop (subcode, TREE_TYPE (lhs), rhs1,
				       gimple_assign_rhs2 (stmt));
		break;

	      default:;
	      }
	}
      else if (code == GIMPLE_COND)
	{
	  enum tree_code code = gimple_cond_code (stmt);
	  tree rhs1 = gimple_cond_lhs (stmt);
	  tree rhs2 = gimple_cond_rhs (stmt);
	  if (INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
	      || POINTER_TYPE_P (TREE_TYPE (rhs1)))
	    val = bit_value_binop (code, TREE_TYPE (rhs1), rhs1, rhs2);
	}
      else if (gimple_call_builtin_p (stmt, BUILT_IN_NORMAL))
	{
	  tree fndecl = gimple_call_fndecl (stmt);
	  switch (DECL_FUNCTION_CODE (fndecl))
	    {
	    case BUILT_IN_MALLOC:
	    case BUILT_IN_REALLOC:
	    case BUILT_IN_CALLOC:
	    case BUILT_IN_STRDUP:
	    case BUILT_IN_STRNDUP:
	      val.lattice_val = CONSTANT;
	      val.value = build_int_cst (TREE_TYPE (gimple_get_lhs (stmt)), 0);
	      val.mask = ~((HOST_WIDE_INT) MALLOC_ABI_ALIGNMENT
			   / BITS_PER_UNIT - 1);
	      break;

	    case BUILT_IN_ALLOCA:
	    case BUILT_IN_ALLOCA_WITH_ALIGN:
	      align = (DECL_FUNCTION_CODE (fndecl) == BUILT_IN_ALLOCA_WITH_ALIGN
		       ? TREE_INT_CST_LOW (gimple_call_arg (stmt, 1))
		       : BIGGEST_ALIGNMENT);
	      val.lattice_val = CONSTANT;
	      val.value = build_int_cst (TREE_TYPE (gimple_get_lhs (stmt)), 0);
	      val.mask = ~((HOST_WIDE_INT) align / BITS_PER_UNIT - 1);
	      break;

	    /* These builtins return their first argument, unmodified.  */
	    case BUILT_IN_MEMCPY:
	    case BUILT_IN_MEMMOVE:
	    case BUILT_IN_MEMSET:
	    case BUILT_IN_STRCPY:
	    case BUILT_IN_STRNCPY:
	    case BUILT_IN_MEMCPY_CHK:
	    case BUILT_IN_MEMMOVE_CHK:
	    case BUILT_IN_MEMSET_CHK:
	    case BUILT_IN_STRCPY_CHK:
	    case BUILT_IN_STRNCPY_CHK:
	      val = get_value_for_expr (gimple_call_arg (stmt, 0), true);
	      break;

	    case BUILT_IN_ASSUME_ALIGNED:
	      val = bit_value_assume_aligned (stmt, NULL_TREE, val, false);
	      break;

	    case BUILT_IN_ALIGNED_ALLOC:
	      {
		tree align = get_constant_value (gimple_call_arg (stmt, 0));
		if (align
		    && tree_fits_uhwi_p (align))
		  {
		    unsigned HOST_WIDE_INT aligni = tree_to_uhwi (align);
		    if (aligni > 1
			/* align must be power-of-two */
			&& (aligni & (aligni - 1)) == 0)
		      {
			val.lattice_val = CONSTANT;
			val.value = build_int_cst (ptr_type_node, 0);
			val.mask = -aligni;
		      }
		  }
		break;
	      }

	    default:;
	    }
	}
      if (is_gimple_call (stmt) && gimple_call_lhs (stmt))
	{
	  tree fntype = gimple_call_fntype (stmt);
	  if (fntype)
	    {
	      tree attrs = lookup_attribute ("assume_aligned",
					     TYPE_ATTRIBUTES (fntype));
	      if (attrs)
		val = bit_value_assume_aligned (stmt, attrs, val, false);
	      attrs = lookup_attribute ("alloc_align",
					TYPE_ATTRIBUTES (fntype));
	      if (attrs)
		val = bit_value_assume_aligned (stmt, attrs, val, true);
	    }
	}
      is_constant = (val.lattice_val == CONSTANT);
    }

  if (flag_tree_bit_ccp
      && ((is_constant && TREE_CODE (val.value) == INTEGER_CST)
	  || !is_constant)
      && gimple_get_lhs (stmt)
      && TREE_CODE (gimple_get_lhs (stmt)) == SSA_NAME)
    {
      tree lhs = gimple_get_lhs (stmt);
      wide_int nonzero_bits = get_nonzero_bits (lhs);
      if (nonzero_bits != -1)
	{
	  if (!is_constant)
	    {
	      val.lattice_val = CONSTANT;
	      val.value = build_zero_cst (TREE_TYPE (lhs));
	      val.mask = extend_mask (nonzero_bits,
				      TYPE_SIGN (TREE_TYPE (lhs)));
	      is_constant = true;
	    }
	  else
	    {
	      if (wi::bit_and_not (val.value, nonzero_bits) != 0)
		val.value = wide_int_to_tree (TREE_TYPE (lhs),
					      nonzero_bits & val.value);
	      if (nonzero_bits == 0)
		val.mask = 0;
	      else
		val.mask = val.mask & extend_mask (nonzero_bits,
						   TYPE_SIGN (TREE_TYPE (lhs)));
	    }
	}
    }

  /* The statement produced a nonconstant value.  */
  if (!is_constant)
    {
      /* The statement produced a copy.  */
      if (simplified && TREE_CODE (simplified) == SSA_NAME
	  && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (simplified))
	{
	  val.lattice_val = CONSTANT;
	  val.value = simplified;
	  val.mask = -1;
	}
      /* The statement is VARYING.  */
      else
	{
	  val.lattice_val = VARYING;
	  val.value = NULL_TREE;
	  val.mask = -1;
	}
    }

  return val;
}
1989 typedef hash_table<nofree_ptr_hash<gimple> > gimple_htab;
1991 /* Given a BUILT_IN_STACK_SAVE value SAVED_VAL, insert a clobber of VAR before
1992 each matching BUILT_IN_STACK_RESTORE. Mark visited phis in VISITED. */
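/* For illustration (invented SSA names): given

     saved_2 = __builtin_stack_save ();
     ...
     __builtin_stack_restore (saved_2);

   a "var = {v} {CLOBBER};" assignment is inserted right before the
   restore; phis and SSA-name copies of SAVED_VAL are followed
   recursively.  */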
1994 static void
1995 insert_clobber_before_stack_restore (tree saved_val, tree var,
1996 gimple_htab **visited)
1998 gimple *stmt;
1999 gassign *clobber_stmt;
2000 tree clobber;
2001 imm_use_iterator iter;
2002 gimple_stmt_iterator i;
2003 gimple **slot;
2005 FOR_EACH_IMM_USE_STMT (stmt, iter, saved_val)
2006 if (gimple_call_builtin_p (stmt, BUILT_IN_STACK_RESTORE))
2008 clobber = build_constructor (TREE_TYPE (var),
2009 NULL);
2010 TREE_THIS_VOLATILE (clobber) = 1;
2011 clobber_stmt = gimple_build_assign (var, clobber);
2013 i = gsi_for_stmt (stmt);
2014 gsi_insert_before (&i, clobber_stmt, GSI_SAME_STMT);
2016 else if (gimple_code (stmt) == GIMPLE_PHI)
2018 if (!*visited)
2019 *visited = new gimple_htab (10);
2021 slot = (*visited)->find_slot (stmt, INSERT);
2022 if (*slot != NULL)
2023 continue;
2025 *slot = stmt;
2026 insert_clobber_before_stack_restore (gimple_phi_result (stmt), var,
2027 visited);
2029 else if (gimple_assign_ssa_name_copy_p (stmt))
2030 insert_clobber_before_stack_restore (gimple_assign_lhs (stmt), var,
2031 visited);
2032 else if (chkp_gimple_call_builtin_p (stmt, BUILT_IN_CHKP_BNDRET))
2033 continue;
2034 else
2035 gcc_assert (is_gimple_debug (stmt));
2038 /* Advance the iterator to the previous non-debug gimple statement in the same
2039 or dominating basic block. */
2041 static inline void
2042 gsi_prev_dom_bb_nondebug (gimple_stmt_iterator *i)
2044 basic_block dom;
2046 gsi_prev_nondebug (i);
2047 while (gsi_end_p (*i))
2049 dom = get_immediate_dominator (CDI_DOMINATORS, i->bb);
2050 if (dom == NULL || dom == ENTRY_BLOCK_PTR_FOR_FN (cfun))
2051 return;
2053 *i = gsi_last_bb (dom);
2057 /* Find a BUILT_IN_STACK_SAVE dominating gsi_stmt (I), and insert
2058 a clobber of VAR before each matching BUILT_IN_STACK_RESTORE.
2060 It is possible that BUILT_IN_STACK_SAVE cannot be found in a dominator when a
2061 previous pass (such as DOM) duplicated it along multiple paths to a BB. In
2062 that case the function gives up without inserting the clobbers. */
2064 static void
2065 insert_clobbers_for_var (gimple_stmt_iterator i, tree var)
2067 gimple *stmt;
2068 tree saved_val;
2069 gimple_htab *visited = NULL;
2071 for (; !gsi_end_p (i); gsi_prev_dom_bb_nondebug (&i))
2073 stmt = gsi_stmt (i);
2075 if (!gimple_call_builtin_p (stmt, BUILT_IN_STACK_SAVE))
2076 continue;
2078 saved_val = gimple_call_lhs (stmt);
2079 if (saved_val == NULL_TREE)
2080 continue;
2082 insert_clobber_before_stack_restore (saved_val, var, &visited);
2083 break;
2086 delete visited;
2089 /* Detect a __builtin_alloca_with_align with a constant size argument. If
2090 found, declare a fixed-size array in its place and return the address of
2091 the array; otherwise return NULL_TREE. */
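/* For example (illustrative only; the second argument is the
   alignment in bits):

     p_1 = __builtin_alloca_with_align (16, 64);

   can be folded to p_1 = &D.1234 for a fresh 16-byte local array
   D.1234 with DECL_ALIGN of 64.  */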
2093 static tree
2094 fold_builtin_alloca_with_align (gimple *stmt)
2096 unsigned HOST_WIDE_INT size, threshold, n_elem;
2097 tree lhs, arg, block, var, elem_type, array_type;
2099 /* Get lhs. */
2100 lhs = gimple_call_lhs (stmt);
2101 if (lhs == NULL_TREE)
2102 return NULL_TREE;
2104 /* Detect constant argument. */
2105 arg = get_constant_value (gimple_call_arg (stmt, 0));
2106 if (arg == NULL_TREE
2107 || TREE_CODE (arg) != INTEGER_CST
2108 || !tree_fits_uhwi_p (arg))
2109 return NULL_TREE;
2111 size = tree_to_uhwi (arg);
2113 /* Heuristic: don't fold large allocas. */
2114 threshold = (unsigned HOST_WIDE_INT) PARAM_VALUE (PARAM_LARGE_STACK_FRAME);
2115 /* If the alloca is located at function entry, it has the same lifetime
2116 as a declared array, so we allow a larger size. */
2117 block = gimple_block (stmt);
2118 if (!(cfun->after_inlining
2119 && block
2120 && TREE_CODE (BLOCK_SUPERCONTEXT (block)) == FUNCTION_DECL))
2121 threshold /= 10;
2122 if (size > threshold)
2123 return NULL_TREE;
2125 /* Declare array. */
2126 elem_type = build_nonstandard_integer_type (BITS_PER_UNIT, 1);
2127 n_elem = size * 8 / BITS_PER_UNIT;
2128 array_type = build_array_type_nelts (elem_type, n_elem);
2129 var = create_tmp_var (array_type);
2130 SET_DECL_ALIGN (var, TREE_INT_CST_LOW (gimple_call_arg (stmt, 1)));
2132 struct ptr_info_def *pi = SSA_NAME_PTR_INFO (lhs);
2133 if (pi != NULL && !pi->pt.anything)
2135 bool singleton_p;
2136 unsigned uid;
2137 singleton_p = pt_solution_singleton_or_null_p (&pi->pt, &uid);
2138 gcc_assert (singleton_p);
2139 SET_DECL_PT_UID (var, uid);
2143 /* Fold alloca to the address of the array. */
2144 return fold_convert (TREE_TYPE (lhs), build_fold_addr_expr (var));
2147 /* Fold the stmt at *GSI with CCP specific information that propagating
2148 and regular folding does not catch. */
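/* E.g. (a sketch, not an exhaustive description) a predicate such as
   "if (x_1 != 0)" can be folded here when bit-CCP proved that some
   bit of x_1 is always set: x_1 itself is not a full constant, but
   the comparison result is known.  */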
2150 static bool
2151 ccp_fold_stmt (gimple_stmt_iterator *gsi)
2153 gimple *stmt = gsi_stmt (*gsi);
2155 switch (gimple_code (stmt))
2157 case GIMPLE_COND:
2159 gcond *cond_stmt = as_a <gcond *> (stmt);
2160 ccp_prop_value_t val;
2161 /* Statement evaluation will handle type mismatches in constants
2162 more gracefully than the final propagation. This allows us to
2163 fold more conditionals here. */
2164 val = evaluate_stmt (stmt);
2165 if (val.lattice_val != CONSTANT
2166 || val.mask != 0)
2167 return false;
2169 if (dump_file)
2171 fprintf (dump_file, "Folding predicate ");
2172 print_gimple_expr (dump_file, stmt, 0, 0);
2173 fprintf (dump_file, " to ");
2174 print_generic_expr (dump_file, val.value, 0);
2175 fprintf (dump_file, "\n");
2178 if (integer_zerop (val.value))
2179 gimple_cond_make_false (cond_stmt);
2180 else
2181 gimple_cond_make_true (cond_stmt);
2183 return true;
2186 case GIMPLE_CALL:
2188 tree lhs = gimple_call_lhs (stmt);
2189 int flags = gimple_call_flags (stmt);
2190 tree val;
2191 tree argt;
2192 bool changed = false;
2193 unsigned i;
2195 /* If the call was folded into a constant, make sure it goes
2196 away even if we cannot propagate into all uses because of
2197 type issues. */
2198 if (lhs
2199 && TREE_CODE (lhs) == SSA_NAME
2200 && (val = get_constant_value (lhs))
2201 /* Don't optimize away calls that have side-effects. */
2202 && (flags & (ECF_CONST|ECF_PURE)) != 0
2203 && (flags & ECF_LOOPING_CONST_OR_PURE) == 0)
2205 tree new_rhs = unshare_expr (val);
2206 bool res;
2207 if (!useless_type_conversion_p (TREE_TYPE (lhs),
2208 TREE_TYPE (new_rhs)))
2209 new_rhs = fold_convert (TREE_TYPE (lhs), new_rhs);
2210 res = update_call_from_tree (gsi, new_rhs);
2211 gcc_assert (res);
2212 return true;
2215 /* Internal calls provide no argument types, so the extra laxity
2216 for normal calls does not apply. */
2217 if (gimple_call_internal_p (stmt))
2218 return false;
2220 /* The heuristic of fold_builtin_alloca_with_align differs before and
2221 after inlining, so we don't require the argument to have already been
2222 replaced by a constant, only that it evaluates to one. */
2223 if (gimple_call_builtin_p (stmt, BUILT_IN_ALLOCA_WITH_ALIGN))
2225 tree new_rhs = fold_builtin_alloca_with_align (stmt);
2226 if (new_rhs)
2228 bool res = update_call_from_tree (gsi, new_rhs);
2229 tree var = TREE_OPERAND (TREE_OPERAND (new_rhs, 0), 0);
2230 gcc_assert (res);
2231 insert_clobbers_for_var (*gsi, var);
2232 return true;
2236 /* Propagate into the call arguments. Compared to replace_uses_in
2237 this can use the argument slot types for type verification
2238 instead of the current argument type. We also can safely
2239 drop qualifiers here as we are dealing with constants anyway. */
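/* E.g. (hypothetical) if arg_2 was found to hold the constant 5, a
   call foo (arg_2) is rewritten to foo (5), provided the constant is
   compatible with the declared parameter type.  */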
2240 argt = TYPE_ARG_TYPES (gimple_call_fntype (stmt));
2241 for (i = 0; i < gimple_call_num_args (stmt) && argt;
2242 ++i, argt = TREE_CHAIN (argt))
2244 tree arg = gimple_call_arg (stmt, i);
2245 if (TREE_CODE (arg) == SSA_NAME
2246 && (val = get_constant_value (arg))
2247 && useless_type_conversion_p
2248 (TYPE_MAIN_VARIANT (TREE_VALUE (argt)),
2249 TYPE_MAIN_VARIANT (TREE_TYPE (val))))
2251 gimple_call_set_arg (stmt, i, unshare_expr (val));
2252 changed = true;
2256 return changed;
2259 case GIMPLE_ASSIGN:
2261 tree lhs = gimple_assign_lhs (stmt);
2262 tree val;
2264 /* If we have a load that turned out to be constant, replace it,
2265 as we cannot propagate into all uses in all cases. */
2266 if (gimple_assign_single_p (stmt)
2267 && TREE_CODE (lhs) == SSA_NAME
2268 && (val = get_constant_value (lhs)))
2270 tree rhs = unshare_expr (val);
2271 if (!useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (rhs)))
2272 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (lhs), rhs);
2273 gimple_assign_set_rhs_from_tree (gsi, rhs);
2274 return true;
2277 return false;
2280 default:
2281 return false;
2285 /* Visit the assignment statement STMT. Set the value of its LHS to the
2286 value computed by the RHS and store LHS in *OUTPUT_P. If STMT
2287 creates virtual definitions, set the value of each new name to that
2288 of the RHS (if we can derive a constant out of the RHS).
2289 Value-returning call statements also perform an assignment, and
2290 are handled here. */
2292 static enum ssa_prop_result
2293 visit_assignment (gimple *stmt, tree *output_p)
2295 ccp_prop_value_t val;
2296 enum ssa_prop_result retval = SSA_PROP_NOT_INTERESTING;
2298 tree lhs = gimple_get_lhs (stmt);
2299 if (TREE_CODE (lhs) == SSA_NAME)
2301 /* Evaluate the statement, which could be
2302 either a GIMPLE_ASSIGN or a GIMPLE_CALL. */
2303 val = evaluate_stmt (stmt);
2305 /* If STMT is an assignment to an SSA_NAME, we only have one
2306 value to set. */
2307 if (set_lattice_value (lhs, &val))
2309 *output_p = lhs;
2310 if (val.lattice_val == VARYING)
2311 retval = SSA_PROP_VARYING;
2312 else
2313 retval = SSA_PROP_INTERESTING;
2317 return retval;
2321 /* Visit the conditional statement STMT. Return SSA_PROP_INTERESTING
2322 if it can determine which edge will be taken. Otherwise, return
2323 SSA_PROP_VARYING. */
2325 static enum ssa_prop_result
2326 visit_cond_stmt (gimple *stmt, edge *taken_edge_p)
2328 ccp_prop_value_t val;
2329 basic_block block;
2331 block = gimple_bb (stmt);
2332 val = evaluate_stmt (stmt);
2333 if (val.lattice_val != CONSTANT
2334 || val.mask != 0)
2335 return SSA_PROP_VARYING;
2337 /* Find which edge out of the conditional block will be taken and add it
2338 to the worklist. If no single edge can be determined statically,
2339 return SSA_PROP_VARYING to feed all the outgoing edges to the
2340 propagation engine. */
2341 *taken_edge_p = find_taken_edge (block, val.value);
2342 if (*taken_edge_p)
2343 return SSA_PROP_INTERESTING;
2344 else
2345 return SSA_PROP_VARYING;
2349 /* Evaluate statement STMT. If the statement produces an output value and
2350 its evaluation changes the lattice value of its output, return
2351 SSA_PROP_INTERESTING and set *OUTPUT_P to the SSA_NAME holding the
2352 output value.
2354 If STMT is a conditional branch and we can determine its truth
2355 value, set *TAKEN_EDGE_P accordingly. If STMT produces a varying
2356 value, return SSA_PROP_VARYING. */
2358 static enum ssa_prop_result
2359 ccp_visit_stmt (gimple *stmt, edge *taken_edge_p, tree *output_p)
2361 tree def;
2362 ssa_op_iter iter;
2364 if (dump_file && (dump_flags & TDF_DETAILS))
2366 fprintf (dump_file, "\nVisiting statement:\n");
2367 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
2370 switch (gimple_code (stmt))
2372 case GIMPLE_ASSIGN:
2373 /* If the statement is an assignment that produces a single
2374 output value, evaluate its RHS to see if the lattice value of
2375 its output has changed. */
2376 return visit_assignment (stmt, output_p);
2378 case GIMPLE_CALL:
2379 /* A value-returning call also performs an assignment. */
2380 if (gimple_call_lhs (stmt) != NULL_TREE)
2381 return visit_assignment (stmt, output_p);
2382 break;
2384 case GIMPLE_COND:
2385 case GIMPLE_SWITCH:
2386 /* If STMT is a conditional branch, see if we can determine
2387 which branch will be taken. */
2388 /* FIXME. It appears that we should be able to optimize
2389 computed GOTOs here as well. */
2390 return visit_cond_stmt (stmt, taken_edge_p);
2392 default:
2393 break;
2396 /* Any other kind of statement is not interesting for constant
2397 propagation and, therefore, not worth simulating. */
2398 if (dump_file && (dump_flags & TDF_DETAILS))
2399 fprintf (dump_file, "No interesting values produced. Marked VARYING.\n");
2401 /* Definitions made by statements other than assignments to
2402 SSA_NAMEs represent unknown modifications to their outputs.
2403 Mark them VARYING. */
2404 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
2405 set_value_varying (def);
2407 return SSA_PROP_VARYING;
2411 /* Main entry point for SSA Conditional Constant Propagation. If NONZERO_P,
2412 record nonzero bits. */
2414 static unsigned int
2415 do_ssa_ccp (bool nonzero_p)
2417 unsigned int todo = 0;
2418 calculate_dominance_info (CDI_DOMINATORS);
2420 ccp_initialize ();
2421 ssa_propagate (ccp_visit_stmt, ccp_visit_phi_node);
2422 if (ccp_finalize (nonzero_p || flag_ipa_bit_cp))
2424 todo = (TODO_cleanup_cfg | TODO_update_ssa);
2426 /* ccp_finalize does not preserve loop-closed ssa. */
2427 loops_state_clear (LOOP_CLOSED_SSA);
2430 free_dominance_info (CDI_DOMINATORS);
2431 return todo;
2435 namespace {
2437 const pass_data pass_data_ccp =
2439 GIMPLE_PASS, /* type */
2440 "ccp", /* name */
2441 OPTGROUP_NONE, /* optinfo_flags */
2442 TV_TREE_CCP, /* tv_id */
2443 ( PROP_cfg | PROP_ssa ), /* properties_required */
2444 0, /* properties_provided */
2445 0, /* properties_destroyed */
2446 0, /* todo_flags_start */
2447 TODO_update_address_taken, /* todo_flags_finish */
2450 class pass_ccp : public gimple_opt_pass
2452 public:
2453 pass_ccp (gcc::context *ctxt)
2454 : gimple_opt_pass (pass_data_ccp, ctxt), nonzero_p (false)
2457 /* opt_pass methods: */
2458 opt_pass * clone () { return new pass_ccp (m_ctxt); }
2459 void set_pass_param (unsigned int n, bool param)
2461 gcc_assert (n == 0);
2462 nonzero_p = param;
2464 virtual bool gate (function *) { return flag_tree_ccp != 0; }
2465 virtual unsigned int execute (function *) { return do_ssa_ccp (nonzero_p); }
2467 private:
2468 /* Determines whether the pass instance records nonzero bits. */
2469 bool nonzero_p;
2470 }; // class pass_ccp
2472 } // anon namespace
2474 gimple_opt_pass *
2475 make_pass_ccp (gcc::context *ctxt)
2477 return new pass_ccp (ctxt);
2482 /* Try to optimize out __builtin_stack_restore. Optimize it out
2483 if there is another __builtin_stack_restore in the same basic
2484 block and no calls or ASM_EXPRs are in between, or if this block's
2485 only outgoing edge is to EXIT_BLOCK and there are no calls or
2486 ASM_EXPRs after this __builtin_stack_restore. */
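/* For illustration (invented SSA names): in

     p_1 = __builtin_stack_save ();
     __builtin_stack_restore (p_1);

   with no call or asm in between, the restore is deleted, and if p_1
   has no other uses the save is replaced by a null assignment as
   well.  */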
2488 static tree
2489 optimize_stack_restore (gimple_stmt_iterator i)
2491 tree callee;
2492 gimple *stmt;
2494 basic_block bb = gsi_bb (i);
2495 gimple *call = gsi_stmt (i);
2497 if (gimple_code (call) != GIMPLE_CALL
2498 || gimple_call_num_args (call) != 1
2499 || TREE_CODE (gimple_call_arg (call, 0)) != SSA_NAME
2500 || !POINTER_TYPE_P (TREE_TYPE (gimple_call_arg (call, 0))))
2501 return NULL_TREE;
2503 for (gsi_next (&i); !gsi_end_p (i); gsi_next (&i))
2505 stmt = gsi_stmt (i);
2506 if (gimple_code (stmt) == GIMPLE_ASM)
2507 return NULL_TREE;
2508 if (gimple_code (stmt) != GIMPLE_CALL)
2509 continue;
2511 callee = gimple_call_fndecl (stmt);
2512 if (!callee
2513 || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL
2514 /* All regular builtins are ok, just obviously not alloca. */
2515 || DECL_FUNCTION_CODE (callee) == BUILT_IN_ALLOCA
2516 || DECL_FUNCTION_CODE (callee) == BUILT_IN_ALLOCA_WITH_ALIGN)
2517 return NULL_TREE;
2519 if (DECL_FUNCTION_CODE (callee) == BUILT_IN_STACK_RESTORE)
2520 goto second_stack_restore;
2523 if (!gsi_end_p (i))
2524 return NULL_TREE;
2526 /* Allow a single successor edge to the exit block, or no successors. */
2527 switch (EDGE_COUNT (bb->succs))
2529 case 0:
2530 break;
2531 case 1:
2532 if (single_succ_edge (bb)->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
2533 return NULL_TREE;
2534 break;
2535 default:
2536 return NULL_TREE;
2538 second_stack_restore:
2540 /* If there's exactly one use, then zap the call to __builtin_stack_save.
2541 If there are multiple uses, then the last one should remove the call.
2542 In any case, whether the call to __builtin_stack_save can be removed
2543 or not is irrelevant to removing the call to __builtin_stack_restore. */
2544 if (has_single_use (gimple_call_arg (call, 0)))
2546 gimple *stack_save = SSA_NAME_DEF_STMT (gimple_call_arg (call, 0));
2547 if (is_gimple_call (stack_save))
2549 callee = gimple_call_fndecl (stack_save);
2550 if (callee
2551 && DECL_BUILT_IN_CLASS (callee) == BUILT_IN_NORMAL
2552 && DECL_FUNCTION_CODE (callee) == BUILT_IN_STACK_SAVE)
2554 gimple_stmt_iterator stack_save_gsi;
2555 tree rhs;
2557 stack_save_gsi = gsi_for_stmt (stack_save);
2558 rhs = build_int_cst (TREE_TYPE (gimple_call_arg (call, 0)), 0);
2559 update_call_from_tree (&stack_save_gsi, rhs);
2564 /* No effect, so the statement will be deleted. */
2565 return integer_zero_node;
2568 /* If the va_list type is a simple pointer and nothing special is needed,
2569 optimize __builtin_va_start (&ap, 0) into ap = __builtin_next_arg (0),
2570 remove __builtin_va_end (&ap) as a no-op, and turn __builtin_va_copy
2571 into a simple pointer assignment. */
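/* Concretely, on a target whose va_list is a plain char/void pointer:

     __builtin_va_start (&ap, 0)  ->  ap = __builtin_next_arg (0)
     __builtin_va_copy (&d, s)    ->  d = s
     __builtin_va_end (&ap)       ->  (deleted)  */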
2573 static tree
2574 optimize_stdarg_builtin (gimple *call)
2576 tree callee, lhs, rhs, cfun_va_list;
2577 bool va_list_simple_ptr;
2578 location_t loc = gimple_location (call);
2580 if (gimple_code (call) != GIMPLE_CALL)
2581 return NULL_TREE;
2583 callee = gimple_call_fndecl (call);
2585 cfun_va_list = targetm.fn_abi_va_list (callee);
2586 va_list_simple_ptr = POINTER_TYPE_P (cfun_va_list)
2587 && (TREE_TYPE (cfun_va_list) == void_type_node
2588 || TREE_TYPE (cfun_va_list) == char_type_node);
2590 switch (DECL_FUNCTION_CODE (callee))
2592 case BUILT_IN_VA_START:
2593 if (!va_list_simple_ptr
2594 || targetm.expand_builtin_va_start != NULL
2595 || !builtin_decl_explicit_p (BUILT_IN_NEXT_ARG))
2596 return NULL_TREE;
2598 if (gimple_call_num_args (call) != 2)
2599 return NULL_TREE;
2601 lhs = gimple_call_arg (call, 0);
2602 if (!POINTER_TYPE_P (TREE_TYPE (lhs))
2603 || TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (lhs)))
2604 != TYPE_MAIN_VARIANT (cfun_va_list))
2605 return NULL_TREE;
2607 lhs = build_fold_indirect_ref_loc (loc, lhs);
2608 rhs = build_call_expr_loc (loc, builtin_decl_explicit (BUILT_IN_NEXT_ARG),
2609 1, integer_zero_node);
2610 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
2611 return build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, rhs);
2613 case BUILT_IN_VA_COPY:
2614 if (!va_list_simple_ptr)
2615 return NULL_TREE;
2617 if (gimple_call_num_args (call) != 2)
2618 return NULL_TREE;
2620 lhs = gimple_call_arg (call, 0);
2621 if (!POINTER_TYPE_P (TREE_TYPE (lhs))
2622 || TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (lhs)))
2623 != TYPE_MAIN_VARIANT (cfun_va_list))
2624 return NULL_TREE;
2626 lhs = build_fold_indirect_ref_loc (loc, lhs);
2627 rhs = gimple_call_arg (call, 1);
2628 if (TYPE_MAIN_VARIANT (TREE_TYPE (rhs))
2629 != TYPE_MAIN_VARIANT (cfun_va_list))
2630 return NULL_TREE;
2632 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
2633 return build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, rhs);
2635 case BUILT_IN_VA_END:
2636 /* No effect, so the statement will be deleted. */
2637 return integer_zero_node;
2639 default:
2640 gcc_unreachable ();
2644 /* Attempt to make the block of __builtin_unreachable I unreachable by changing
2645 the incoming jumps. Return true if at least one jump was changed. */
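/* Sketch (invented block numbers): for

     if (x_1 != 0) goto <bb 3>; else goto <bb 4>;
     ...
     <bb 3>: __builtin_unreachable ();

   the condition is rewritten to "if (0)" so the edge into bb 3 is
   never taken; bb 3 then becomes unreachable and a later CFG cleanup
   removes it.  */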
2647 static bool
2648 optimize_unreachable (gimple_stmt_iterator i)
2650 basic_block bb = gsi_bb (i);
2651 gimple_stmt_iterator gsi;
2652 gimple *stmt;
2653 edge_iterator ei;
2654 edge e;
2655 bool ret;
2657 if (flag_sanitize & SANITIZE_UNREACHABLE)
2658 return false;
2660 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2662 stmt = gsi_stmt (gsi);
2664 if (is_gimple_debug (stmt))
2665 continue;
2667 if (glabel *label_stmt = dyn_cast <glabel *> (stmt))
2669 /* Verify we do not need to preserve the label. */
2670 if (FORCED_LABEL (gimple_label_label (label_stmt)))
2671 return false;
2673 continue;
2676 /* Only handle the case that __builtin_unreachable is the first statement
2677 in the block. We rely on DCE to remove stmts without side-effects
2678 before __builtin_unreachable. */
2679 if (gsi_stmt (gsi) != gsi_stmt (i))
2680 return false;
2683 ret = false;
2684 FOR_EACH_EDGE (e, ei, bb->preds)
2686 gsi = gsi_last_bb (e->src);
2687 if (gsi_end_p (gsi))
2688 continue;
2690 stmt = gsi_stmt (gsi);
2691 if (gcond *cond_stmt = dyn_cast <gcond *> (stmt))
2693 if (e->flags & EDGE_TRUE_VALUE)
2694 gimple_cond_make_false (cond_stmt);
2695 else if (e->flags & EDGE_FALSE_VALUE)
2696 gimple_cond_make_true (cond_stmt);
2697 else
2698 gcc_unreachable ();
2699 update_stmt (cond_stmt);
2701 else
2703 /* TODO: handle other cases, e.g. switch statements. */
2704 continue;
2707 ret = true;
2710 return ret;
2713 /* Optimize
2714 mask_2 = 1 << cnt_1;
2715 _4 = __atomic_fetch_or_* (ptr_6, mask_2, _3);
2716 _5 = _4 & mask_2;
2718 _4 = ATOMIC_BIT_TEST_AND_SET (ptr_6, cnt_1, 0, _3);
2719 _5 = _4;
2720 If _5 is only used in _5 != 0 or _5 == 0 comparisons, 1
2721 is passed instead of 0, and the builtin just returns a zero
2722 or 1 value instead of the actual bit.
2723 Similarly for __sync_fetch_and_or_* (without the ", _3" part
2724 in there), and/or if mask_2 is a power of 2 constant.
2725 Similarly for xor instead of or, use ATOMIC_BIT_TEST_AND_COMPLEMENT
2726 in that case. And similarly for and instead of or, except that
2727 the second argument to the builtin needs to be one's complement
2728 of the mask instead of mask. */
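/* A sketch of the "and" case (invented SSA names):

     mask_2 = 1 << cnt_1;
     mask_3 = ~mask_2;
     _4 = __atomic_fetch_and_* (ptr_6, mask_3, _5);
     _6 = _4 & mask_2;

   becomes

     _4 = ATOMIC_BIT_TEST_AND_RESET (ptr_6, cnt_1, 0, _5);
     _6 = _4;  */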
2730 static void
2731 optimize_atomic_bit_test_and (gimple_stmt_iterator *gsip,
2732 enum internal_fn fn, bool has_model_arg,
2733 bool after)
2735 gimple *call = gsi_stmt (*gsip);
2736 tree lhs = gimple_call_lhs (call);
2737 use_operand_p use_p;
2738 gimple *use_stmt;
2739 tree mask, bit;
2740 optab optab;
2742 if (!flag_inline_atomics
2743 || optimize_debug
2744 || !gimple_call_builtin_p (call, BUILT_IN_NORMAL)
2745 || !lhs
2746 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs)
2747 || !single_imm_use (lhs, &use_p, &use_stmt)
2748 || !is_gimple_assign (use_stmt)
2749 || gimple_assign_rhs_code (use_stmt) != BIT_AND_EXPR
2750 || !gimple_vdef (call))
2751 return;
2753 switch (fn)
2755 case IFN_ATOMIC_BIT_TEST_AND_SET:
2756 optab = atomic_bit_test_and_set_optab;
2757 break;
2758 case IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT:
2759 optab = atomic_bit_test_and_complement_optab;
2760 break;
2761 case IFN_ATOMIC_BIT_TEST_AND_RESET:
2762 optab = atomic_bit_test_and_reset_optab;
2763 break;
2764 default:
2765 return;
2768 if (optab_handler (optab, TYPE_MODE (TREE_TYPE (lhs))) == CODE_FOR_nothing)
2769 return;
2771 mask = gimple_call_arg (call, 1);
2772 tree use_lhs = gimple_assign_lhs (use_stmt);
2773 if (!use_lhs)
2774 return;
2776 if (TREE_CODE (mask) == INTEGER_CST)
2778 if (fn == IFN_ATOMIC_BIT_TEST_AND_RESET)
2779 mask = const_unop (BIT_NOT_EXPR, TREE_TYPE (mask), mask);
2780 mask = fold_convert (TREE_TYPE (lhs), mask);
2781 int ibit = tree_log2 (mask);
2782 if (ibit < 0)
2783 return;
2784 bit = build_int_cst (TREE_TYPE (lhs), ibit);
2786 else if (TREE_CODE (mask) == SSA_NAME)
2788 gimple *g = SSA_NAME_DEF_STMT (mask);
2789 if (fn == IFN_ATOMIC_BIT_TEST_AND_RESET)
2791 if (!is_gimple_assign (g)
2792 || gimple_assign_rhs_code (g) != BIT_NOT_EXPR)
2793 return;
2794 mask = gimple_assign_rhs1 (g);
2795 if (TREE_CODE (mask) != SSA_NAME)
2796 return;
2797 g = SSA_NAME_DEF_STMT (mask);
2799 if (!is_gimple_assign (g)
2800 || gimple_assign_rhs_code (g) != LSHIFT_EXPR
2801 || !integer_onep (gimple_assign_rhs1 (g)))
2802 return;
2803 bit = gimple_assign_rhs2 (g);
2805 else
2806 return;
2808 if (gimple_assign_rhs1 (use_stmt) == lhs)
2810 if (!operand_equal_p (gimple_assign_rhs2 (use_stmt), mask, 0))
2811 return;
2813 else if (gimple_assign_rhs2 (use_stmt) != lhs
2814 || !operand_equal_p (gimple_assign_rhs1 (use_stmt), mask, 0))
2815 return;
2817 bool use_bool = true;
2818 bool has_debug_uses = false;
2819 imm_use_iterator iter;
2820 gimple *g;
2822 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (use_lhs))
2823 use_bool = false;
2824 FOR_EACH_IMM_USE_STMT (g, iter, use_lhs)
2826 enum tree_code code = ERROR_MARK;
2827 tree op0 = NULL_TREE, op1 = NULL_TREE;
2828 if (is_gimple_debug (g))
2830 has_debug_uses = true;
2831 continue;
2833 else if (is_gimple_assign (g))
2834 switch (gimple_assign_rhs_code (g))
2836 case COND_EXPR:
2837 op1 = gimple_assign_rhs1 (g);
2838 code = TREE_CODE (op1);
2839 op0 = TREE_OPERAND (op1, 0);
2840 op1 = TREE_OPERAND (op1, 1);
2841 break;
2842 case EQ_EXPR:
2843 case NE_EXPR:
2844 code = gimple_assign_rhs_code (g);
2845 op0 = gimple_assign_rhs1 (g);
2846 op1 = gimple_assign_rhs2 (g);
2847 break;
2848 default:
2849 break;
2851 else if (gimple_code (g) == GIMPLE_COND)
2853 code = gimple_cond_code (g);
2854 op0 = gimple_cond_lhs (g);
2855 op1 = gimple_cond_rhs (g);
2858 if ((code == EQ_EXPR || code == NE_EXPR)
2859 && op0 == use_lhs
2860 && integer_zerop (op1))
2862 use_operand_p use_p;
2863 int n = 0;
2864 FOR_EACH_IMM_USE_ON_STMT (use_p, iter)
2865 n++;
2866 if (n == 1)
2867 continue;
2870 use_bool = false;
2871 BREAK_FROM_IMM_USE_STMT (iter);
2874 tree new_lhs = make_ssa_name (TREE_TYPE (lhs));
2875 tree flag = build_int_cst (TREE_TYPE (lhs), use_bool);
2876 if (has_model_arg)
2877 g = gimple_build_call_internal (fn, 4, gimple_call_arg (call, 0),
2878 bit, flag, gimple_call_arg (call, 2));
2879 else
2880 g = gimple_build_call_internal (fn, 3, gimple_call_arg (call, 0),
2881 bit, flag);
2882 gimple_call_set_lhs (g, new_lhs);
2883 gimple_set_location (g, gimple_location (call));
2884 gimple_set_vuse (g, gimple_vuse (call));
2885 gimple_set_vdef (g, gimple_vdef (call));
2886 SSA_NAME_DEF_STMT (gimple_vdef (call)) = g;
2887 gimple_stmt_iterator gsi = *gsip;
2888 gsi_insert_after (&gsi, g, GSI_NEW_STMT);
2889 if (after)
2891 /* The internal function returns the value of the specified bit
2892 before the atomic operation. If we are interested in the value
2893 of the specified bit after the atomic operation (this makes sense only
2894 for xor; otherwise the bit content is known at compile time),
2895 we need to invert the bit. */
2896 g = gimple_build_assign (make_ssa_name (TREE_TYPE (lhs)),
2897 BIT_XOR_EXPR, new_lhs,
2898 use_bool ? build_int_cst (TREE_TYPE (lhs), 1)
2899 : mask);
2900 new_lhs = gimple_assign_lhs (g);
2901 gsi_insert_after (&gsi, g, GSI_NEW_STMT);
2903 if (use_bool && has_debug_uses)
2905 tree temp = make_node (DEBUG_EXPR_DECL);
2906 DECL_ARTIFICIAL (temp) = 1;
2907 TREE_TYPE (temp) = TREE_TYPE (lhs);
2908 DECL_MODE (temp) = TYPE_MODE (TREE_TYPE (lhs));
2909 tree t = build2 (LSHIFT_EXPR, TREE_TYPE (lhs), new_lhs, bit);
2910 g = gimple_build_debug_bind (temp, t, g);
2911 gsi_insert_after (&gsi, g, GSI_NEW_STMT);
2912 FOR_EACH_IMM_USE_STMT (g, iter, use_lhs)
2913 if (is_gimple_debug (g))
2915 use_operand_p use_p;
2916 FOR_EACH_IMM_USE_ON_STMT (use_p, iter)
2917 SET_USE (use_p, temp);
2918 update_stmt (g);
2921 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_lhs)
2922 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (use_lhs);
2923 replace_uses_by (use_lhs, new_lhs);
2924 gsi = gsi_for_stmt (use_stmt);
2925 gsi_remove (&gsi, true);
2926 release_defs (use_stmt);
2927 gsi_remove (gsip, true);
2928 release_ssa_name (lhs);
2931 /* A simple pass that attempts to fold all builtin functions. This pass
2932 is run after we've propagated as many constants as we can. */
2934 namespace {
2936 const pass_data pass_data_fold_builtins =
2938 GIMPLE_PASS, /* type */
2939 "fab", /* name */
2940 OPTGROUP_NONE, /* optinfo_flags */
2941 TV_NONE, /* tv_id */
2942 ( PROP_cfg | PROP_ssa ), /* properties_required */
2943 0, /* properties_provided */
2944 0, /* properties_destroyed */
2945 0, /* todo_flags_start */
2946 TODO_update_ssa, /* todo_flags_finish */
2949 class pass_fold_builtins : public gimple_opt_pass
2951 public:
2952 pass_fold_builtins (gcc::context *ctxt)
2953 : gimple_opt_pass (pass_data_fold_builtins, ctxt)
2956 /* opt_pass methods: */
2957 opt_pass * clone () { return new pass_fold_builtins (m_ctxt); }
2958 virtual unsigned int execute (function *);
2960 }; // class pass_fold_builtins
2962 unsigned int
2963 pass_fold_builtins::execute (function *fun)
2965 bool cfg_changed = false;
2966 basic_block bb;
2967 unsigned int todoflags = 0;
2969 FOR_EACH_BB_FN (bb, fun)
2971 gimple_stmt_iterator i;
2972 for (i = gsi_start_bb (bb); !gsi_end_p (i); )
2974 gimple *stmt, *old_stmt;
2975 tree callee;
2976 enum built_in_function fcode;
2978 stmt = gsi_stmt (i);
2980 if (gimple_code (stmt) != GIMPLE_CALL)
2982 /* Remove all *ssaname_N ={v} {CLOBBER}; stmts; after the
2983 last GIMPLE DSE run they are no longer needed and might
2984 unnecessarily keep the SSA_NAMEs live. */
2985 if (gimple_clobber_p (stmt))
2987 tree lhs = gimple_assign_lhs (stmt);
2988 if (TREE_CODE (lhs) == MEM_REF
2989 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
2991 unlink_stmt_vdef (stmt);
2992 gsi_remove (&i, true);
2993 release_defs (stmt);
2994 continue;
2997 gsi_next (&i);
2998 continue;
3001 callee = gimple_call_fndecl (stmt);
3002 if (!callee || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL)
3004 gsi_next (&i);
3005 continue;
3008 fcode = DECL_FUNCTION_CODE (callee);
3009 if (fold_stmt (&i))
3011 else
3013 tree result = NULL_TREE;
3014 switch (DECL_FUNCTION_CODE (callee))
3016 case BUILT_IN_CONSTANT_P:
3017 /* Resolve __builtin_constant_p. If it hasn't been
3018 folded to integer_one_node by now, it's fairly
3019 certain that the value simply isn't constant. */
3020 result = integer_zero_node;
3021 break;
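/* E.g. a surviving __builtin_constant_p (x_1) whose operand never
   became constant during CCP folds to 0 here.  */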
3023 case BUILT_IN_ASSUME_ALIGNED:
3024 /* Remove __builtin_assume_aligned. */
3025 result = gimple_call_arg (stmt, 0);
3026 break;
3028 case BUILT_IN_STACK_RESTORE:
3029 result = optimize_stack_restore (i);
3030 if (result)
3031 break;
3032 gsi_next (&i);
3033 continue;
3035 case BUILT_IN_UNREACHABLE:
3036 if (optimize_unreachable (i))
3037 cfg_changed = true;
3038 break;
3040 case BUILT_IN_ATOMIC_FETCH_OR_1:
3041 case BUILT_IN_ATOMIC_FETCH_OR_2:
3042 case BUILT_IN_ATOMIC_FETCH_OR_4:
3043 case BUILT_IN_ATOMIC_FETCH_OR_8:
3044 case BUILT_IN_ATOMIC_FETCH_OR_16:
3045 optimize_atomic_bit_test_and (&i,
3046 IFN_ATOMIC_BIT_TEST_AND_SET,
3047 true, false);
3048 break;
3049 case BUILT_IN_SYNC_FETCH_AND_OR_1:
3050 case BUILT_IN_SYNC_FETCH_AND_OR_2:
3051 case BUILT_IN_SYNC_FETCH_AND_OR_4:
3052 case BUILT_IN_SYNC_FETCH_AND_OR_8:
3053 case BUILT_IN_SYNC_FETCH_AND_OR_16:
3054 optimize_atomic_bit_test_and (&i,
3055 IFN_ATOMIC_BIT_TEST_AND_SET,
3056 false, false);
3057 break;
3059 case BUILT_IN_ATOMIC_FETCH_XOR_1:
3060 case BUILT_IN_ATOMIC_FETCH_XOR_2:
3061 case BUILT_IN_ATOMIC_FETCH_XOR_4:
3062 case BUILT_IN_ATOMIC_FETCH_XOR_8:
3063 case BUILT_IN_ATOMIC_FETCH_XOR_16:
3064 optimize_atomic_bit_test_and
3065 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, true, false);
3066 break;
3067 case BUILT_IN_SYNC_FETCH_AND_XOR_1:
3068 case BUILT_IN_SYNC_FETCH_AND_XOR_2:
3069 case BUILT_IN_SYNC_FETCH_AND_XOR_4:
3070 case BUILT_IN_SYNC_FETCH_AND_XOR_8:
3071 case BUILT_IN_SYNC_FETCH_AND_XOR_16:
3072 optimize_atomic_bit_test_and
3073 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, false, false);
3074 break;
3076 case BUILT_IN_ATOMIC_XOR_FETCH_1:
3077 case BUILT_IN_ATOMIC_XOR_FETCH_2:
3078 case BUILT_IN_ATOMIC_XOR_FETCH_4:
3079 case BUILT_IN_ATOMIC_XOR_FETCH_8:
3080 case BUILT_IN_ATOMIC_XOR_FETCH_16:
3081 optimize_atomic_bit_test_and
3082 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, true, true);
3083 break;
3084 case BUILT_IN_SYNC_XOR_AND_FETCH_1:
3085 case BUILT_IN_SYNC_XOR_AND_FETCH_2:
3086 case BUILT_IN_SYNC_XOR_AND_FETCH_4:
3087 case BUILT_IN_SYNC_XOR_AND_FETCH_8:
3088 case BUILT_IN_SYNC_XOR_AND_FETCH_16:
3089 optimize_atomic_bit_test_and
3090 (&i, IFN_ATOMIC_BIT_TEST_AND_COMPLEMENT, false, true);
3091 break;
3093 case BUILT_IN_ATOMIC_FETCH_AND_1:
3094 case BUILT_IN_ATOMIC_FETCH_AND_2:
3095 case BUILT_IN_ATOMIC_FETCH_AND_4:
3096 case BUILT_IN_ATOMIC_FETCH_AND_8:
3097 case BUILT_IN_ATOMIC_FETCH_AND_16:
3098 optimize_atomic_bit_test_and (&i,
3099 IFN_ATOMIC_BIT_TEST_AND_RESET,
3100 true, false);
3101 break;
3102 case BUILT_IN_SYNC_FETCH_AND_AND_1:
3103 case BUILT_IN_SYNC_FETCH_AND_AND_2:
3104 case BUILT_IN_SYNC_FETCH_AND_AND_4:
3105 case BUILT_IN_SYNC_FETCH_AND_AND_8:
3106 case BUILT_IN_SYNC_FETCH_AND_AND_16:
3107 optimize_atomic_bit_test_and (&i,
3108 IFN_ATOMIC_BIT_TEST_AND_RESET,
3109 false, false);
3110 break;
3112 case BUILT_IN_VA_START:
3113 case BUILT_IN_VA_END:
3114 case BUILT_IN_VA_COPY:
3115 /* These shouldn't be folded before pass_stdarg. */
3116 result = optimize_stdarg_builtin (stmt);
3117 if (result)
3118 break;
3119 /* FALLTHRU */
3121 default:;
3124 if (!result)
3126 gsi_next (&i);
3127 continue;
3130 if (!update_call_from_tree (&i, result))
3131 gimplify_and_update_call_from_tree (&i, result);
3134 todoflags |= TODO_update_address_taken;
3136 if (dump_file && (dump_flags & TDF_DETAILS))
3138 fprintf (dump_file, "Simplified\n ");
3139 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
3142 old_stmt = stmt;
3143 stmt = gsi_stmt (i);
3144 update_stmt (stmt);
3146 if (maybe_clean_or_replace_eh_stmt (old_stmt, stmt)
3147 && gimple_purge_dead_eh_edges (bb))
3148 cfg_changed = true;
3150 if (dump_file && (dump_flags & TDF_DETAILS))
3152 fprintf (dump_file, "to\n ");
3153 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
3154 fprintf (dump_file, "\n");
3157 /* Retry the same statement if it changed into another
3158 builtin; there might be new opportunities now. */
3159 if (gimple_code (stmt) != GIMPLE_CALL)
3161 gsi_next (&i);
3162 continue;
3164 callee = gimple_call_fndecl (stmt);
3165 if (!callee
3166 || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL
3167 || DECL_FUNCTION_CODE (callee) == fcode)
3168 gsi_next (&i);
3172 /* Delete unreachable blocks. */
3173 if (cfg_changed)
3174 todoflags |= TODO_cleanup_cfg;
3176 return todoflags;
3179 } // anon namespace
3181 gimple_opt_pass *
3182 make_pass_fold_builtins (gcc::context *ctxt)
3184 return new pass_fold_builtins (ctxt);