Merge from gomp branch:
[official-gcc.git] / gcc / tree-ssa-ccp.c
blob673104556905054712dd1771c5727597ef7be83c
1 /* Conditional constant propagation pass for the GNU compiler.
2 Copyright (C) 2000, 2001, 2002, 2003, 2004, 2005
3 Free Software Foundation, Inc.
4 Adapted from original RTL SSA-CCP by Daniel Berlin <dberlin@dberlin.org>
5 Adapted to GIMPLE trees by Diego Novillo <dnovillo@redhat.com>
7 This file is part of GCC.
9 GCC is free software; you can redistribute it and/or modify it
10 under the terms of the GNU General Public License as published by the
11 Free Software Foundation; either version 2, or (at your option) any
12 later version.
14 GCC is distributed in the hope that it will be useful, but WITHOUT
15 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
16 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 for more details.
19 You should have received a copy of the GNU General Public License
20 along with GCC; see the file COPYING. If not, write to the Free
21 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
22 02110-1301, USA. */
24 /* Conditional constant propagation (CCP) is based on the SSA
25 propagation engine (tree-ssa-propagate.c). Constant assignments of
26 the form VAR = CST are propagated from the assignments into uses of
27 VAR, which in turn may generate new constants. The simulation uses
28 a four level lattice to keep track of constant values associated
29 with SSA names. Given an SSA name V_i, it may take one of the
30 following values:
32 UNINITIALIZED -> This is the default starting value. V_i
33 has not been processed yet.
35 UNDEFINED -> V_i is a local variable whose definition
36 has not been processed yet. Therefore we
37 don't yet know if its value is a constant
38 or not.
40 CONSTANT -> V_i has been found to hold a constant
41 value C.
43 VARYING -> V_i cannot take a constant value, or if it
44 does, it is not possible to determine it
45 at compile time.
47 The core of SSA-CCP is in ccp_visit_stmt and ccp_visit_phi_node:
49 1- In ccp_visit_stmt, we are interested in assignments whose RHS
50 evaluates into a constant and conditional jumps whose predicate
51 evaluates into a boolean true or false. When an assignment of
52 the form V_i = CONST is found, V_i's lattice value is set to
53 CONSTANT and CONST is associated with it. This causes the
54 propagation engine to add all the SSA edges coming out the
55 assignment into the worklists, so that statements that use V_i
56 can be visited.
58 If the statement is a conditional with a constant predicate, we
59 mark the outgoing edges as executable or not executable
60 depending on the predicate's value. This is then used when
61 visiting PHI nodes to know when a PHI argument can be ignored.
64 2- In ccp_visit_phi_node, if all the PHI arguments evaluate to the
65 same constant C, then the LHS of the PHI is set to C. This
66 evaluation is known as the "meet operation". Since one of the
67 goals of this evaluation is to optimistically return constant
68 values as often as possible, it uses two main short cuts:
70 - If an argument is flowing in through a non-executable edge, it
71 is ignored. This is useful in cases like this:
73 if (PRED)
74 a_9 = 3;
75 else
76 a_10 = 100;
77 a_11 = PHI (a_9, a_10)
79 If PRED is known to always evaluate to false, then we can
80 assume that a_11 will always take its value from a_10, meaning
81 that instead of consider it VARYING (a_9 and a_10 have
82 different values), we can consider it CONSTANT 100.
84 - If an argument has an UNDEFINED value, then it does not affect
85 the outcome of the meet operation. If a variable V_i has an
86 UNDEFINED value, it means that either its defining statement
87 hasn't been visited yet or V_i has no defining statement, in
88 which case the original symbol 'V' is being used
89 uninitialized. Since 'V' is a local variable, the compiler
90 may assume any initial value for it.
93 After propagation, every variable V_i that ends up with a lattice
94 value of CONSTANT will have the associated constant value in the
95 array CONST_VAL[i].VALUE. That is fed into substitute_and_fold for
96 final substitution and folding.
99 Constant propagation in stores and loads (STORE-CCP)
100 ----------------------------------------------------
102 While CCP has all the logic to propagate constants in GIMPLE
103 registers, it is missing the ability to associate constants with
104 stores and loads (i.e., pointer dereferences, structures and
105 global/aliased variables). We don't keep loads and stores in
106 SSA, but we do build a factored use-def web for them (in the
107 virtual operands).
109 For instance, consider the following code fragment:
111 struct A a;
112 const int B = 42;
114 void foo (int i)
116 if (i > 10)
117 a.a = 42;
118 else
120 a.b = 21;
121 a.a = a.b + 21;
124 if (a.a != B)
125 never_executed ();
128 We should be able to deduce that the predicate 'a.a != B' is always
129 false. To achieve this, we associate constant values to the SSA
130 names in the V_MAY_DEF and V_MUST_DEF operands for each store.
131 Additionally, since we also glob partial loads/stores with the base
132 symbol, we also keep track of the memory reference where the
133 constant value was stored (in the MEM_REF field of PROP_VALUE_T).
134 For instance,
136 # a_5 = V_MAY_DEF <a_4>
137 a.a = 2;
139 # VUSE <a_5>
140 x_3 = a.b;
142 In the example above, CCP will associate value '2' with 'a_5', but
143 it would be wrong to replace the load from 'a.b' with '2', because
144 '2' had been stored into a.a.
146 To support STORE-CCP, it is necessary to add a new value to the
147 constant propagation lattice. When evaluating a load for a memory
148 reference we can no longer assume a value of UNDEFINED if we
149 haven't seen a preceding store to the same memory location.
150 Consider, for instance global variables:
152 int A;
154 foo (int i)
156 if (i_3 > 10)
157 A_4 = 3;
158 # A_5 = PHI (A_4, A_2);
160 # VUSE <A_5>
161 A.0_6 = A;
163 return A.0_6;
166 The value of A_2 cannot be assumed to be UNDEFINED, as it may have
167 been defined outside of foo. If we were to assume it UNDEFINED, we
168 would erroneously optimize the above into 'return 3;'. Therefore,
169 when doing STORE-CCP, we introduce a fifth lattice value
170 (UNKNOWN_VAL), which overrides any other value when computing the
171 meet operation in PHI nodes.
173 Though STORE-CCP is not too expensive, it does have to do more work
174 than regular CCP, so it is only enabled at -O2. Both regular CCP
175 and STORE-CCP use the exact same algorithm. The only distinction
176 is that when doing STORE-CCP, the boolean variable DO_STORE_CCP is
177 set to true. This affects the evaluation of statements and PHI
178 nodes.
180 References:
182 Constant propagation with conditional branches,
183 Wegman and Zadeck, ACM TOPLAS 13(2):181-210.
185 Building an Optimizing Compiler,
186 Robert Morgan, Butterworth-Heinemann, 1998, Section 8.9.
188 Advanced Compiler Design and Implementation,
189 Steven Muchnick, Morgan Kaufmann, 1997, Section 12.6 */
191 #include "config.h"
192 #include "system.h"
193 #include "coretypes.h"
194 #include "tm.h"
195 #include "tree.h"
196 #include "flags.h"
197 #include "rtl.h"
198 #include "tm_p.h"
199 #include "ggc.h"
200 #include "basic-block.h"
201 #include "output.h"
202 #include "expr.h"
203 #include "function.h"
204 #include "diagnostic.h"
205 #include "timevar.h"
206 #include "tree-dump.h"
207 #include "tree-flow.h"
208 #include "tree-pass.h"
209 #include "tree-ssa-propagate.h"
210 #include "langhooks.h"
211 #include "target.h"
214 /* Possible lattice values. */
215 typedef enum
217 UNINITIALIZED = 0,
218 UNDEFINED,
219 UNKNOWN_VAL,
220 CONSTANT,
221 VARYING
222 } ccp_lattice_t;
224 /* Array of propagated constant values. After propagation,
225 CONST_VAL[I].VALUE holds the constant value for SSA_NAME(I). If
226 the constant is held in an SSA name representing a memory store
227 (i.e., a V_MAY_DEF or V_MUST_DEF), CONST_VAL[I].MEM_REF will
228 contain the actual memory reference used to store (i.e., the LHS of
229 the assignment doing the store). */
230 static prop_value_t *const_val;
232 /* True if we are also propagating constants in stores and loads. */
233 static bool do_store_ccp;
235 /* Dump constant propagation value VAL to file OUTF prefixed by PREFIX. */
237 static void
238 dump_lattice_value (FILE *outf, const char *prefix, prop_value_t val)
240 switch (val.lattice_val)
242 case UNINITIALIZED:
243 fprintf (outf, "%sUNINITIALIZED", prefix);
244 break;
245 case UNDEFINED:
246 fprintf (outf, "%sUNDEFINED", prefix);
247 break;
248 case VARYING:
249 fprintf (outf, "%sVARYING", prefix);
250 break;
251 case UNKNOWN_VAL:
252 fprintf (outf, "%sUNKNOWN_VAL", prefix);
253 break;
254 case CONSTANT:
255 fprintf (outf, "%sCONSTANT ", prefix);
256 print_generic_expr (outf, val.value, dump_flags);
257 break;
258 default:
259 gcc_unreachable ();
264 /* Print lattice value VAL to stderr. */
266 void debug_lattice_value (prop_value_t val);
268 void
269 debug_lattice_value (prop_value_t val)
271 dump_lattice_value (stderr, "", val);
272 fprintf (stderr, "\n");
276 /* The regular is_gimple_min_invariant does a shallow test of the object.
277 It assumes that full gimplification has happened, or will happen on the
278 object. For a value coming from DECL_INITIAL, this is not true, so we
279 have to be more strict ourselves. */
281 static bool
282 ccp_decl_initial_min_invariant (tree t)
284 if (!is_gimple_min_invariant (t))
285 return false;
286 if (TREE_CODE (t) == ADDR_EXPR)
288 /* Inline and unroll is_gimple_addressable. */
289 while (1)
291 t = TREE_OPERAND (t, 0);
292 if (is_gimple_id (t))
293 return true;
294 if (!handled_component_p (t))
295 return false;
298 return true;
302 /* Compute a default value for variable VAR and store it in the
303 CONST_VAL array. The following rules are used to get default
304 values:
306 1- Global and static variables that are declared constant are
307 considered CONSTANT.
309 2- Any other value is considered UNDEFINED. This is useful when
310 considering PHI nodes. PHI arguments that are undefined do not
311 change the constant value of the PHI node, which allows for more
312 constants to be propagated.
314 3- If SSA_NAME_VALUE is set and it is a constant, its value is
315 used.
317 4- Variables defined by statements other than assignments and PHI
318 nodes are considered VARYING.
320 5- Variables that are not GIMPLE registers are considered
321 UNKNOWN_VAL, which is really a stronger version of UNDEFINED.
322 It's used to avoid the short circuit evaluation implied by
323 UNDEFINED in ccp_lattice_meet. */
325 static prop_value_t
326 get_default_value (tree var)
328 tree sym = SSA_NAME_VAR (var);
329 prop_value_t val = { UNINITIALIZED, NULL_TREE, NULL_TREE };
331 if (!do_store_ccp && !is_gimple_reg (var))
333 /* Short circuit for regular CCP. We are not interested in any
334 non-register when DO_STORE_CCP is false. */
335 val.lattice_val = VARYING;
337 else if (SSA_NAME_VALUE (var)
338 && is_gimple_min_invariant (SSA_NAME_VALUE (var)))
340 val.lattice_val = CONSTANT;
341 val.value = SSA_NAME_VALUE (var);
343 else if (TREE_STATIC (sym)
344 && TREE_READONLY (sym)
345 && !MTAG_P (sym)
346 && DECL_INITIAL (sym)
347 && ccp_decl_initial_min_invariant (DECL_INITIAL (sym)))
349 /* Globals and static variables declared 'const' take their
350 initial value. */
351 val.lattice_val = CONSTANT;
352 val.value = DECL_INITIAL (sym);
353 val.mem_ref = sym;
355 else
357 tree stmt = SSA_NAME_DEF_STMT (var);
359 if (IS_EMPTY_STMT (stmt))
361 /* Variables defined by an empty statement are those used
362 before being initialized. If VAR is a local variable, we
363 can assume initially that it is UNDEFINED. If we are
364 doing STORE-CCP, function arguments and non-register
365 variables are initially UNKNOWN_VAL, because we cannot
366 discard the value incoming from outside of this function
367 (see ccp_lattice_meet for details). */
368 if (is_gimple_reg (sym) && TREE_CODE (sym) != PARM_DECL)
369 val.lattice_val = UNDEFINED;
370 else if (do_store_ccp)
371 val.lattice_val = UNKNOWN_VAL;
372 else
373 val.lattice_val = VARYING;
375 else if (TREE_CODE (stmt) == MODIFY_EXPR
376 || TREE_CODE (stmt) == PHI_NODE)
378 /* Any other variable defined by an assignment or a PHI node
379 is considered UNDEFINED (or UNKNOWN_VAL if VAR is not a
380 GIMPLE register). */
381 val.lattice_val = is_gimple_reg (sym) ? UNDEFINED : UNKNOWN_VAL;
383 else
385 /* Otherwise, VAR will never take on a constant value. */
386 val.lattice_val = VARYING;
390 return val;
394 /* Get the constant value associated with variable VAR. If
395 MAY_USE_DEFAULT_P is true, call get_default_value on variables that
396 have the lattice value UNINITIALIZED. */
398 static prop_value_t *
399 get_value (tree var, bool may_use_default_p)
401 prop_value_t *val = &const_val[SSA_NAME_VERSION (var)];
402 if (may_use_default_p && val->lattice_val == UNINITIALIZED)
403 *val = get_default_value (var);
405 return val;
409 /* Set the value for variable VAR to NEW_VAL. Return true if the new
410 value is different from VAR's previous value. */
412 static bool
413 set_lattice_value (tree var, prop_value_t new_val)
415 prop_value_t *old_val = get_value (var, false);
417 /* Lattice transitions must always be monotonically increasing in
418 value. We allow two exceptions:
420 1- If *OLD_VAL and NEW_VAL are the same, return false to
421 inform the caller that this was a non-transition.
423 2- If we are doing store-ccp (i.e., DOING_STORE_CCP is true),
424 allow CONSTANT->UNKNOWN_VAL. The UNKNOWN_VAL state is a
425 special type of UNDEFINED state which prevents the short
426 circuit evaluation of PHI arguments (see ccp_visit_phi_node
427 and ccp_lattice_meet). */
428 gcc_assert (old_val->lattice_val <= new_val.lattice_val
429 || (old_val->lattice_val == new_val.lattice_val
430 && old_val->value == new_val.value
431 && old_val->mem_ref == new_val.mem_ref)
432 || (do_store_ccp
433 && old_val->lattice_val == CONSTANT
434 && new_val.lattice_val == UNKNOWN_VAL));
436 if (old_val->lattice_val != new_val.lattice_val)
438 if (dump_file && (dump_flags & TDF_DETAILS))
440 dump_lattice_value (dump_file, "Lattice value changed to ", new_val);
441 fprintf (dump_file, ". %sdding SSA edges to worklist.\n",
442 new_val.lattice_val != UNDEFINED ? "A" : "Not a");
445 *old_val = new_val;
447 /* Transitions UNINITIALIZED -> UNDEFINED are never interesting
448 for propagation purposes. In these cases return false to
449 avoid doing useless work. */
450 return (new_val.lattice_val != UNDEFINED);
453 return false;
457 /* Return the likely CCP lattice value for STMT.
459 If STMT has no operands, then return CONSTANT.
461 Else if any operands of STMT are undefined, then return UNDEFINED.
463 Else if any operands of STMT are constants, then return CONSTANT.
465 Else return VARYING. */
467 static ccp_lattice_t
468 likely_value (tree stmt)
470 bool found_constant;
471 stmt_ann_t ann;
472 tree use;
473 ssa_op_iter iter;
475 ann = stmt_ann (stmt);
477 /* If the statement has volatile operands, it won't fold to a
478 constant value. */
479 if (ann->has_volatile_ops)
480 return VARYING;
482 /* If we are not doing store-ccp, statements with loads
483 and/or stores will never fold into a constant. */
484 if (!do_store_ccp
485 && !ZERO_SSA_OPERANDS (stmt, SSA_OP_ALL_VIRTUALS))
486 return VARYING;
489 /* A CALL_EXPR is assumed to be varying. NOTE: This may be overly
490 conservative, in the presence of const and pure calls. */
491 if (get_call_expr_in (stmt) != NULL_TREE)
492 return VARYING;
494 /* Anything other than assignments and conditional jumps are not
495 interesting for CCP. */
496 if (TREE_CODE (stmt) != MODIFY_EXPR
497 && TREE_CODE (stmt) != COND_EXPR
498 && TREE_CODE (stmt) != SWITCH_EXPR)
499 return VARYING;
501 if (is_gimple_min_invariant (get_rhs (stmt)))
502 return CONSTANT;
504 found_constant = false;
505 FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE|SSA_OP_VUSE)
507 prop_value_t *val = get_value (use, true);
509 if (val->lattice_val == VARYING)
510 return VARYING;
512 if (val->lattice_val == UNKNOWN_VAL)
514 /* UNKNOWN_VAL is invalid when not doing STORE-CCP. */
515 gcc_assert (do_store_ccp);
516 return UNKNOWN_VAL;
519 if (val->lattice_val == CONSTANT)
520 found_constant = true;
523 if (found_constant
524 || ZERO_SSA_OPERANDS (stmt, SSA_OP_USE)
525 || ZERO_SSA_OPERANDS (stmt, SSA_OP_VUSE))
526 return CONSTANT;
528 return UNDEFINED;
532 /* Initialize local data structures for CCP. */
534 static void
535 ccp_initialize (void)
537 basic_block bb;
539 const_val = XNEWVEC (prop_value_t, num_ssa_names);
540 memset (const_val, 0, num_ssa_names * sizeof (*const_val));
542 /* Initialize simulation flags for PHI nodes and statements. */
543 FOR_EACH_BB (bb)
545 block_stmt_iterator i;
547 for (i = bsi_start (bb); !bsi_end_p (i); bsi_next (&i))
549 bool is_varying = false;
550 tree stmt = bsi_stmt (i);
552 if (likely_value (stmt) == VARYING)
555 tree def;
556 ssa_op_iter iter;
558 /* If the statement will not produce a constant, mark
559 all its outputs VARYING. */
560 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
561 get_value (def, false)->lattice_val = VARYING;
563 /* Never mark conditional jumps with DONT_SIMULATE_AGAIN,
564 otherwise the propagator will never add the outgoing
565 control edges. */
566 if (TREE_CODE (stmt) != COND_EXPR
567 && TREE_CODE (stmt) != SWITCH_EXPR)
568 is_varying = true;
571 DONT_SIMULATE_AGAIN (stmt) = is_varying;
575 /* Now process PHI nodes. */
576 FOR_EACH_BB (bb)
578 tree phi;
580 for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
582 int i;
583 tree arg;
584 prop_value_t *val = get_value (PHI_RESULT (phi), false);
586 for (i = 0; i < PHI_NUM_ARGS (phi); i++)
588 arg = PHI_ARG_DEF (phi, i);
590 if (TREE_CODE (arg) == SSA_NAME
591 && get_value (arg, false)->lattice_val == VARYING)
593 val->lattice_val = VARYING;
594 break;
598 DONT_SIMULATE_AGAIN (phi) = (val->lattice_val == VARYING);
604 /* Do final substitution of propagated values, cleanup the flowgraph and
605 free allocated storage. */
607 static void
608 ccp_finalize (void)
610 /* Perform substitutions based on the known constant values. */
611 substitute_and_fold (const_val, false);
613 free (const_val);
617 /* Compute the meet operator between *VAL1 and *VAL2. Store the result
618 in VAL1.
620 any M UNDEFINED = any
621 any M UNKNOWN_VAL = UNKNOWN_VAL
622 any M VARYING = VARYING
623 Ci M Cj = Ci if (i == j)
624 Ci M Cj = VARYING if (i != j)
626 Lattice values UNKNOWN_VAL and UNDEFINED are similar but have
627 different semantics at PHI nodes. Both values imply that we don't
628 know whether the variable is constant or not. However, UNKNOWN_VAL
629 values override all others. For instance, suppose that A is a
630 global variable:
632 +------+
634 | / \
635 | / \
636 | | A_1 = 4
637 | \ /
638 | \ /
639 | A_3 = PHI (A_2, A_1)
640 | ... = A_3
642 +----+
644 If the edge into A_2 is not executable, the first visit to A_3 will
645 yield the constant 4. But the second visit to A_3 will be with A_2
646 in state UNKNOWN_VAL. We can no longer conclude that A_3 is 4
647 because A_2 may have been set in another function. If we had used
648 the lattice value UNDEFINED, we would have had wrongly concluded
649 that A_3 is 4. */
652 static void
653 ccp_lattice_meet (prop_value_t *val1, prop_value_t *val2)
655 if (val1->lattice_val == UNDEFINED)
657 /* UNDEFINED M any = any */
658 *val1 = *val2;
660 else if (val2->lattice_val == UNDEFINED)
662 /* any M UNDEFINED = any
663 Nothing to do. VAL1 already contains the value we want. */
666 else if (val1->lattice_val == UNKNOWN_VAL
667 || val2->lattice_val == UNKNOWN_VAL)
669 /* UNKNOWN_VAL values are invalid if we are not doing STORE-CCP. */
670 gcc_assert (do_store_ccp);
672 /* any M UNKNOWN_VAL = UNKNOWN_VAL. */
673 val1->lattice_val = UNKNOWN_VAL;
674 val1->value = NULL_TREE;
675 val1->mem_ref = NULL_TREE;
677 else if (val1->lattice_val == VARYING
678 || val2->lattice_val == VARYING)
680 /* any M VARYING = VARYING. */
681 val1->lattice_val = VARYING;
682 val1->value = NULL_TREE;
683 val1->mem_ref = NULL_TREE;
685 else if (val1->lattice_val == CONSTANT
686 && val2->lattice_val == CONSTANT
687 && simple_cst_equal (val1->value, val2->value) == 1
688 && (!do_store_ccp
689 || (val1->mem_ref && val2->mem_ref
690 && operand_equal_p (val1->mem_ref, val2->mem_ref, 0))))
692 /* Ci M Cj = Ci if (i == j)
693 Ci M Cj = VARYING if (i != j)
695 If these two values come from memory stores, make sure that
696 they come from the same memory reference. */
697 val1->lattice_val = CONSTANT;
698 val1->value = val1->value;
699 val1->mem_ref = val1->mem_ref;
701 else
703 /* Any other combination is VARYING. */
704 val1->lattice_val = VARYING;
705 val1->value = NULL_TREE;
706 val1->mem_ref = NULL_TREE;
711 /* Loop through the PHI_NODE's parameters for BLOCK and compare their
712 lattice values to determine PHI_NODE's lattice value. The value of a
713 PHI node is determined calling ccp_lattice_meet with all the arguments
714 of the PHI node that are incoming via executable edges. */
716 static enum ssa_prop_result
717 ccp_visit_phi_node (tree phi)
719 int i;
720 prop_value_t *old_val, new_val;
722 if (dump_file && (dump_flags & TDF_DETAILS))
724 fprintf (dump_file, "\nVisiting PHI node: ");
725 print_generic_expr (dump_file, phi, dump_flags);
728 old_val = get_value (PHI_RESULT (phi), false);
729 switch (old_val->lattice_val)
731 case VARYING:
732 return SSA_PROP_VARYING;
734 case CONSTANT:
735 new_val = *old_val;
736 break;
738 case UNKNOWN_VAL:
739 /* To avoid the default value of UNKNOWN_VAL overriding
740 that of its possible constant arguments, temporarily
741 set the PHI node's default lattice value to be
742 UNDEFINED. If the PHI node's old value was UNKNOWN_VAL and
743 the new value is UNDEFINED, then we prevent the invalid
744 transition by not calling set_lattice_value. */
745 gcc_assert (do_store_ccp);
747 /* FALLTHRU */
749 case UNDEFINED:
750 case UNINITIALIZED:
751 new_val.lattice_val = UNDEFINED;
752 new_val.value = NULL_TREE;
753 new_val.mem_ref = NULL_TREE;
754 break;
756 default:
757 gcc_unreachable ();
760 for (i = 0; i < PHI_NUM_ARGS (phi); i++)
762 /* Compute the meet operator over all the PHI arguments flowing
763 through executable edges. */
764 edge e = PHI_ARG_EDGE (phi, i);
766 if (dump_file && (dump_flags & TDF_DETAILS))
768 fprintf (dump_file,
769 "\n Argument #%d (%d -> %d %sexecutable)\n",
770 i, e->src->index, e->dest->index,
771 (e->flags & EDGE_EXECUTABLE) ? "" : "not ");
774 /* If the incoming edge is executable, Compute the meet operator for
775 the existing value of the PHI node and the current PHI argument. */
776 if (e->flags & EDGE_EXECUTABLE)
778 tree arg = PHI_ARG_DEF (phi, i);
779 prop_value_t arg_val;
781 if (is_gimple_min_invariant (arg))
783 arg_val.lattice_val = CONSTANT;
784 arg_val.value = arg;
785 arg_val.mem_ref = NULL_TREE;
787 else
788 arg_val = *(get_value (arg, true));
790 ccp_lattice_meet (&new_val, &arg_val);
792 if (dump_file && (dump_flags & TDF_DETAILS))
794 fprintf (dump_file, "\t");
795 print_generic_expr (dump_file, arg, dump_flags);
796 dump_lattice_value (dump_file, "\tValue: ", arg_val);
797 fprintf (dump_file, "\n");
800 if (new_val.lattice_val == VARYING)
801 break;
805 if (dump_file && (dump_flags & TDF_DETAILS))
807 dump_lattice_value (dump_file, "\n PHI node value: ", new_val);
808 fprintf (dump_file, "\n\n");
811 /* Check for an invalid change from UNKNOWN_VAL to UNDEFINED. */
812 if (do_store_ccp
813 && old_val->lattice_val == UNKNOWN_VAL
814 && new_val.lattice_val == UNDEFINED)
815 return SSA_PROP_NOT_INTERESTING;
817 /* Otherwise, make the transition to the new value. */
818 if (set_lattice_value (PHI_RESULT (phi), new_val))
820 if (new_val.lattice_val == VARYING)
821 return SSA_PROP_VARYING;
822 else
823 return SSA_PROP_INTERESTING;
825 else
826 return SSA_PROP_NOT_INTERESTING;
830 /* CCP specific front-end to the non-destructive constant folding
831 routines.
833 Attempt to simplify the RHS of STMT knowing that one or more
834 operands are constants.
836 If simplification is possible, return the simplified RHS,
837 otherwise return the original RHS. */
839 static tree
840 ccp_fold (tree stmt)
842 tree rhs = get_rhs (stmt);
843 enum tree_code code = TREE_CODE (rhs);
844 enum tree_code_class kind = TREE_CODE_CLASS (code);
845 tree retval = NULL_TREE;
847 if (TREE_CODE (rhs) == SSA_NAME)
849 /* If the RHS is an SSA_NAME, return its known constant value,
850 if any. */
851 return get_value (rhs, true)->value;
853 else if (do_store_ccp && stmt_makes_single_load (stmt))
855 /* If the RHS is a memory load, see if the VUSEs associated with
856 it are a valid constant for that memory load. */
857 prop_value_t *val = get_value_loaded_by (stmt, const_val);
858 if (val && val->mem_ref
859 && operand_equal_p (val->mem_ref, rhs, 0))
860 return val->value;
861 else
862 return NULL_TREE;
865 /* Unary operators. Note that we know the single operand must
866 be a constant. So this should almost always return a
867 simplified RHS. */
868 if (kind == tcc_unary)
870 /* Handle unary operators which can appear in GIMPLE form. */
871 tree op0 = TREE_OPERAND (rhs, 0);
873 /* Simplify the operand down to a constant. */
874 if (TREE_CODE (op0) == SSA_NAME)
876 prop_value_t *val = get_value (op0, true);
877 if (val->lattice_val == CONSTANT)
878 op0 = get_value (op0, true)->value;
881 if ((code == NOP_EXPR || code == CONVERT_EXPR)
882 && tree_ssa_useless_type_conversion_1 (TREE_TYPE (rhs),
883 TREE_TYPE (op0)))
884 return op0;
885 return fold_unary (code, TREE_TYPE (rhs), op0);
888 /* Binary and comparison operators. We know one or both of the
889 operands are constants. */
890 else if (kind == tcc_binary
891 || kind == tcc_comparison
892 || code == TRUTH_AND_EXPR
893 || code == TRUTH_OR_EXPR
894 || code == TRUTH_XOR_EXPR)
896 /* Handle binary and comparison operators that can appear in
897 GIMPLE form. */
898 tree op0 = TREE_OPERAND (rhs, 0);
899 tree op1 = TREE_OPERAND (rhs, 1);
901 /* Simplify the operands down to constants when appropriate. */
902 if (TREE_CODE (op0) == SSA_NAME)
904 prop_value_t *val = get_value (op0, true);
905 if (val->lattice_val == CONSTANT)
906 op0 = val->value;
909 if (TREE_CODE (op1) == SSA_NAME)
911 prop_value_t *val = get_value (op1, true);
912 if (val->lattice_val == CONSTANT)
913 op1 = val->value;
916 return fold_binary (code, TREE_TYPE (rhs), op0, op1);
919 /* We may be able to fold away calls to builtin functions if their
920 arguments are constants. */
921 else if (code == CALL_EXPR
922 && TREE_CODE (TREE_OPERAND (rhs, 0)) == ADDR_EXPR
923 && (TREE_CODE (TREE_OPERAND (TREE_OPERAND (rhs, 0), 0))
924 == FUNCTION_DECL)
925 && DECL_BUILT_IN (TREE_OPERAND (TREE_OPERAND (rhs, 0), 0)))
927 if (!ZERO_SSA_OPERANDS (stmt, SSA_OP_USE))
929 tree *orig, var;
930 tree fndecl, arglist;
931 size_t i = 0;
932 ssa_op_iter iter;
933 use_operand_p var_p;
935 /* Preserve the original values of every operand. */
936 orig = XNEWVEC (tree, NUM_SSA_OPERANDS (stmt, SSA_OP_USE));
937 FOR_EACH_SSA_TREE_OPERAND (var, stmt, iter, SSA_OP_USE)
938 orig[i++] = var;
940 /* Substitute operands with their values and try to fold. */
941 replace_uses_in (stmt, NULL, const_val);
942 fndecl = get_callee_fndecl (rhs);
943 arglist = TREE_OPERAND (rhs, 1);
944 retval = fold_builtin (fndecl, arglist, false);
946 /* Restore operands to their original form. */
947 i = 0;
948 FOR_EACH_SSA_USE_OPERAND (var_p, stmt, iter, SSA_OP_USE)
949 SET_USE (var_p, orig[i++]);
950 free (orig);
953 else
954 return rhs;
956 /* If we got a simplified form, see if we need to convert its type. */
957 if (retval)
958 return fold_convert (TREE_TYPE (rhs), retval);
960 /* No simplification was possible. */
961 return rhs;
965 /* Return the tree representing the element referenced by T if T is an
966 ARRAY_REF or COMPONENT_REF into constant aggregates. Return
967 NULL_TREE otherwise. */
969 static tree
970 fold_const_aggregate_ref (tree t)
972 prop_value_t *value;
973 tree base, ctor, idx, field;
974 unsigned HOST_WIDE_INT cnt;
975 tree cfield, cval;
977 switch (TREE_CODE (t))
979 case ARRAY_REF:
980 /* Get a CONSTRUCTOR. If BASE is a VAR_DECL, get its
981 DECL_INITIAL. If BASE is a nested reference into another
982 ARRAY_REF or COMPONENT_REF, make a recursive call to resolve
983 the inner reference. */
984 base = TREE_OPERAND (t, 0);
985 switch (TREE_CODE (base))
987 case VAR_DECL:
988 if (!TREE_READONLY (base)
989 || TREE_CODE (TREE_TYPE (base)) != ARRAY_TYPE
990 || !targetm.binds_local_p (base))
991 return NULL_TREE;
993 ctor = DECL_INITIAL (base);
994 break;
996 case ARRAY_REF:
997 case COMPONENT_REF:
998 ctor = fold_const_aggregate_ref (base);
999 break;
1001 default:
1002 return NULL_TREE;
1005 if (ctor == NULL_TREE
1006 || TREE_CODE (ctor) != CONSTRUCTOR
1007 || !TREE_STATIC (ctor))
1008 return NULL_TREE;
1010 /* Get the index. If we have an SSA_NAME, try to resolve it
1011 with the current lattice value for the SSA_NAME. */
1012 idx = TREE_OPERAND (t, 1);
1013 switch (TREE_CODE (idx))
1015 case SSA_NAME:
1016 if ((value = get_value (idx, true))
1017 && value->lattice_val == CONSTANT
1018 && TREE_CODE (value->value) == INTEGER_CST)
1019 idx = value->value;
1020 else
1021 return NULL_TREE;
1022 break;
1024 case INTEGER_CST:
1025 break;
1027 default:
1028 return NULL_TREE;
1031 /* Whoo-hoo! I'll fold ya baby. Yeah! */
1032 FOR_EACH_CONSTRUCTOR_ELT (CONSTRUCTOR_ELTS (ctor), cnt, cfield, cval)
1033 if (tree_int_cst_equal (cfield, idx))
1034 return cval;
1035 break;
1037 case COMPONENT_REF:
1038 /* Get a CONSTRUCTOR. If BASE is a VAR_DECL, get its
1039 DECL_INITIAL. If BASE is a nested reference into another
1040 ARRAY_REF or COMPONENT_REF, make a recursive call to resolve
1041 the inner reference. */
1042 base = TREE_OPERAND (t, 0);
1043 switch (TREE_CODE (base))
1045 case VAR_DECL:
1046 if (!TREE_READONLY (base)
1047 || TREE_CODE (TREE_TYPE (base)) != RECORD_TYPE
1048 || !targetm.binds_local_p (base))
1049 return NULL_TREE;
1051 ctor = DECL_INITIAL (base);
1052 break;
1054 case ARRAY_REF:
1055 case COMPONENT_REF:
1056 ctor = fold_const_aggregate_ref (base);
1057 break;
1059 default:
1060 return NULL_TREE;
1063 if (ctor == NULL_TREE
1064 || TREE_CODE (ctor) != CONSTRUCTOR
1065 || !TREE_STATIC (ctor))
1066 return NULL_TREE;
1068 field = TREE_OPERAND (t, 1);
1070 FOR_EACH_CONSTRUCTOR_ELT (CONSTRUCTOR_ELTS (ctor), cnt, cfield, cval)
1071 if (cfield == field
1072 /* FIXME: Handle bit-fields. */
1073 && ! DECL_BIT_FIELD (cfield))
1074 return cval;
1075 break;
1077 case REALPART_EXPR:
1078 case IMAGPART_EXPR:
1080 tree c = fold_const_aggregate_ref (TREE_OPERAND (t, 0));
1081 if (c && TREE_CODE (c) == COMPLEX_CST)
1082 return fold_build1 (TREE_CODE (t), TREE_TYPE (t), c);
1083 break;
1086 default:
1087 break;
1090 return NULL_TREE;
1093 /* Evaluate statement STMT. */
1095 static prop_value_t
1096 evaluate_stmt (tree stmt)
1098 prop_value_t val;
1099 tree simplified;
1100 ccp_lattice_t likelyvalue = likely_value (stmt);
1102 val.mem_ref = NULL_TREE;
1104 /* If the statement is likely to have a CONSTANT result, then try
1105 to fold the statement to determine the constant value. */
1106 if (likelyvalue == CONSTANT)
1107 simplified = ccp_fold (stmt);
1108 /* If the statement is likely to have a VARYING result, then do not
1109 bother folding the statement. */
1110 else if (likelyvalue == VARYING)
1111 simplified = get_rhs (stmt);
1112 /* If the statement is an ARRAY_REF or COMPONENT_REF into constant
1113 aggregates, extract the referenced constant. Otherwise the
1114 statement is likely to have an UNDEFINED value, and there will be
1115 nothing to do. Note that fold_const_aggregate_ref returns
1116 NULL_TREE if the first case does not match. */
1117 else
1118 simplified = fold_const_aggregate_ref (get_rhs (stmt));
1120 if (simplified && is_gimple_min_invariant (simplified))
1122 /* The statement produced a constant value. */
1123 val.lattice_val = CONSTANT;
1124 val.value = simplified;
1126 else
1128 /* The statement produced a nonconstant value. If the statement
1129 had UNDEFINED operands, then the result of the statement
1130 should be UNDEFINED. Otherwise, the statement is VARYING. */
1131 if (likelyvalue == UNDEFINED || likelyvalue == UNKNOWN_VAL)
1132 val.lattice_val = likelyvalue;
1133 else
1134 val.lattice_val = VARYING;
1136 val.value = NULL_TREE;
1139 return val;
1143 /* Visit the assignment statement STMT. Set the value of its LHS to the
1144 value computed by the RHS and store LHS in *OUTPUT_P. If STMT
1145 creates virtual definitions, set the value of each new name to that
1146 of the RHS (if we can derive a constant out of the RHS). */
1148 static enum ssa_prop_result
1149 visit_assignment (tree stmt, tree *output_p)
1151 prop_value_t val;
1152 tree lhs, rhs;
1153 enum ssa_prop_result retval;
1155 lhs = TREE_OPERAND (stmt, 0);
1156 rhs = TREE_OPERAND (stmt, 1);
1158 if (TREE_CODE (rhs) == SSA_NAME)
1160 /* For a simple copy operation, we copy the lattice values. */
1161 prop_value_t *nval = get_value (rhs, true);
1162 val = *nval;
1164 else if (do_store_ccp && stmt_makes_single_load (stmt))
1166 /* Same as above, but the RHS is not a gimple register and yet
1167 has a known VUSE. If STMT is loading from the same memory
1168 location that created the SSA_NAMEs for the virtual operands,
1169 we can propagate the value on the RHS. */
1170 prop_value_t *nval = get_value_loaded_by (stmt, const_val);
1172 if (nval && nval->mem_ref
1173 && operand_equal_p (nval->mem_ref, rhs, 0))
1174 val = *nval;
1175 else
1176 val = evaluate_stmt (stmt);
1178 else
1179 /* Evaluate the statement. */
1180 val = evaluate_stmt (stmt);
1182 /* If the original LHS was a VIEW_CONVERT_EXPR, modify the constant
1183 value to be a VIEW_CONVERT_EXPR of the old constant value.
1185 ??? Also, if this was a definition of a bitfield, we need to widen
1186 the constant value into the type of the destination variable. This
1187 should not be necessary if GCC represented bitfields properly. */
1189 tree orig_lhs = TREE_OPERAND (stmt, 0);
1191 if (TREE_CODE (orig_lhs) == VIEW_CONVERT_EXPR
1192 && val.lattice_val == CONSTANT)
1194 tree w = fold_unary (VIEW_CONVERT_EXPR,
1195 TREE_TYPE (TREE_OPERAND (orig_lhs, 0)),
1196 val.value);
1198 orig_lhs = TREE_OPERAND (orig_lhs, 0);
1199 if (w && is_gimple_min_invariant (w))
1200 val.value = w;
1201 else
1203 val.lattice_val = VARYING;
1204 val.value = NULL;
1208 if (val.lattice_val == CONSTANT
1209 && TREE_CODE (orig_lhs) == COMPONENT_REF
1210 && DECL_BIT_FIELD (TREE_OPERAND (orig_lhs, 1)))
1212 tree w = widen_bitfield (val.value, TREE_OPERAND (orig_lhs, 1),
1213 orig_lhs);
1215 if (w && is_gimple_min_invariant (w))
1216 val.value = w;
1217 else
1219 val.lattice_val = VARYING;
1220 val.value = NULL_TREE;
1221 val.mem_ref = NULL_TREE;
1226 retval = SSA_PROP_NOT_INTERESTING;
1228 /* Set the lattice value of the statement's output. */
1229 if (TREE_CODE (lhs) == SSA_NAME)
1231 /* If STMT is an assignment to an SSA_NAME, we only have one
1232 value to set. */
1233 if (set_lattice_value (lhs, val))
1235 *output_p = lhs;
1236 if (val.lattice_val == VARYING)
1237 retval = SSA_PROP_VARYING;
1238 else
1239 retval = SSA_PROP_INTERESTING;
1242 else if (do_store_ccp && stmt_makes_single_store (stmt))
1244 /* Otherwise, set the names in V_MAY_DEF/V_MUST_DEF operands
1245 to the new constant value and mark the LHS as the memory
1246 reference associated with VAL. */
1247 ssa_op_iter i;
1248 tree vdef;
1249 bool changed;
1251 /* Stores cannot take on an UNDEFINED value. */
1252 if (val.lattice_val == UNDEFINED)
1253 val.lattice_val = UNKNOWN_VAL;
1255 /* Mark VAL as stored in the LHS of this assignment. */
1256 val.mem_ref = lhs;
1258 /* Set the value of every VDEF to VAL. */
1259 changed = false;
1260 FOR_EACH_SSA_TREE_OPERAND (vdef, stmt, i, SSA_OP_VIRTUAL_DEFS)
1261 changed |= set_lattice_value (vdef, val);
1263 /* Note that for propagation purposes, we are only interested in
1264 visiting statements that load the exact same memory reference
1265 stored here. Those statements will have the exact same list
1266 of virtual uses, so it is enough to set the output of this
1267 statement to be its first virtual definition. */
1268 *output_p = first_vdef (stmt);
1269 if (changed)
1271 if (val.lattice_val == VARYING)
1272 retval = SSA_PROP_VARYING;
1273 else
1274 retval = SSA_PROP_INTERESTING;
1278 return retval;
1282 /* Visit the conditional statement STMT. Return SSA_PROP_INTERESTING
1283 if it can determine which edge will be taken. Otherwise, return
1284 SSA_PROP_VARYING. */
1286 static enum ssa_prop_result
1287 visit_cond_stmt (tree stmt, edge *taken_edge_p)
1289 prop_value_t val;
1290 basic_block block;
1292 block = bb_for_stmt (stmt);
1293 val = evaluate_stmt (stmt);
1295 /* Find which edge out of the conditional block will be taken and add it
1296 to the worklist. If no single edge can be determined statically,
1297 return SSA_PROP_VARYING to feed all the outgoing edges to the
1298 propagation engine. */
1299 *taken_edge_p = val.value ? find_taken_edge (block, val.value) : 0;
1300 if (*taken_edge_p)
1301 return SSA_PROP_INTERESTING;
1302 else
1303 return SSA_PROP_VARYING;
1307 /* Evaluate statement STMT. If the statement produces an output value and
1308 its evaluation changes the lattice value of its output, return
1309 SSA_PROP_INTERESTING and set *OUTPUT_P to the SSA_NAME holding the
1310 output value.
1312 If STMT is a conditional branch and we can determine its truth
1313 value, set *TAKEN_EDGE_P accordingly. If STMT produces a varying
1314 value, return SSA_PROP_VARYING. */
1316 static enum ssa_prop_result
1317 ccp_visit_stmt (tree stmt, edge *taken_edge_p, tree *output_p)
1319 tree def;
1320 ssa_op_iter iter;
1322 if (dump_file && (dump_flags & TDF_DETAILS))
1324 fprintf (dump_file, "\nVisiting statement:\n");
1325 print_generic_stmt (dump_file, stmt, dump_flags);
1326 fprintf (dump_file, "\n");
1329 if (TREE_CODE (stmt) == MODIFY_EXPR)
1331 /* If the statement is an assignment that produces a single
1332 output value, evaluate its RHS to see if the lattice value of
1333 its output has changed. */
1334 return visit_assignment (stmt, output_p);
1336 else if (TREE_CODE (stmt) == COND_EXPR || TREE_CODE (stmt) == SWITCH_EXPR)
1338 /* If STMT is a conditional branch, see if we can determine
1339 which branch will be taken. */
1340 return visit_cond_stmt (stmt, taken_edge_p);
1343 /* Any other kind of statement is not interesting for constant
1344 propagation and, therefore, not worth simulating. */
1345 if (dump_file && (dump_flags & TDF_DETAILS))
1346 fprintf (dump_file, "No interesting values produced. Marked VARYING.\n");
1348 /* Definitions made by statements other than assignments to
1349 SSA_NAMEs represent unknown modifications to their outputs.
1350 Mark them VARYING. */
1351 FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_ALL_DEFS)
1353 prop_value_t v = { VARYING, NULL_TREE, NULL_TREE };
1354 set_lattice_value (def, v);
1357 return SSA_PROP_VARYING;
1361 /* Main entry point for SSA Conditional Constant Propagation. */
1363 static void
1364 execute_ssa_ccp (bool store_ccp)
1366 do_store_ccp = store_ccp;
1367 ccp_initialize ();
1368 ssa_propagate (ccp_visit_stmt, ccp_visit_phi_node);
1369 ccp_finalize ();
1373 static void
1374 do_ssa_ccp (void)
1376 execute_ssa_ccp (false);
1380 static bool
1381 gate_ccp (void)
1383 return flag_tree_ccp != 0;
1387 struct tree_opt_pass pass_ccp =
1389 "ccp", /* name */
1390 gate_ccp, /* gate */
1391 do_ssa_ccp, /* execute */
1392 NULL, /* sub */
1393 NULL, /* next */
1394 0, /* static_pass_number */
1395 TV_TREE_CCP, /* tv_id */
1396 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
1397 0, /* properties_provided */
1398 0, /* properties_destroyed */
1399 0, /* todo_flags_start */
1400 TODO_cleanup_cfg | TODO_dump_func | TODO_update_ssa
1401 | TODO_ggc_collect | TODO_verify_ssa
1402 | TODO_verify_stmts, /* todo_flags_finish */
1403 0 /* letter */
1407 static void
1408 do_ssa_store_ccp (void)
1410 /* If STORE-CCP is not enabled, we just run regular CCP. */
1411 execute_ssa_ccp (flag_tree_store_ccp != 0);
1414 static bool
1415 gate_store_ccp (void)
1417 /* STORE-CCP is enabled only with -ftree-store-ccp, but when
1418 -fno-tree-store-ccp is specified, we should run regular CCP.
1419 That's why the pass is enabled with either flag. */
1420 return flag_tree_store_ccp != 0 || flag_tree_ccp != 0;
1424 struct tree_opt_pass pass_store_ccp =
1426 "store_ccp", /* name */
1427 gate_store_ccp, /* gate */
1428 do_ssa_store_ccp, /* execute */
1429 NULL, /* sub */
1430 NULL, /* next */
1431 0, /* static_pass_number */
1432 TV_TREE_STORE_CCP, /* tv_id */
1433 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
1434 0, /* properties_provided */
1435 0, /* properties_destroyed */
1436 0, /* todo_flags_start */
1437 TODO_dump_func | TODO_update_ssa
1438 | TODO_ggc_collect | TODO_verify_ssa
1439 | TODO_cleanup_cfg
1440 | TODO_verify_stmts, /* todo_flags_finish */
1441 0 /* letter */
1444 /* Given a constant value VAL for bitfield FIELD, and a destination
1445 variable VAR, return VAL appropriately widened to fit into VAR. If
1446 FIELD is wider than HOST_WIDE_INT, NULL is returned. */
1448 tree
1449 widen_bitfield (tree val, tree field, tree var)
1451 unsigned HOST_WIDE_INT var_size, field_size;
1452 tree wide_val;
1453 unsigned HOST_WIDE_INT mask;
1454 unsigned int i;
1456 /* We can only do this if the size of the type and field and VAL are
1457 all constants representable in HOST_WIDE_INT. */
1458 if (!host_integerp (TYPE_SIZE (TREE_TYPE (var)), 1)
1459 || !host_integerp (DECL_SIZE (field), 1)
1460 || !host_integerp (val, 0))
1461 return NULL_TREE;
1463 var_size = tree_low_cst (TYPE_SIZE (TREE_TYPE (var)), 1);
1464 field_size = tree_low_cst (DECL_SIZE (field), 1);
1466 /* Give up if either the bitfield or the variable are too wide. */
1467 if (field_size > HOST_BITS_PER_WIDE_INT || var_size > HOST_BITS_PER_WIDE_INT)
1468 return NULL_TREE;
1470 gcc_assert (var_size >= field_size);
1472 /* If the sign bit of the value is not set or the field's type is unsigned,
1473 just mask off the high order bits of the value. */
1474 if (DECL_UNSIGNED (field)
1475 || !(tree_low_cst (val, 0) & (((HOST_WIDE_INT)1) << (field_size - 1))))
1477 /* Zero extension. Build a mask with the lower 'field_size' bits
1478 set and a BIT_AND_EXPR node to clear the high order bits of
1479 the value. */
1480 for (i = 0, mask = 0; i < field_size; i++)
1481 mask |= ((HOST_WIDE_INT) 1) << i;
1483 wide_val = fold_build2 (BIT_AND_EXPR, TREE_TYPE (var), val,
1484 build_int_cst (TREE_TYPE (var), mask));
1486 else
1488 /* Sign extension. Create a mask with the upper 'field_size'
1489 bits set and a BIT_IOR_EXPR to set the high order bits of the
1490 value. */
1491 for (i = 0, mask = 0; i < (var_size - field_size); i++)
1492 mask |= ((HOST_WIDE_INT) 1) << (var_size - i - 1);
1494 wide_val = fold_build2 (BIT_IOR_EXPR, TREE_TYPE (var), val,
1495 build_int_cst (TREE_TYPE (var), mask));
1498 return wide_val;
1502 /* A subroutine of fold_stmt_r. Attempts to fold *(A+O) to A[X].
1503 BASE is an array type. OFFSET is a byte displacement. ORIG_TYPE
1504 is the desired result type. */
1506 static tree
1507 maybe_fold_offset_to_array_ref (tree base, tree offset, tree orig_type)
1509 tree min_idx, idx, elt_offset = integer_zero_node;
1510 tree array_type, elt_type, elt_size;
1512 /* If BASE is an ARRAY_REF, we can pick up another offset (this time
1513 measured in units of the size of elements type) from that ARRAY_REF).
1514 We can't do anything if either is variable.
1516 The case we handle here is *(&A[N]+O). */
1517 if (TREE_CODE (base) == ARRAY_REF)
1519 tree low_bound = array_ref_low_bound (base);
1521 elt_offset = TREE_OPERAND (base, 1);
1522 if (TREE_CODE (low_bound) != INTEGER_CST
1523 || TREE_CODE (elt_offset) != INTEGER_CST)
1524 return NULL_TREE;
1526 elt_offset = int_const_binop (MINUS_EXPR, elt_offset, low_bound, 0);
1527 base = TREE_OPERAND (base, 0);
1530 /* Ignore stupid user tricks of indexing non-array variables. */
1531 array_type = TREE_TYPE (base);
1532 if (TREE_CODE (array_type) != ARRAY_TYPE)
1533 return NULL_TREE;
1534 elt_type = TREE_TYPE (array_type);
1535 if (!lang_hooks.types_compatible_p (orig_type, elt_type))
1536 return NULL_TREE;
1538 /* If OFFSET and ELT_OFFSET are zero, we don't care about the size of the
1539 element type (so we can use the alignment if it's not constant).
1540 Otherwise, compute the offset as an index by using a division. If the
1541 division isn't exact, then don't do anything. */
1542 elt_size = TYPE_SIZE_UNIT (elt_type);
1543 if (integer_zerop (offset))
1545 if (TREE_CODE (elt_size) != INTEGER_CST)
1546 elt_size = size_int (TYPE_ALIGN (elt_type));
1548 idx = integer_zero_node;
1550 else
1552 unsigned HOST_WIDE_INT lquo, lrem;
1553 HOST_WIDE_INT hquo, hrem;
1555 if (TREE_CODE (elt_size) != INTEGER_CST
1556 || div_and_round_double (TRUNC_DIV_EXPR, 1,
1557 TREE_INT_CST_LOW (offset),
1558 TREE_INT_CST_HIGH (offset),
1559 TREE_INT_CST_LOW (elt_size),
1560 TREE_INT_CST_HIGH (elt_size),
1561 &lquo, &hquo, &lrem, &hrem)
1562 || lrem || hrem)
1563 return NULL_TREE;
1565 idx = build_int_cst_wide (NULL_TREE, lquo, hquo);
1568 /* Assume the low bound is zero. If there is a domain type, get the
1569 low bound, if any, convert the index into that type, and add the
1570 low bound. */
1571 min_idx = integer_zero_node;
1572 if (TYPE_DOMAIN (array_type))
1574 if (TYPE_MIN_VALUE (TYPE_DOMAIN (array_type)))
1575 min_idx = TYPE_MIN_VALUE (TYPE_DOMAIN (array_type));
1576 else
1577 min_idx = fold_convert (TYPE_DOMAIN (array_type), min_idx);
1579 if (TREE_CODE (min_idx) != INTEGER_CST)
1580 return NULL_TREE;
1582 idx = fold_convert (TYPE_DOMAIN (array_type), idx);
1583 elt_offset = fold_convert (TYPE_DOMAIN (array_type), elt_offset);
1586 if (!integer_zerop (min_idx))
1587 idx = int_const_binop (PLUS_EXPR, idx, min_idx, 0);
1588 if (!integer_zerop (elt_offset))
1589 idx = int_const_binop (PLUS_EXPR, idx, elt_offset, 0);
1591 return build4 (ARRAY_REF, orig_type, base, idx, min_idx,
1592 size_int (tree_low_cst (elt_size, 1)
1593 / (TYPE_ALIGN_UNIT (elt_type))));
1597 /* A subroutine of fold_stmt_r. Attempts to fold *(S+O) to S.X.
1598 BASE is a record type. OFFSET is a byte displacement. ORIG_TYPE
1599 is the desired result type. */
1600 /* ??? This doesn't handle class inheritance. */
1602 static tree
1603 maybe_fold_offset_to_component_ref (tree record_type, tree base, tree offset,
1604 tree orig_type, bool base_is_ptr)
1606 tree f, t, field_type, tail_array_field, field_offset;
1608 if (TREE_CODE (record_type) != RECORD_TYPE
1609 && TREE_CODE (record_type) != UNION_TYPE
1610 && TREE_CODE (record_type) != QUAL_UNION_TYPE)
1611 return NULL_TREE;
1613 /* Short-circuit silly cases. */
1614 if (lang_hooks.types_compatible_p (record_type, orig_type))
1615 return NULL_TREE;
1617 tail_array_field = NULL_TREE;
1618 for (f = TYPE_FIELDS (record_type); f ; f = TREE_CHAIN (f))
1620 int cmp;
1622 if (TREE_CODE (f) != FIELD_DECL)
1623 continue;
1624 if (DECL_BIT_FIELD (f))
1625 continue;
1627 field_offset = byte_position (f);
1628 if (TREE_CODE (field_offset) != INTEGER_CST)
1629 continue;
1631 /* ??? Java creates "interesting" fields for representing base classes.
1632 They have no name, and have no context. With no context, we get into
1633 trouble with nonoverlapping_component_refs_p. Skip them. */
1634 if (!DECL_FIELD_CONTEXT (f))
1635 continue;
1637 /* The previous array field isn't at the end. */
1638 tail_array_field = NULL_TREE;
1640 /* Check to see if this offset overlaps with the field. */
1641 cmp = tree_int_cst_compare (field_offset, offset);
1642 if (cmp > 0)
1643 continue;
1645 field_type = TREE_TYPE (f);
1647 /* Here we exactly match the offset being checked. If the types match,
1648 then we can return that field. */
1649 if (cmp == 0
1650 && lang_hooks.types_compatible_p (orig_type, field_type))
1652 if (base_is_ptr)
1653 base = build1 (INDIRECT_REF, record_type, base);
1654 t = build3 (COMPONENT_REF, field_type, base, f, NULL_TREE);
1655 return t;
1658 /* Don't care about offsets into the middle of scalars. */
1659 if (!AGGREGATE_TYPE_P (field_type))
1660 continue;
1662 /* Check for array at the end of the struct. This is often
1663 used as for flexible array members. We should be able to
1664 turn this into an array access anyway. */
1665 if (TREE_CODE (field_type) == ARRAY_TYPE)
1666 tail_array_field = f;
1668 /* Check the end of the field against the offset. */
1669 if (!DECL_SIZE_UNIT (f)
1670 || TREE_CODE (DECL_SIZE_UNIT (f)) != INTEGER_CST)
1671 continue;
1672 t = int_const_binop (MINUS_EXPR, offset, field_offset, 1);
1673 if (!tree_int_cst_lt (t, DECL_SIZE_UNIT (f)))
1674 continue;
1676 /* If we matched, then set offset to the displacement into
1677 this field. */
1678 offset = t;
1679 goto found;
1682 if (!tail_array_field)
1683 return NULL_TREE;
1685 f = tail_array_field;
1686 field_type = TREE_TYPE (f);
1687 offset = int_const_binop (MINUS_EXPR, offset, byte_position (f), 1);
1689 found:
1690 /* If we get here, we've got an aggregate field, and a possibly
1691 nonzero offset into them. Recurse and hope for a valid match. */
1692 if (base_is_ptr)
1693 base = build1 (INDIRECT_REF, record_type, base);
1694 base = build3 (COMPONENT_REF, field_type, base, f, NULL_TREE);
1696 t = maybe_fold_offset_to_array_ref (base, offset, orig_type);
1697 if (t)
1698 return t;
1699 return maybe_fold_offset_to_component_ref (field_type, base, offset,
1700 orig_type, false);
1704 /* A subroutine of fold_stmt_r. Attempt to simplify *(BASE+OFFSET).
1705 Return the simplified expression, or NULL if nothing could be done. */
1707 static tree
1708 maybe_fold_stmt_indirect (tree expr, tree base, tree offset)
1710 tree t;
1712 /* We may well have constructed a double-nested PLUS_EXPR via multiple
1713 substitutions. Fold that down to one. Remove NON_LVALUE_EXPRs that
1714 are sometimes added. */
1715 base = fold (base);
1716 STRIP_TYPE_NOPS (base);
1717 TREE_OPERAND (expr, 0) = base;
1719 /* One possibility is that the address reduces to a string constant. */
1720 t = fold_read_from_constant_string (expr);
1721 if (t)
1722 return t;
1724 /* Add in any offset from a PLUS_EXPR. */
1725 if (TREE_CODE (base) == PLUS_EXPR)
1727 tree offset2;
1729 offset2 = TREE_OPERAND (base, 1);
1730 if (TREE_CODE (offset2) != INTEGER_CST)
1731 return NULL_TREE;
1732 base = TREE_OPERAND (base, 0);
1734 offset = int_const_binop (PLUS_EXPR, offset, offset2, 1);
1737 if (TREE_CODE (base) == ADDR_EXPR)
1739 /* Strip the ADDR_EXPR. */
1740 base = TREE_OPERAND (base, 0);
1742 /* Fold away CONST_DECL to its value, if the type is scalar. */
1743 if (TREE_CODE (base) == CONST_DECL
1744 && ccp_decl_initial_min_invariant (DECL_INITIAL (base)))
1745 return DECL_INITIAL (base);
1747 /* Try folding *(&B+O) to B[X]. */
1748 t = maybe_fold_offset_to_array_ref (base, offset, TREE_TYPE (expr));
1749 if (t)
1750 return t;
1752 /* Try folding *(&B+O) to B.X. */
1753 t = maybe_fold_offset_to_component_ref (TREE_TYPE (base), base, offset,
1754 TREE_TYPE (expr), false);
1755 if (t)
1756 return t;
1758 /* Fold *&B to B. We can only do this if EXPR is the same type
1759 as BASE. We can't do this if EXPR is the element type of an array
1760 and BASE is the array. */
1761 if (integer_zerop (offset)
1762 && lang_hooks.types_compatible_p (TREE_TYPE (base),
1763 TREE_TYPE (expr)))
1764 return base;
1766 else
1768 /* We can get here for out-of-range string constant accesses,
1769 such as "_"[3]. Bail out of the entire substitution search
1770 and arrange for the entire statement to be replaced by a
1771 call to __builtin_trap. In all likelihood this will all be
1772 constant-folded away, but in the meantime we can't leave with
1773 something that get_expr_operands can't understand. */
1775 t = base;
1776 STRIP_NOPS (t);
1777 if (TREE_CODE (t) == ADDR_EXPR
1778 && TREE_CODE (TREE_OPERAND (t, 0)) == STRING_CST)
1780 /* FIXME: Except that this causes problems elsewhere with dead
1781 code not being deleted, and we die in the rtl expanders
1782 because we failed to remove some ssa_name. In the meantime,
1783 just return zero. */
1784 /* FIXME2: This condition should be signaled by
1785 fold_read_from_constant_string directly, rather than
1786 re-checking for it here. */
1787 return integer_zero_node;
1790 /* Try folding *(B+O) to B->X. Still an improvement. */
1791 if (POINTER_TYPE_P (TREE_TYPE (base)))
1793 t = maybe_fold_offset_to_component_ref (TREE_TYPE (TREE_TYPE (base)),
1794 base, offset,
1795 TREE_TYPE (expr), true);
1796 if (t)
1797 return t;
1801 /* Otherwise we had an offset that we could not simplify. */
1802 return NULL_TREE;
1806 /* A subroutine of fold_stmt_r. EXPR is a PLUS_EXPR.
1808 A quaint feature extant in our address arithmetic is that there
1809 can be hidden type changes here. The type of the result need
1810 not be the same as the type of the input pointer.
1812 What we're after here is an expression of the form
1813 (T *)(&array + const)
1814 where the cast doesn't actually exist, but is implicit in the
1815 type of the PLUS_EXPR. We'd like to turn this into
1816 &array[x]
1817 which may be able to propagate further. */
1819 static tree
1820 maybe_fold_stmt_addition (tree expr)
1822 tree op0 = TREE_OPERAND (expr, 0);
1823 tree op1 = TREE_OPERAND (expr, 1);
1824 tree ptr_type = TREE_TYPE (expr);
1825 tree ptd_type;
1826 tree t;
1827 bool subtract = (TREE_CODE (expr) == MINUS_EXPR);
1829 /* We're only interested in pointer arithmetic. */
1830 if (!POINTER_TYPE_P (ptr_type))
1831 return NULL_TREE;
1832 /* Canonicalize the integral operand to op1. */
1833 if (INTEGRAL_TYPE_P (TREE_TYPE (op0)))
1835 if (subtract)
1836 return NULL_TREE;
1837 t = op0, op0 = op1, op1 = t;
1839 /* It had better be a constant. */
1840 if (TREE_CODE (op1) != INTEGER_CST)
1841 return NULL_TREE;
1842 /* The first operand should be an ADDR_EXPR. */
1843 if (TREE_CODE (op0) != ADDR_EXPR)
1844 return NULL_TREE;
1845 op0 = TREE_OPERAND (op0, 0);
1847 /* If the first operand is an ARRAY_REF, expand it so that we can fold
1848 the offset into it. */
1849 while (TREE_CODE (op0) == ARRAY_REF)
1851 tree array_obj = TREE_OPERAND (op0, 0);
1852 tree array_idx = TREE_OPERAND (op0, 1);
1853 tree elt_type = TREE_TYPE (op0);
1854 tree elt_size = TYPE_SIZE_UNIT (elt_type);
1855 tree min_idx;
1857 if (TREE_CODE (array_idx) != INTEGER_CST)
1858 break;
1859 if (TREE_CODE (elt_size) != INTEGER_CST)
1860 break;
1862 /* Un-bias the index by the min index of the array type. */
1863 min_idx = TYPE_DOMAIN (TREE_TYPE (array_obj));
1864 if (min_idx)
1866 min_idx = TYPE_MIN_VALUE (min_idx);
1867 if (min_idx)
1869 if (TREE_CODE (min_idx) != INTEGER_CST)
1870 break;
1872 array_idx = convert (TREE_TYPE (min_idx), array_idx);
1873 if (!integer_zerop (min_idx))
1874 array_idx = int_const_binop (MINUS_EXPR, array_idx,
1875 min_idx, 0);
1879 /* Convert the index to a byte offset. */
1880 array_idx = convert (sizetype, array_idx);
1881 array_idx = int_const_binop (MULT_EXPR, array_idx, elt_size, 0);
1883 /* Update the operands for the next round, or for folding. */
1884 /* If we're manipulating unsigned types, then folding into negative
1885 values can produce incorrect results. Particularly if the type
1886 is smaller than the width of the pointer. */
1887 if (subtract
1888 && TYPE_UNSIGNED (TREE_TYPE (op1))
1889 && tree_int_cst_lt (array_idx, op1))
1890 return NULL;
1891 op1 = int_const_binop (subtract ? MINUS_EXPR : PLUS_EXPR,
1892 array_idx, op1, 0);
1893 subtract = false;
1894 op0 = array_obj;
1897 /* If we weren't able to fold the subtraction into another array reference,
1898 canonicalize the integer for passing to the array and component ref
1899 simplification functions. */
1900 if (subtract)
1902 if (TYPE_UNSIGNED (TREE_TYPE (op1)))
1903 return NULL;
1904 op1 = fold_unary (NEGATE_EXPR, TREE_TYPE (op1), op1);
1905 /* ??? In theory fold should always produce another integer. */
1906 if (op1 == NULL || TREE_CODE (op1) != INTEGER_CST)
1907 return NULL;
1910 ptd_type = TREE_TYPE (ptr_type);
1912 /* At which point we can try some of the same things as for indirects. */
1913 t = maybe_fold_offset_to_array_ref (op0, op1, ptd_type);
1914 if (!t)
1915 t = maybe_fold_offset_to_component_ref (TREE_TYPE (op0), op0, op1,
1916 ptd_type, false);
1917 if (t)
1918 t = build1 (ADDR_EXPR, ptr_type, t);
1920 return t;
1923 /* For passing state through walk_tree into fold_stmt_r and its
1924 children. */
1926 struct fold_stmt_r_data
1928 bool *changed_p;
1929 bool *inside_addr_expr_p;
1932 /* Subroutine of fold_stmt called via walk_tree. We perform several
1933 simplifications of EXPR_P, mostly having to do with pointer arithmetic. */
1935 static tree
1936 fold_stmt_r (tree *expr_p, int *walk_subtrees, void *data)
1938 struct fold_stmt_r_data *fold_stmt_r_data = (struct fold_stmt_r_data *) data;
1939 bool *inside_addr_expr_p = fold_stmt_r_data->inside_addr_expr_p;
1940 bool *changed_p = fold_stmt_r_data->changed_p;
1941 tree expr = *expr_p, t;
1943 /* ??? It'd be nice if walk_tree had a pre-order option. */
1944 switch (TREE_CODE (expr))
1946 case INDIRECT_REF:
1947 t = walk_tree (&TREE_OPERAND (expr, 0), fold_stmt_r, data, NULL);
1948 if (t)
1949 return t;
1950 *walk_subtrees = 0;
1952 t = maybe_fold_stmt_indirect (expr, TREE_OPERAND (expr, 0),
1953 integer_zero_node);
1954 break;
1956 /* ??? Could handle more ARRAY_REFs here, as a variant of INDIRECT_REF.
1957 We'd only want to bother decomposing an existing ARRAY_REF if
1958 the base array is found to have another offset contained within.
1959 Otherwise we'd be wasting time. */
1960 case ARRAY_REF:
1961 /* If we are not processing expressions found within an
1962 ADDR_EXPR, then we can fold constant array references. */
1963 if (!*inside_addr_expr_p)
1964 t = fold_read_from_constant_string (expr);
1965 else
1966 t = NULL;
1967 break;
1969 case ADDR_EXPR:
1970 *inside_addr_expr_p = true;
1971 t = walk_tree (&TREE_OPERAND (expr, 0), fold_stmt_r, data, NULL);
1972 *inside_addr_expr_p = false;
1973 if (t)
1974 return t;
1975 *walk_subtrees = 0;
1977 /* Set TREE_INVARIANT properly so that the value is properly
1978 considered constant, and so gets propagated as expected. */
1979 if (*changed_p)
1980 recompute_tree_invariant_for_addr_expr (expr);
1981 return NULL_TREE;
1983 case PLUS_EXPR:
1984 case MINUS_EXPR:
1985 t = walk_tree (&TREE_OPERAND (expr, 0), fold_stmt_r, data, NULL);
1986 if (t)
1987 return t;
1988 t = walk_tree (&TREE_OPERAND (expr, 1), fold_stmt_r, data, NULL);
1989 if (t)
1990 return t;
1991 *walk_subtrees = 0;
1993 t = maybe_fold_stmt_addition (expr);
1994 break;
1996 case COMPONENT_REF:
1997 t = walk_tree (&TREE_OPERAND (expr, 0), fold_stmt_r, data, NULL);
1998 if (t)
1999 return t;
2000 *walk_subtrees = 0;
2002 /* Make sure the FIELD_DECL is actually a field in the type on the lhs.
2003 We've already checked that the records are compatible, so we should
2004 come up with a set of compatible fields. */
2006 tree expr_record = TREE_TYPE (TREE_OPERAND (expr, 0));
2007 tree expr_field = TREE_OPERAND (expr, 1);
2009 if (DECL_FIELD_CONTEXT (expr_field) != TYPE_MAIN_VARIANT (expr_record))
2011 expr_field = find_compatible_field (expr_record, expr_field);
2012 TREE_OPERAND (expr, 1) = expr_field;
2015 break;
2017 case TARGET_MEM_REF:
2018 t = maybe_fold_tmr (expr);
2019 break;
2021 default:
2022 return NULL_TREE;
2025 if (t)
2027 *expr_p = t;
2028 *changed_p = true;
2031 return NULL_TREE;
2035 /* Return the string length, maximum string length or maximum value of
2036 ARG in LENGTH.
2037 If ARG is an SSA name variable, follow its use-def chains. If LENGTH
2038 is not NULL and, for TYPE == 0, its value is not equal to the length
2039 we determine or if we are unable to determine the length or value,
2040 return false. VISITED is a bitmap of visited variables.
2041 TYPE is 0 if string length should be returned, 1 for maximum string
2042 length and 2 for maximum value ARG can have. */
2044 static bool
2045 get_maxval_strlen (tree arg, tree *length, bitmap visited, int type)
2047 tree var, def_stmt, val;
2049 if (TREE_CODE (arg) != SSA_NAME)
2051 if (type == 2)
2053 val = arg;
2054 if (TREE_CODE (val) != INTEGER_CST
2055 || tree_int_cst_sgn (val) < 0)
2056 return false;
2058 else
2059 val = c_strlen (arg, 1);
2060 if (!val)
2061 return false;
2063 if (*length)
2065 if (type > 0)
2067 if (TREE_CODE (*length) != INTEGER_CST
2068 || TREE_CODE (val) != INTEGER_CST)
2069 return false;
2071 if (tree_int_cst_lt (*length, val))
2072 *length = val;
2073 return true;
2075 else if (simple_cst_equal (val, *length) != 1)
2076 return false;
2079 *length = val;
2080 return true;
2083 /* If we were already here, break the infinite cycle. */
2084 if (bitmap_bit_p (visited, SSA_NAME_VERSION (arg)))
2085 return true;
2086 bitmap_set_bit (visited, SSA_NAME_VERSION (arg));
2088 var = arg;
2089 def_stmt = SSA_NAME_DEF_STMT (var);
2091 switch (TREE_CODE (def_stmt))
2093 case MODIFY_EXPR:
2095 tree rhs;
2097 /* The RHS of the statement defining VAR must either have a
2098 constant length or come from another SSA_NAME with a constant
2099 length. */
2100 rhs = TREE_OPERAND (def_stmt, 1);
2101 STRIP_NOPS (rhs);
2102 return get_maxval_strlen (rhs, length, visited, type);
2105 case PHI_NODE:
2107 /* All the arguments of the PHI node must have the same constant
2108 length. */
2109 int i;
2111 for (i = 0; i < PHI_NUM_ARGS (def_stmt); i++)
2113 tree arg = PHI_ARG_DEF (def_stmt, i);
2115 /* If this PHI has itself as an argument, we cannot
2116 determine the string length of this argument. However,
2117 if we can find a constant string length for the other
2118 PHI args then we can still be sure that this is a
2119 constant string length. So be optimistic and just
2120 continue with the next argument. */
2121 if (arg == PHI_RESULT (def_stmt))
2122 continue;
2124 if (!get_maxval_strlen (arg, length, visited, type))
2125 return false;
2128 return true;
2131 default:
2132 break;
2136 return false;
2140 /* Fold builtin call FN in statement STMT. If it cannot be folded into a
2141 constant, return NULL_TREE. Otherwise, return its constant value. */
2143 static tree
2144 ccp_fold_builtin (tree stmt, tree fn)
2146 tree result, val[3];
2147 tree callee, arglist, a;
2148 int arg_mask, i, type;
2149 bitmap visited;
2150 bool ignore;
2152 ignore = TREE_CODE (stmt) != MODIFY_EXPR;
2154 /* First try the generic builtin folder. If that succeeds, return the
2155 result directly. */
2156 callee = get_callee_fndecl (fn);
2157 arglist = TREE_OPERAND (fn, 1);
2158 result = fold_builtin (callee, arglist, ignore);
2159 if (result)
2161 if (ignore)
2162 STRIP_NOPS (result);
2163 return result;
2166 /* Ignore MD builtins. */
2167 if (DECL_BUILT_IN_CLASS (callee) == BUILT_IN_MD)
2168 return NULL_TREE;
2170 /* If the builtin could not be folded, and it has no argument list,
2171 we're done. */
2172 if (!arglist)
2173 return NULL_TREE;
2175 /* Limit the work only for builtins we know how to simplify. */
2176 switch (DECL_FUNCTION_CODE (callee))
2178 case BUILT_IN_STRLEN:
2179 case BUILT_IN_FPUTS:
2180 case BUILT_IN_FPUTS_UNLOCKED:
2181 arg_mask = 1;
2182 type = 0;
2183 break;
2184 case BUILT_IN_STRCPY:
2185 case BUILT_IN_STRNCPY:
2186 arg_mask = 2;
2187 type = 0;
2188 break;
2189 case BUILT_IN_MEMCPY_CHK:
2190 case BUILT_IN_MEMPCPY_CHK:
2191 case BUILT_IN_MEMMOVE_CHK:
2192 case BUILT_IN_MEMSET_CHK:
2193 case BUILT_IN_STRNCPY_CHK:
2194 arg_mask = 4;
2195 type = 2;
2196 break;
2197 case BUILT_IN_STRCPY_CHK:
2198 case BUILT_IN_STPCPY_CHK:
2199 arg_mask = 2;
2200 type = 1;
2201 break;
2202 case BUILT_IN_SNPRINTF_CHK:
2203 case BUILT_IN_VSNPRINTF_CHK:
2204 arg_mask = 2;
2205 type = 2;
2206 break;
2207 default:
2208 return NULL_TREE;
2211 /* Try to use the dataflow information gathered by the CCP process. */
2212 visited = BITMAP_ALLOC (NULL);
2214 memset (val, 0, sizeof (val));
2215 for (i = 0, a = arglist;
2216 arg_mask;
2217 i++, arg_mask >>= 1, a = TREE_CHAIN (a))
2218 if (arg_mask & 1)
2220 bitmap_clear (visited);
2221 if (!get_maxval_strlen (TREE_VALUE (a), &val[i], visited, type))
2222 val[i] = NULL_TREE;
2225 BITMAP_FREE (visited);
2227 result = NULL_TREE;
2228 switch (DECL_FUNCTION_CODE (callee))
2230 case BUILT_IN_STRLEN:
2231 if (val[0])
2233 tree new = fold_convert (TREE_TYPE (fn), val[0]);
2235 /* If the result is not a valid gimple value, or not a cast
2236 of a valid gimple value, then we can not use the result. */
2237 if (is_gimple_val (new)
2238 || (is_gimple_cast (new)
2239 && is_gimple_val (TREE_OPERAND (new, 0))))
2240 return new;
2242 break;
2244 case BUILT_IN_STRCPY:
2245 if (val[1] && is_gimple_val (val[1]))
2246 result = fold_builtin_strcpy (callee, arglist, val[1]);
2247 break;
2249 case BUILT_IN_STRNCPY:
2250 if (val[1] && is_gimple_val (val[1]))
2251 result = fold_builtin_strncpy (callee, arglist, val[1]);
2252 break;
2254 case BUILT_IN_FPUTS:
2255 result = fold_builtin_fputs (arglist,
2256 TREE_CODE (stmt) != MODIFY_EXPR, 0,
2257 val[0]);
2258 break;
2260 case BUILT_IN_FPUTS_UNLOCKED:
2261 result = fold_builtin_fputs (arglist,
2262 TREE_CODE (stmt) != MODIFY_EXPR, 1,
2263 val[0]);
2264 break;
2266 case BUILT_IN_MEMCPY_CHK:
2267 case BUILT_IN_MEMPCPY_CHK:
2268 case BUILT_IN_MEMMOVE_CHK:
2269 case BUILT_IN_MEMSET_CHK:
2270 if (val[2] && is_gimple_val (val[2]))
2271 result = fold_builtin_memory_chk (callee, arglist, val[2], ignore,
2272 DECL_FUNCTION_CODE (callee));
2273 break;
2275 case BUILT_IN_STRCPY_CHK:
2276 case BUILT_IN_STPCPY_CHK:
2277 if (val[1] && is_gimple_val (val[1]))
2278 result = fold_builtin_stxcpy_chk (callee, arglist, val[1], ignore,
2279 DECL_FUNCTION_CODE (callee));
2280 break;
2282 case BUILT_IN_STRNCPY_CHK:
2283 if (val[2] && is_gimple_val (val[2]))
2284 result = fold_builtin_strncpy_chk (arglist, val[2]);
2285 break;
2287 case BUILT_IN_SNPRINTF_CHK:
2288 case BUILT_IN_VSNPRINTF_CHK:
2289 if (val[1] && is_gimple_val (val[1]))
2290 result = fold_builtin_snprintf_chk (arglist, val[1],
2291 DECL_FUNCTION_CODE (callee));
2292 break;
2294 default:
2295 gcc_unreachable ();
2298 if (result && ignore)
2299 result = fold_ignored_result (result);
2300 return result;
2304 /* Fold the statement pointed to by STMT_P. In some cases, this function may
2305 replace the whole statement with a new one. Returns true iff folding
2306 makes any changes. */
2308 bool
2309 fold_stmt (tree *stmt_p)
2311 tree rhs, result, stmt;
2312 struct fold_stmt_r_data fold_stmt_r_data;
2313 bool changed = false;
2314 bool inside_addr_expr = false;
2316 fold_stmt_r_data.changed_p = &changed;
2317 fold_stmt_r_data.inside_addr_expr_p = &inside_addr_expr;
2319 stmt = *stmt_p;
2321 /* If we replaced constants and the statement makes pointer dereferences,
2322 then we may need to fold instances of *&VAR into VAR, etc. */
2323 if (walk_tree (stmt_p, fold_stmt_r, &fold_stmt_r_data, NULL))
2325 *stmt_p
2326 = build_function_call_expr (implicit_built_in_decls[BUILT_IN_TRAP],
2327 NULL);
2328 return true;
2331 rhs = get_rhs (stmt);
2332 if (!rhs)
2333 return changed;
2334 result = NULL_TREE;
2336 if (TREE_CODE (rhs) == CALL_EXPR)
2338 tree callee;
2340 /* Check for builtins that CCP can handle using information not
2341 available in the generic fold routines. */
2342 callee = get_callee_fndecl (rhs);
2343 if (callee && DECL_BUILT_IN (callee))
2344 result = ccp_fold_builtin (stmt, rhs);
2345 else
2347 /* Check for resolvable OBJ_TYPE_REF. The only sorts we can resolve
2348 here are when we've propagated the address of a decl into the
2349 object slot. */
2350 /* ??? Should perhaps do this in fold proper. However, doing it
2351 there requires that we create a new CALL_EXPR, and that requires
2352 copying EH region info to the new node. Easier to just do it
2353 here where we can just smash the call operand. */
2354 callee = TREE_OPERAND (rhs, 0);
2355 if (TREE_CODE (callee) == OBJ_TYPE_REF
2356 && lang_hooks.fold_obj_type_ref
2357 && TREE_CODE (OBJ_TYPE_REF_OBJECT (callee)) == ADDR_EXPR
2358 && DECL_P (TREE_OPERAND
2359 (OBJ_TYPE_REF_OBJECT (callee), 0)))
2361 tree t;
2363 /* ??? Caution: Broken ADDR_EXPR semantics means that
2364 looking at the type of the operand of the addr_expr
2365 can yield an array type. See silly exception in
2366 check_pointer_types_r. */
2368 t = TREE_TYPE (TREE_TYPE (OBJ_TYPE_REF_OBJECT (callee)));
2369 t = lang_hooks.fold_obj_type_ref (callee, t);
2370 if (t)
2372 TREE_OPERAND (rhs, 0) = t;
2373 changed = true;
2379 /* If we couldn't fold the RHS, hand over to the generic fold routines. */
2380 if (result == NULL_TREE)
2381 result = fold (rhs);
2383 /* Strip away useless type conversions. Both the NON_LVALUE_EXPR that
2384 may have been added by fold, and "useless" type conversions that might
2385 now be apparent due to propagation. */
2386 STRIP_USELESS_TYPE_CONVERSION (result);
2388 if (result != rhs)
2389 changed |= set_rhs (stmt_p, result);
2391 return changed;
2394 /* Perform the minimal folding on statement STMT. Only operations like
2395 *&x created by constant propagation are handled. The statement cannot
2396 be replaced with a new one. */
2398 bool
2399 fold_stmt_inplace (tree stmt)
2401 tree old_stmt = stmt, rhs, new_rhs;
2402 struct fold_stmt_r_data fold_stmt_r_data;
2403 bool changed = false;
2404 bool inside_addr_expr = false;
2406 fold_stmt_r_data.changed_p = &changed;
2407 fold_stmt_r_data.inside_addr_expr_p = &inside_addr_expr;
2409 walk_tree (&stmt, fold_stmt_r, &fold_stmt_r_data, NULL);
2410 gcc_assert (stmt == old_stmt);
2412 rhs = get_rhs (stmt);
2413 if (!rhs || rhs == stmt)
2414 return changed;
2416 new_rhs = fold (rhs);
2417 STRIP_USELESS_TYPE_CONVERSION (new_rhs);
2418 if (new_rhs == rhs)
2419 return changed;
2421 changed |= set_rhs (&stmt, new_rhs);
2422 gcc_assert (stmt == old_stmt);
2424 return changed;
2427 /* Convert EXPR into a GIMPLE value suitable for substitution on the
2428 RHS of an assignment. Insert the necessary statements before
2429 iterator *SI_P. */
2431 static tree
2432 convert_to_gimple_builtin (block_stmt_iterator *si_p, tree expr)
2434 tree_stmt_iterator ti;
2435 tree stmt = bsi_stmt (*si_p);
2436 tree tmp, stmts = NULL;
2438 push_gimplify_context ();
2439 tmp = get_initialized_tmp_var (expr, &stmts, NULL);
2440 pop_gimplify_context (NULL);
2442 if (EXPR_HAS_LOCATION (stmt))
2443 annotate_all_with_locus (&stmts, EXPR_LOCATION (stmt));
2445 /* The replacement can expose previously unreferenced variables. */
2446 for (ti = tsi_start (stmts); !tsi_end_p (ti); tsi_next (&ti))
2448 tree new_stmt = tsi_stmt (ti);
2449 find_new_referenced_vars (tsi_stmt_ptr (ti));
2450 bsi_insert_before (si_p, new_stmt, BSI_NEW_STMT);
2451 mark_new_vars_to_rename (bsi_stmt (*si_p));
2452 bsi_next (si_p);
2455 return tmp;
2459 /* A simple pass that attempts to fold all builtin functions. This pass
2460 is run after we've propagated as many constants as we can. */
2462 static void
2463 execute_fold_all_builtins (void)
2465 bool cfg_changed = false;
2466 basic_block bb;
2467 FOR_EACH_BB (bb)
2469 block_stmt_iterator i;
2470 for (i = bsi_start (bb); !bsi_end_p (i); )
2472 tree *stmtp = bsi_stmt_ptr (i);
2473 tree old_stmt = *stmtp;
2474 tree call = get_rhs (*stmtp);
2475 tree callee, result;
2476 enum built_in_function fcode;
2478 if (!call || TREE_CODE (call) != CALL_EXPR)
2480 bsi_next (&i);
2481 continue;
2483 callee = get_callee_fndecl (call);
2484 if (!callee || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL)
2486 bsi_next (&i);
2487 continue;
2489 fcode = DECL_FUNCTION_CODE (callee);
2491 result = ccp_fold_builtin (*stmtp, call);
2492 if (!result)
2493 switch (DECL_FUNCTION_CODE (callee))
2495 case BUILT_IN_CONSTANT_P:
2496 /* Resolve __builtin_constant_p. If it hasn't been
2497 folded to integer_one_node by now, it's fairly
2498 certain that the value simply isn't constant. */
2499 result = integer_zero_node;
2500 break;
2502 default:
2503 bsi_next (&i);
2504 continue;
2507 if (dump_file && (dump_flags & TDF_DETAILS))
2509 fprintf (dump_file, "Simplified\n ");
2510 print_generic_stmt (dump_file, *stmtp, dump_flags);
2513 if (!set_rhs (stmtp, result))
2515 result = convert_to_gimple_builtin (&i, result);
2516 if (result)
2518 bool ok = set_rhs (stmtp, result);
2520 gcc_assert (ok);
2523 mark_new_vars_to_rename (*stmtp);
2524 if (maybe_clean_or_replace_eh_stmt (old_stmt, *stmtp)
2525 && tree_purge_dead_eh_edges (bb))
2526 cfg_changed = true;
2528 if (dump_file && (dump_flags & TDF_DETAILS))
2530 fprintf (dump_file, "to\n ");
2531 print_generic_stmt (dump_file, *stmtp, dump_flags);
2532 fprintf (dump_file, "\n");
2535 /* Retry the same statement if it changed into another
2536 builtin, there might be new opportunities now. */
2537 call = get_rhs (*stmtp);
2538 if (!call || TREE_CODE (call) != CALL_EXPR)
2540 bsi_next (&i);
2541 continue;
2543 callee = get_callee_fndecl (call);
2544 if (!callee
2545 || DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL
2546 || DECL_FUNCTION_CODE (callee) == fcode)
2547 bsi_next (&i);
2551 /* Delete unreachable blocks. */
2552 if (cfg_changed)
2553 cleanup_tree_cfg ();
2557 struct tree_opt_pass pass_fold_builtins =
2559 "fab", /* name */
2560 NULL, /* gate */
2561 execute_fold_all_builtins, /* execute */
2562 NULL, /* sub */
2563 NULL, /* next */
2564 0, /* static_pass_number */
2565 0, /* tv_id */
2566 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
2567 0, /* properties_provided */
2568 0, /* properties_destroyed */
2569 0, /* todo_flags_start */
2570 TODO_dump_func
2571 | TODO_verify_ssa
2572 | TODO_update_ssa, /* todo_flags_finish */
2573 0 /* letter */