gcc/tree-ssa-sccvn.c
1 /* SCC value numbering for trees
2 Copyright (C) 2006-2019 Free Software Foundation, Inc.
3 Contributed by Daniel Berlin <dan@dberlin.org>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "backend.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "ssa.h"
29 #include "expmed.h"
30 #include "insn-config.h"
31 #include "memmodel.h"
32 #include "emit-rtl.h"
33 #include "cgraph.h"
34 #include "gimple-pretty-print.h"
35 #include "alias.h"
36 #include "fold-const.h"
37 #include "stor-layout.h"
38 #include "cfganal.h"
39 #include "tree-inline.h"
40 #include "internal-fn.h"
41 #include "gimple-fold.h"
42 #include "tree-eh.h"
43 #include "gimplify.h"
44 #include "flags.h"
45 #include "dojump.h"
46 #include "explow.h"
47 #include "calls.h"
48 #include "varasm.h"
49 #include "stmt.h"
50 #include "expr.h"
51 #include "tree-dfa.h"
52 #include "tree-ssa.h"
53 #include "dumpfile.h"
54 #include "cfgloop.h"
55 #include "params.h"
56 #include "tree-ssa-propagate.h"
57 #include "tree-cfg.h"
58 #include "domwalk.h"
59 #include "gimple-iterator.h"
60 #include "gimple-match.h"
61 #include "stringpool.h"
62 #include "attribs.h"
63 #include "tree-pass.h"
64 #include "statistics.h"
65 #include "langhooks.h"
66 #include "ipa-utils.h"
67 #include "dbgcnt.h"
68 #include "tree-cfgcleanup.h"
69 #include "tree-ssa-loop.h"
70 #include "tree-scalar-evolution.h"
71 #include "tree-ssa-loop-niter.h"
72 #include "tree-ssa-sccvn.h"
74 /* This algorithm is based on the SCC algorithm presented by Keith
75 Cooper and L. Taylor Simpson in "SCC-Based Value numbering"
76 (http://citeseer.ist.psu.edu/41805.html). In
77 straight line code, it is equivalent to a regular hash based value
78 numbering that is performed in reverse postorder.
80 For code with cycles, there are two alternatives, both of which
81 require keeping the hashtables separate from the actual list of
82 value numbers for SSA names.
84 1. Iterate value numbering in an RPO walk of the blocks, removing
85 all the entries from the hashtable after each iteration (but
86 keeping the SSA name->value number mapping between iterations).
87 Iterate until it does not change.
89 2. Perform value numbering as part of an SCC walk on the SSA graph,
90 iterating only the cycles in the SSA graph until they do not change
91 (using a separate, optimistic hashtable for value numbering the SCC
92 operands).
94 The second is not just faster in practice (because most SSA graph
95 cycles do not involve all the variables in the graph), it also has
96 some nice properties.
98 One of these nice properties is that when we pop an SCC off the
99 stack, we are guaranteed to have processed all the operands coming from
100 *outside of that SCC*, so we do not need to do anything special to
101 ensure they have value numbers.
103 Another nice property is that the SCC walk is done as part of a DFS
104 of the SSA graph, which makes it easy to perform combining and
105 simplifying operations at the same time.
107 The code below is deliberately written in a way that makes it easy
108 to separate the SCC walk from the other work it does.
110 In order to propagate constants through the code, we track which
111 expressions contain constants, and use those while folding. In
112 theory, we could also track expressions whose value numbers are
113 replaced, in case we end up folding based on expression
114 identities.
116 In order to value number memory, we assign value numbers to vuses.
117 This enables us to note that, for example, stores to the same
118 address of the same value from the same starting memory states are
119 equivalent.
120 TODO:
122 1. We can iterate only the changing portions of the SCC's, but
123 I have not seen an SCC big enough for this to be a win.
124 2. If you differentiate between phi nodes for loops and phi nodes
125 for if-then-else, you can properly consider phi nodes in different
126 blocks for equivalence.
127 3. We could value number vuses in more cases, particularly, whole
128 structure copies.
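/* As a small illustration (the SSA names below are hypothetical), in the
   straight-line sequence

     a_1 = x_2 + 1;
     b_3 = x_2 + 1;
     c_4 = a_1 == b_3;

   both right-hand sides hash and compare equal, so a_1 and b_3 receive the
   same value number and c_4 can be value-numbered to true.  For names whose
   definitions form a cycle, e.g. the pair

     # i_1 = PHI <0(entry), i_2(latch)>
     i_2 = i_1 + 1;

   the value numbers are found by iterating over the cycle with the
   optimistic hashtable until they no longer change, as described above.  */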
131 /* There's no BB_EXECUTABLE but we can use BB_VISITED. */
132 #define BB_EXECUTABLE BB_VISITED
134 static tree *last_vuse_ptr;
135 static vn_lookup_kind vn_walk_kind;
136 static vn_lookup_kind default_vn_walk_kind;
138 /* vn_nary_op hashtable helpers. */
140 struct vn_nary_op_hasher : nofree_ptr_hash <vn_nary_op_s>
142 typedef vn_nary_op_s *compare_type;
143 static inline hashval_t hash (const vn_nary_op_s *);
144 static inline bool equal (const vn_nary_op_s *, const vn_nary_op_s *);
147 /* Return the computed hashcode for nary operation P1. */
149 inline hashval_t
150 vn_nary_op_hasher::hash (const vn_nary_op_s *vno1)
152 return vno1->hashcode;
155 /* Compare nary operations P1 and P2 and return true if they are
156 equivalent. */
158 inline bool
159 vn_nary_op_hasher::equal (const vn_nary_op_s *vno1, const vn_nary_op_s *vno2)
161 return vno1 == vno2 || vn_nary_op_eq (vno1, vno2);
164 typedef hash_table<vn_nary_op_hasher> vn_nary_op_table_type;
165 typedef vn_nary_op_table_type::iterator vn_nary_op_iterator_type;
168 /* vn_phi hashtable helpers. */
170 static int
171 vn_phi_eq (const_vn_phi_t const vp1, const_vn_phi_t const vp2);
173 struct vn_phi_hasher : nofree_ptr_hash <vn_phi_s>
175 static inline hashval_t hash (const vn_phi_s *);
176 static inline bool equal (const vn_phi_s *, const vn_phi_s *);
179 /* Return the computed hashcode for phi operation P1. */
181 inline hashval_t
182 vn_phi_hasher::hash (const vn_phi_s *vp1)
184 return vp1->hashcode;
187 /* Compare two phi entries for equality, ignoring VN_TOP arguments. */
189 inline bool
190 vn_phi_hasher::equal (const vn_phi_s *vp1, const vn_phi_s *vp2)
192 return vp1 == vp2 || vn_phi_eq (vp1, vp2);
195 typedef hash_table<vn_phi_hasher> vn_phi_table_type;
196 typedef vn_phi_table_type::iterator vn_phi_iterator_type;
199 /* Compare two reference operands P1 and P2 for equality. Return true if
200 they are equal, and false otherwise. */
202 static int
203 vn_reference_op_eq (const void *p1, const void *p2)
205 const_vn_reference_op_t const vro1 = (const_vn_reference_op_t) p1;
206 const_vn_reference_op_t const vro2 = (const_vn_reference_op_t) p2;
208 return (vro1->opcode == vro2->opcode
209 /* We do not care for differences in type qualification. */
210 && (vro1->type == vro2->type
211 || (vro1->type && vro2->type
212 && types_compatible_p (TYPE_MAIN_VARIANT (vro1->type),
213 TYPE_MAIN_VARIANT (vro2->type))))
214 && expressions_equal_p (vro1->op0, vro2->op0)
215 && expressions_equal_p (vro1->op1, vro2->op1)
216 && expressions_equal_p (vro1->op2, vro2->op2));
219 /* Free a reference operation structure VP. */
221 static inline void
222 free_reference (vn_reference_s *vr)
224 vr->operands.release ();
228 /* vn_reference hashtable helpers. */
230 struct vn_reference_hasher : nofree_ptr_hash <vn_reference_s>
232 static inline hashval_t hash (const vn_reference_s *);
233 static inline bool equal (const vn_reference_s *, const vn_reference_s *);
236 /* Return the hashcode for a given reference operation P1. */
238 inline hashval_t
239 vn_reference_hasher::hash (const vn_reference_s *vr1)
241 return vr1->hashcode;
244 inline bool
245 vn_reference_hasher::equal (const vn_reference_s *v, const vn_reference_s *c)
247 return v == c || vn_reference_eq (v, c);
250 typedef hash_table<vn_reference_hasher> vn_reference_table_type;
251 typedef vn_reference_table_type::iterator vn_reference_iterator_type;
254 /* The set of VN hashtables. */
256 typedef struct vn_tables_s
258 vn_nary_op_table_type *nary;
259 vn_phi_table_type *phis;
260 vn_reference_table_type *references;
261 } *vn_tables_t;
264 /* vn_constant hashtable helpers. */
266 struct vn_constant_hasher : free_ptr_hash <vn_constant_s>
268 static inline hashval_t hash (const vn_constant_s *);
269 static inline bool equal (const vn_constant_s *, const vn_constant_s *);
272 /* Hash table hash function for vn_constant_t. */
274 inline hashval_t
275 vn_constant_hasher::hash (const vn_constant_s *vc1)
277 return vc1->hashcode;
280 /* Hash table equality function for vn_constant_t. */
282 inline bool
283 vn_constant_hasher::equal (const vn_constant_s *vc1, const vn_constant_s *vc2)
285 if (vc1->hashcode != vc2->hashcode)
286 return false;
288 return vn_constant_eq_with_type (vc1->constant, vc2->constant);
291 static hash_table<vn_constant_hasher> *constant_to_value_id;
292 static bitmap constant_value_ids;
295 /* Obstack we allocate the vn-tables elements from. */
296 static obstack vn_tables_obstack;
297 /* Special obstack we never unwind. */
298 static obstack vn_tables_insert_obstack;
300 static vn_reference_t last_inserted_ref;
301 static vn_phi_t last_inserted_phi;
302 static vn_nary_op_t last_inserted_nary;
304 /* Valid hashtables storing information we have proven to be
305 correct. */
306 static vn_tables_t valid_info;
309 /* Valueization hook. Valueize NAME if it is an SSA name, otherwise
310 just return it. */
311 tree (*vn_valueize) (tree);
314 /* This represents the top of the VN lattice, which is the universal
315 value. */
317 tree VN_TOP;
319 /* Unique counter for our value ids. */
321 static unsigned int next_value_id;
324 /* Table of vn_ssa_aux_t's, one per ssa_name. The vn_ssa_aux_t objects
325 are allocated on an obstack for locality reasons, and to free them
326 without looping over the vec. */
328 struct vn_ssa_aux_hasher : typed_noop_remove <vn_ssa_aux_t>
330 typedef vn_ssa_aux_t value_type;
331 typedef tree compare_type;
332 static inline hashval_t hash (const value_type &);
333 static inline bool equal (const value_type &, const compare_type &);
334 static inline void mark_deleted (value_type &) {}
335 static inline void mark_empty (value_type &e) { e = NULL; }
336 static inline bool is_deleted (value_type &) { return false; }
337 static inline bool is_empty (value_type &e) { return e == NULL; }
340 hashval_t
341 vn_ssa_aux_hasher::hash (const value_type &entry)
343 return SSA_NAME_VERSION (entry->name);
346 bool
347 vn_ssa_aux_hasher::equal (const value_type &entry, const compare_type &name)
349 return name == entry->name;
352 static hash_table<vn_ssa_aux_hasher> *vn_ssa_aux_hash;
353 typedef hash_table<vn_ssa_aux_hasher>::iterator vn_ssa_aux_iterator_type;
354 static struct obstack vn_ssa_aux_obstack;
356 static vn_nary_op_t vn_nary_op_insert_stmt (gimple *, tree);
357 static unsigned int vn_nary_length_from_stmt (gimple *);
358 static vn_nary_op_t alloc_vn_nary_op_noinit (unsigned int, obstack *);
359 static vn_nary_op_t vn_nary_op_insert_into (vn_nary_op_t,
360 vn_nary_op_table_type *, bool);
361 static void init_vn_nary_op_from_stmt (vn_nary_op_t, gimple *);
362 static void init_vn_nary_op_from_pieces (vn_nary_op_t, unsigned int,
363 enum tree_code, tree, tree *);
364 static tree vn_lookup_simplify_result (gimple_match_op *);
366 /* Return whether there is value numbering information for a given SSA name. */
368 bool
369 has_VN_INFO (tree name)
371 return vn_ssa_aux_hash->find_with_hash (name, SSA_NAME_VERSION (name));
374 vn_ssa_aux_t
375 VN_INFO (tree name)
377 vn_ssa_aux_t *res
378 = vn_ssa_aux_hash->find_slot_with_hash (name, SSA_NAME_VERSION (name),
379 INSERT);
380 if (*res != NULL)
381 return *res;
383 vn_ssa_aux_t newinfo = *res = XOBNEW (&vn_ssa_aux_obstack, struct vn_ssa_aux);
384 memset (newinfo, 0, sizeof (struct vn_ssa_aux));
385 newinfo->name = name;
386 newinfo->valnum = VN_TOP;
387 /* We are using the visited flag to handle uses with defs not within the
388 region being value-numbered. */
389 newinfo->visited = false;
 391 /* Given we create the VN_INFOs on-demand now, default definitions have
 392 to be initialized to something other than VN_TOP here. */
393 if (SSA_NAME_IS_DEFAULT_DEF (name))
394 switch (TREE_CODE (SSA_NAME_VAR (name)))
396 case VAR_DECL:
397 /* All undefined vars are VARYING. */
398 newinfo->valnum = name;
399 newinfo->visited = true;
400 break;
402 case PARM_DECL:
403 /* Parameters are VARYING but we can record a condition
404 if we know it is a non-NULL pointer. */
405 newinfo->visited = true;
406 newinfo->valnum = name;
407 if (POINTER_TYPE_P (TREE_TYPE (name))
408 && nonnull_arg_p (SSA_NAME_VAR (name)))
410 tree ops[2];
411 ops[0] = name;
412 ops[1] = build_int_cst (TREE_TYPE (name), 0);
413 vn_nary_op_t nary;
414 /* Allocate from non-unwinding stack. */
415 nary = alloc_vn_nary_op_noinit (2, &vn_tables_insert_obstack);
416 init_vn_nary_op_from_pieces (nary, 2, NE_EXPR,
417 boolean_type_node, ops);
418 nary->predicated_values = 0;
419 nary->u.result = boolean_true_node;
420 vn_nary_op_insert_into (nary, valid_info->nary, true);
421 gcc_assert (nary->unwind_to == NULL);
422 /* Also do not link it into the undo chain. */
423 last_inserted_nary = nary->next;
424 nary->next = (vn_nary_op_t)(void *)-1;
425 nary = alloc_vn_nary_op_noinit (2, &vn_tables_insert_obstack);
426 init_vn_nary_op_from_pieces (nary, 2, EQ_EXPR,
427 boolean_type_node, ops);
428 nary->predicated_values = 0;
429 nary->u.result = boolean_false_node;
430 vn_nary_op_insert_into (nary, valid_info->nary, true);
431 gcc_assert (nary->unwind_to == NULL);
432 last_inserted_nary = nary->next;
433 nary->next = (vn_nary_op_t)(void *)-1;
434 if (dump_file && (dump_flags & TDF_DETAILS))
436 fprintf (dump_file, "Recording ");
437 print_generic_expr (dump_file, name, TDF_SLIM);
438 fprintf (dump_file, " != 0\n");
441 break;
443 case RESULT_DECL:
444 /* If the result is passed by invisible reference the default
445 def is initialized, otherwise it's uninitialized. Still
446 undefined is varying. */
447 newinfo->visited = true;
448 newinfo->valnum = name;
449 break;
451 default:
452 gcc_unreachable ();
454 return newinfo;
457 /* Return the SSA value of X. */
459 inline tree
460 SSA_VAL (tree x, bool *visited = NULL)
462 vn_ssa_aux_t tem = vn_ssa_aux_hash->find_with_hash (x, SSA_NAME_VERSION (x));
463 if (visited)
464 *visited = tem && tem->visited;
465 return tem && tem->visited ? tem->valnum : x;
468 /* Return the SSA value of the VUSE x, supporting released VDEFs
469 during elimination which will value-number the VDEF to the
470 associated VUSE (but not substitute in the whole lattice). */
472 static inline tree
473 vuse_ssa_val (tree x)
475 if (!x)
476 return NULL_TREE;
480 x = SSA_VAL (x);
481 gcc_assert (x != VN_TOP);
483 while (SSA_NAME_IN_FREE_LIST (x));
485 return x;
488 /* Similar to the above but used as callback for walk_non_aliases_vuses
489 and thus should stop at unvisited VUSE to not walk across region
490 boundaries. */
492 static tree
493 vuse_valueize (tree vuse)
497 bool visited;
498 vuse = SSA_VAL (vuse, &visited);
499 if (!visited)
500 return NULL_TREE;
501 gcc_assert (vuse != VN_TOP);
503 while (SSA_NAME_IN_FREE_LIST (vuse));
504 return vuse;
508 /* Return the vn_kind the expression computed by the stmt should be
509 associated with. */
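/* For instance (with hypothetical SSA names), an assignment like
   x_1 = y_2 + z_3 yields VN_NARY, x_1 = a.b yields VN_REFERENCE, a call
   yields VN_REFERENCE, and a PHI node yields VN_PHI.  */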
511 enum vn_kind
512 vn_get_stmt_kind (gimple *stmt)
514 switch (gimple_code (stmt))
516 case GIMPLE_CALL:
517 return VN_REFERENCE;
518 case GIMPLE_PHI:
519 return VN_PHI;
520 case GIMPLE_ASSIGN:
522 enum tree_code code = gimple_assign_rhs_code (stmt);
523 tree rhs1 = gimple_assign_rhs1 (stmt);
524 switch (get_gimple_rhs_class (code))
526 case GIMPLE_UNARY_RHS:
527 case GIMPLE_BINARY_RHS:
528 case GIMPLE_TERNARY_RHS:
529 return VN_NARY;
530 case GIMPLE_SINGLE_RHS:
531 switch (TREE_CODE_CLASS (code))
533 case tcc_reference:
534 /* VOP-less references can go through unary case. */
535 if ((code == REALPART_EXPR
536 || code == IMAGPART_EXPR
537 || code == VIEW_CONVERT_EXPR
538 || code == BIT_FIELD_REF)
539 && TREE_CODE (TREE_OPERAND (rhs1, 0)) == SSA_NAME)
540 return VN_NARY;
542 /* Fallthrough. */
543 case tcc_declaration:
544 return VN_REFERENCE;
546 case tcc_constant:
547 return VN_CONSTANT;
549 default:
550 if (code == ADDR_EXPR)
551 return (is_gimple_min_invariant (rhs1)
552 ? VN_CONSTANT : VN_REFERENCE);
553 else if (code == CONSTRUCTOR)
554 return VN_NARY;
555 return VN_NONE;
557 default:
558 return VN_NONE;
561 default:
562 return VN_NONE;
566 /* Lookup a value id for CONSTANT and return it. If it does not
567 exist returns 0. */
569 unsigned int
570 get_constant_value_id (tree constant)
572 vn_constant_s **slot;
573 struct vn_constant_s vc;
575 vc.hashcode = vn_hash_constant_with_type (constant);
576 vc.constant = constant;
577 slot = constant_to_value_id->find_slot (&vc, NO_INSERT);
578 if (slot)
579 return (*slot)->value_id;
580 return 0;
583 /* Lookup a value id for CONSTANT, and if it does not exist, create a
584 new one and return it. If it does exist, return it. */
586 unsigned int
587 get_or_alloc_constant_value_id (tree constant)
589 vn_constant_s **slot;
590 struct vn_constant_s vc;
591 vn_constant_t vcp;
593 /* If the hashtable isn't initialized we're not running from PRE and thus
594 do not need value-ids. */
595 if (!constant_to_value_id)
596 return 0;
598 vc.hashcode = vn_hash_constant_with_type (constant);
599 vc.constant = constant;
600 slot = constant_to_value_id->find_slot (&vc, INSERT);
601 if (*slot)
602 return (*slot)->value_id;
604 vcp = XNEW (struct vn_constant_s);
605 vcp->hashcode = vc.hashcode;
606 vcp->constant = constant;
607 vcp->value_id = get_next_value_id ();
608 *slot = vcp;
609 bitmap_set_bit (constant_value_ids, vcp->value_id);
610 return vcp->value_id;
613 /* Return true if V is a value id for a constant. */
615 bool
616 value_id_constant_p (unsigned int v)
618 return bitmap_bit_p (constant_value_ids, v);
621 /* Compute the hash for a reference operand VRO1. */
623 static void
624 vn_reference_op_compute_hash (const vn_reference_op_t vro1, inchash::hash &hstate)
626 hstate.add_int (vro1->opcode);
627 if (vro1->op0)
628 inchash::add_expr (vro1->op0, hstate);
629 if (vro1->op1)
630 inchash::add_expr (vro1->op1, hstate);
631 if (vro1->op2)
632 inchash::add_expr (vro1->op2, hstate);
635 /* Compute a hash for the reference operation VR1 and return it. */
637 static hashval_t
638 vn_reference_compute_hash (const vn_reference_t vr1)
640 inchash::hash hstate;
641 hashval_t result;
642 int i;
643 vn_reference_op_t vro;
644 poly_int64 off = -1;
645 bool deref = false;
647 FOR_EACH_VEC_ELT (vr1->operands, i, vro)
649 if (vro->opcode == MEM_REF)
650 deref = true;
651 else if (vro->opcode != ADDR_EXPR)
652 deref = false;
653 if (maybe_ne (vro->off, -1))
655 if (known_eq (off, -1))
656 off = 0;
657 off += vro->off;
659 else
661 if (maybe_ne (off, -1)
662 && maybe_ne (off, 0))
663 hstate.add_poly_int (off);
664 off = -1;
665 if (deref
666 && vro->opcode == ADDR_EXPR)
668 if (vro->op0)
670 tree op = TREE_OPERAND (vro->op0, 0);
671 hstate.add_int (TREE_CODE (op));
672 inchash::add_expr (op, hstate);
675 else
676 vn_reference_op_compute_hash (vro, hstate);
679 result = hstate.end ();
680 /* ??? We would ICE later if we hash instead of adding that in. */
681 if (vr1->vuse)
682 result += SSA_NAME_VERSION (vr1->vuse);
684 return result;
687 /* Return true if reference operations VR1 and VR2 are equivalent. This
688 means they have the same set of operands and vuses. */
690 bool
691 vn_reference_eq (const_vn_reference_t const vr1, const_vn_reference_t const vr2)
693 unsigned i, j;
695 /* Early out if this is not a hash collision. */
696 if (vr1->hashcode != vr2->hashcode)
697 return false;
699 /* The VOP needs to be the same. */
700 if (vr1->vuse != vr2->vuse)
701 return false;
703 /* If the operands are the same we are done. */
704 if (vr1->operands == vr2->operands)
705 return true;
707 if (!expressions_equal_p (TYPE_SIZE (vr1->type), TYPE_SIZE (vr2->type)))
708 return false;
710 if (INTEGRAL_TYPE_P (vr1->type)
711 && INTEGRAL_TYPE_P (vr2->type))
713 if (TYPE_PRECISION (vr1->type) != TYPE_PRECISION (vr2->type))
714 return false;
716 else if (INTEGRAL_TYPE_P (vr1->type)
717 && (TYPE_PRECISION (vr1->type)
718 != TREE_INT_CST_LOW (TYPE_SIZE (vr1->type))))
719 return false;
720 else if (INTEGRAL_TYPE_P (vr2->type)
721 && (TYPE_PRECISION (vr2->type)
722 != TREE_INT_CST_LOW (TYPE_SIZE (vr2->type))))
723 return false;
725 i = 0;
726 j = 0;
729 poly_int64 off1 = 0, off2 = 0;
730 vn_reference_op_t vro1, vro2;
731 vn_reference_op_s tem1, tem2;
732 bool deref1 = false, deref2 = false;
733 for (; vr1->operands.iterate (i, &vro1); i++)
735 if (vro1->opcode == MEM_REF)
736 deref1 = true;
737 /* Do not look through a storage order barrier. */
738 else if (vro1->opcode == VIEW_CONVERT_EXPR && vro1->reverse)
739 return false;
740 if (known_eq (vro1->off, -1))
741 break;
742 off1 += vro1->off;
744 for (; vr2->operands.iterate (j, &vro2); j++)
746 if (vro2->opcode == MEM_REF)
747 deref2 = true;
748 /* Do not look through a storage order barrier. */
749 else if (vro2->opcode == VIEW_CONVERT_EXPR && vro2->reverse)
750 return false;
751 if (known_eq (vro2->off, -1))
752 break;
753 off2 += vro2->off;
755 if (maybe_ne (off1, off2))
756 return false;
757 if (deref1 && vro1->opcode == ADDR_EXPR)
759 memset (&tem1, 0, sizeof (tem1));
760 tem1.op0 = TREE_OPERAND (vro1->op0, 0);
761 tem1.type = TREE_TYPE (tem1.op0);
762 tem1.opcode = TREE_CODE (tem1.op0);
763 vro1 = &tem1;
764 deref1 = false;
766 if (deref2 && vro2->opcode == ADDR_EXPR)
768 memset (&tem2, 0, sizeof (tem2));
769 tem2.op0 = TREE_OPERAND (vro2->op0, 0);
770 tem2.type = TREE_TYPE (tem2.op0);
771 tem2.opcode = TREE_CODE (tem2.op0);
772 vro2 = &tem2;
773 deref2 = false;
775 if (deref1 != deref2)
776 return false;
777 if (!vn_reference_op_eq (vro1, vro2))
778 return false;
779 ++j;
780 ++i;
782 while (vr1->operands.length () != i
783 || vr2->operands.length () != j);
785 return true;
788 /* Copy the operations present in load/store REF into RESULT, a vector of
789 vn_reference_op_s's. */
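/* For example (sketching the result for a plain VAR_DECL a), the reference
   a.b is decomposed into the operations
     { COMPONENT_REF <b>, MEM_REF <offset 0>, ADDR_EXPR <&a> }
   because decls are canonicalized to MEM[&decl] by the VAR_DECL case
   below.  */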
791 static void
792 copy_reference_ops_from_ref (tree ref, vec<vn_reference_op_s> *result)
794 if (TREE_CODE (ref) == TARGET_MEM_REF)
796 vn_reference_op_s temp;
798 result->reserve (3);
800 memset (&temp, 0, sizeof (temp));
801 temp.type = TREE_TYPE (ref);
802 temp.opcode = TREE_CODE (ref);
803 temp.op0 = TMR_INDEX (ref);
804 temp.op1 = TMR_STEP (ref);
805 temp.op2 = TMR_OFFSET (ref);
806 temp.off = -1;
807 temp.clique = MR_DEPENDENCE_CLIQUE (ref);
808 temp.base = MR_DEPENDENCE_BASE (ref);
809 result->quick_push (temp);
811 memset (&temp, 0, sizeof (temp));
812 temp.type = NULL_TREE;
813 temp.opcode = ERROR_MARK;
814 temp.op0 = TMR_INDEX2 (ref);
815 temp.off = -1;
816 result->quick_push (temp);
818 memset (&temp, 0, sizeof (temp));
819 temp.type = NULL_TREE;
820 temp.opcode = TREE_CODE (TMR_BASE (ref));
821 temp.op0 = TMR_BASE (ref);
822 temp.off = -1;
823 result->quick_push (temp);
824 return;
827 /* For non-calls, store the information that makes up the address. */
828 tree orig = ref;
829 while (ref)
831 vn_reference_op_s temp;
833 memset (&temp, 0, sizeof (temp));
834 temp.type = TREE_TYPE (ref);
835 temp.opcode = TREE_CODE (ref);
836 temp.off = -1;
838 switch (temp.opcode)
840 case MODIFY_EXPR:
841 temp.op0 = TREE_OPERAND (ref, 1);
842 break;
843 case WITH_SIZE_EXPR:
844 temp.op0 = TREE_OPERAND (ref, 1);
845 temp.off = 0;
846 break;
847 case MEM_REF:
848 /* The base address gets its own vn_reference_op_s structure. */
849 temp.op0 = TREE_OPERAND (ref, 1);
850 if (!mem_ref_offset (ref).to_shwi (&temp.off))
851 temp.off = -1;
852 temp.clique = MR_DEPENDENCE_CLIQUE (ref);
853 temp.base = MR_DEPENDENCE_BASE (ref);
854 temp.reverse = REF_REVERSE_STORAGE_ORDER (ref);
855 break;
856 case BIT_FIELD_REF:
857 /* Record bits, position and storage order. */
858 temp.op0 = TREE_OPERAND (ref, 1);
859 temp.op1 = TREE_OPERAND (ref, 2);
860 if (!multiple_p (bit_field_offset (ref), BITS_PER_UNIT, &temp.off))
861 temp.off = -1;
862 temp.reverse = REF_REVERSE_STORAGE_ORDER (ref);
863 break;
864 case COMPONENT_REF:
865 /* The field decl is enough to unambiguously specify the field,
866 a matching type is not necessary and a mismatching type
867 is always a spurious difference. */
868 temp.type = NULL_TREE;
869 temp.op0 = TREE_OPERAND (ref, 1);
870 temp.op1 = TREE_OPERAND (ref, 2);
872 tree this_offset = component_ref_field_offset (ref);
873 if (this_offset
874 && poly_int_tree_p (this_offset))
876 tree bit_offset = DECL_FIELD_BIT_OFFSET (TREE_OPERAND (ref, 1));
877 if (TREE_INT_CST_LOW (bit_offset) % BITS_PER_UNIT == 0)
879 poly_offset_int off
880 = (wi::to_poly_offset (this_offset)
881 + (wi::to_offset (bit_offset) >> LOG2_BITS_PER_UNIT));
 882 /* Prohibit value-numbering zero offset components
883 of addresses the same before the pass folding
884 __builtin_object_size had a chance to run
885 (checking cfun->after_inlining does the
886 trick here). */
887 if (TREE_CODE (orig) != ADDR_EXPR
888 || maybe_ne (off, 0)
889 || cfun->after_inlining)
890 off.to_shwi (&temp.off);
894 break;
895 case ARRAY_RANGE_REF:
896 case ARRAY_REF:
898 tree eltype = TREE_TYPE (TREE_TYPE (TREE_OPERAND (ref, 0)));
899 /* Record index as operand. */
900 temp.op0 = TREE_OPERAND (ref, 1);
901 /* Always record lower bounds and element size. */
902 temp.op1 = array_ref_low_bound (ref);
903 /* But record element size in units of the type alignment. */
904 temp.op2 = TREE_OPERAND (ref, 3);
905 temp.align = eltype->type_common.align;
906 if (! temp.op2)
907 temp.op2 = size_binop (EXACT_DIV_EXPR, TYPE_SIZE_UNIT (eltype),
908 size_int (TYPE_ALIGN_UNIT (eltype)));
909 if (poly_int_tree_p (temp.op0)
910 && poly_int_tree_p (temp.op1)
911 && TREE_CODE (temp.op2) == INTEGER_CST)
913 poly_offset_int off = ((wi::to_poly_offset (temp.op0)
914 - wi::to_poly_offset (temp.op1))
915 * wi::to_offset (temp.op2)
916 * vn_ref_op_align_unit (&temp));
917 off.to_shwi (&temp.off);
920 break;
921 case VAR_DECL:
922 if (DECL_HARD_REGISTER (ref))
924 temp.op0 = ref;
925 break;
927 /* Fallthru. */
928 case PARM_DECL:
929 case CONST_DECL:
930 case RESULT_DECL:
931 /* Canonicalize decls to MEM[&decl] which is what we end up with
932 when valueizing MEM[ptr] with ptr = &decl. */
933 temp.opcode = MEM_REF;
934 temp.op0 = build_int_cst (build_pointer_type (TREE_TYPE (ref)), 0);
935 temp.off = 0;
936 result->safe_push (temp);
937 temp.opcode = ADDR_EXPR;
938 temp.op0 = build1 (ADDR_EXPR, TREE_TYPE (temp.op0), ref);
939 temp.type = TREE_TYPE (temp.op0);
940 temp.off = -1;
941 break;
942 case STRING_CST:
943 case INTEGER_CST:
944 case COMPLEX_CST:
945 case VECTOR_CST:
946 case REAL_CST:
947 case FIXED_CST:
948 case CONSTRUCTOR:
949 case SSA_NAME:
950 temp.op0 = ref;
951 break;
952 case ADDR_EXPR:
953 if (is_gimple_min_invariant (ref))
955 temp.op0 = ref;
956 break;
958 break;
959 /* These are only interesting for their operands, their
960 existence, and their type. They will never be the last
 961 ref in the chain of references (i.e. they require an
962 operand), so we don't have to put anything
963 for op* as it will be handled by the iteration */
964 case REALPART_EXPR:
965 temp.off = 0;
966 break;
967 case VIEW_CONVERT_EXPR:
968 temp.off = 0;
969 temp.reverse = storage_order_barrier_p (ref);
970 break;
971 case IMAGPART_EXPR:
972 /* This is only interesting for its constant offset. */
973 temp.off = TREE_INT_CST_LOW (TYPE_SIZE_UNIT (TREE_TYPE (ref)));
974 break;
975 default:
976 gcc_unreachable ();
978 result->safe_push (temp);
980 if (REFERENCE_CLASS_P (ref)
981 || TREE_CODE (ref) == MODIFY_EXPR
982 || TREE_CODE (ref) == WITH_SIZE_EXPR
983 || (TREE_CODE (ref) == ADDR_EXPR
984 && !is_gimple_min_invariant (ref)))
985 ref = TREE_OPERAND (ref, 0);
986 else
987 ref = NULL_TREE;
 991 /* Build an alias-oracle reference abstraction in *REF from the vn_reference
992 operands in *OPS, the reference alias set SET and the reference type TYPE.
993 Return true if something useful was produced. */
995 bool
996 ao_ref_init_from_vn_reference (ao_ref *ref,
997 alias_set_type set, tree type,
998 vec<vn_reference_op_s> ops)
1000 vn_reference_op_t op;
1001 unsigned i;
1002 tree base = NULL_TREE;
1003 tree *op0_p = &base;
1004 poly_offset_int offset = 0;
1005 poly_offset_int max_size;
1006 poly_offset_int size = -1;
1007 tree size_tree = NULL_TREE;
1008 alias_set_type base_alias_set = -1;
1010 /* First get the final access size from just the outermost expression. */
1011 op = &ops[0];
1012 if (op->opcode == COMPONENT_REF)
1013 size_tree = DECL_SIZE (op->op0);
1014 else if (op->opcode == BIT_FIELD_REF)
1015 size_tree = op->op0;
1016 else
1018 machine_mode mode = TYPE_MODE (type);
1019 if (mode == BLKmode)
1020 size_tree = TYPE_SIZE (type);
1021 else
1022 size = GET_MODE_BITSIZE (mode);
1024 if (size_tree != NULL_TREE
1025 && poly_int_tree_p (size_tree))
1026 size = wi::to_poly_offset (size_tree);
1028 /* Initially, maxsize is the same as the accessed element size.
1029 In the following it will only grow (or become -1). */
1030 max_size = size;
1032 /* Compute cumulative bit-offset for nested component-refs and array-refs,
1033 and find the ultimate containing object. */
1034 FOR_EACH_VEC_ELT (ops, i, op)
1036 switch (op->opcode)
1038 /* These may be in the reference ops, but we cannot do anything
1039 sensible with them here. */
1040 case ADDR_EXPR:
1041 /* Apart from ADDR_EXPR arguments to MEM_REF. */
1042 if (base != NULL_TREE
1043 && TREE_CODE (base) == MEM_REF
1044 && op->op0
1045 && DECL_P (TREE_OPERAND (op->op0, 0)))
1047 vn_reference_op_t pop = &ops[i-1];
1048 base = TREE_OPERAND (op->op0, 0);
1049 if (known_eq (pop->off, -1))
1051 max_size = -1;
1052 offset = 0;
1054 else
1055 offset += pop->off * BITS_PER_UNIT;
1056 op0_p = NULL;
1057 break;
1059 /* Fallthru. */
1060 case CALL_EXPR:
1061 return false;
1063 /* Record the base objects. */
1064 case MEM_REF:
1065 base_alias_set = get_deref_alias_set (op->op0);
1066 *op0_p = build2 (MEM_REF, op->type,
1067 NULL_TREE, op->op0);
1068 MR_DEPENDENCE_CLIQUE (*op0_p) = op->clique;
1069 MR_DEPENDENCE_BASE (*op0_p) = op->base;
1070 op0_p = &TREE_OPERAND (*op0_p, 0);
1071 break;
1073 case VAR_DECL:
1074 case PARM_DECL:
1075 case RESULT_DECL:
1076 case SSA_NAME:
1077 *op0_p = op->op0;
1078 op0_p = NULL;
1079 break;
1081 /* And now the usual component-reference style ops. */
1082 case BIT_FIELD_REF:
1083 offset += wi::to_poly_offset (op->op1);
1084 break;
1086 case COMPONENT_REF:
1088 tree field = op->op0;
1089 /* We do not have a complete COMPONENT_REF tree here so we
1090 cannot use component_ref_field_offset. Do the interesting
1091 parts manually. */
1092 tree this_offset = DECL_FIELD_OFFSET (field);
1094 if (op->op1 || !poly_int_tree_p (this_offset))
1095 max_size = -1;
1096 else
1098 poly_offset_int woffset = (wi::to_poly_offset (this_offset)
1099 << LOG2_BITS_PER_UNIT);
1100 woffset += wi::to_offset (DECL_FIELD_BIT_OFFSET (field));
1101 offset += woffset;
1103 break;
1106 case ARRAY_RANGE_REF:
1107 case ARRAY_REF:
1108 /* We recorded the lower bound and the element size. */
1109 if (!poly_int_tree_p (op->op0)
1110 || !poly_int_tree_p (op->op1)
1111 || TREE_CODE (op->op2) != INTEGER_CST)
1112 max_size = -1;
1113 else
1115 poly_offset_int woffset
1116 = wi::sext (wi::to_poly_offset (op->op0)
1117 - wi::to_poly_offset (op->op1),
1118 TYPE_PRECISION (TREE_TYPE (op->op0)));
1119 woffset *= wi::to_offset (op->op2) * vn_ref_op_align_unit (op);
1120 woffset <<= LOG2_BITS_PER_UNIT;
1121 offset += woffset;
1123 break;
1125 case REALPART_EXPR:
1126 break;
1128 case IMAGPART_EXPR:
1129 offset += size;
1130 break;
1132 case VIEW_CONVERT_EXPR:
1133 break;
1135 case STRING_CST:
1136 case INTEGER_CST:
1137 case COMPLEX_CST:
1138 case VECTOR_CST:
1139 case REAL_CST:
1140 case CONSTRUCTOR:
1141 case CONST_DECL:
1142 return false;
1144 default:
1145 return false;
1149 if (base == NULL_TREE)
1150 return false;
1152 ref->ref = NULL_TREE;
1153 ref->base = base;
1154 ref->ref_alias_set = set;
1155 if (base_alias_set != -1)
1156 ref->base_alias_set = base_alias_set;
1157 else
1158 ref->base_alias_set = get_alias_set (base);
1159 /* We discount volatiles from value-numbering elsewhere. */
1160 ref->volatile_p = false;
1162 if (!size.to_shwi (&ref->size) || maybe_lt (ref->size, 0))
1164 ref->offset = 0;
1165 ref->size = -1;
1166 ref->max_size = -1;
1167 return true;
1170 if (!offset.to_shwi (&ref->offset))
1172 ref->offset = 0;
1173 ref->max_size = -1;
1174 return true;
1177 if (!max_size.to_shwi (&ref->max_size) || maybe_lt (ref->max_size, 0))
1178 ref->max_size = -1;
1180 return true;
1183 /* Copy the operations present in load/store/call REF into RESULT, a vector of
1184 vn_reference_op_s's. */
1186 static void
1187 copy_reference_ops_from_call (gcall *call,
1188 vec<vn_reference_op_s> *result)
1190 vn_reference_op_s temp;
1191 unsigned i;
1192 tree lhs = gimple_call_lhs (call);
1193 int lr;
1195 /* If 2 calls have a different non-ssa lhs, vdef value numbers should be
1196 different. By adding the lhs here in the vector, we ensure that the
1197 hashcode is different, guaranteeing a different value number. */
1198 if (lhs && TREE_CODE (lhs) != SSA_NAME)
1200 memset (&temp, 0, sizeof (temp));
1201 temp.opcode = MODIFY_EXPR;
1202 temp.type = TREE_TYPE (lhs);
1203 temp.op0 = lhs;
1204 temp.off = -1;
1205 result->safe_push (temp);
1208 /* Copy the type, opcode, function, static chain and EH region, if any. */
1209 memset (&temp, 0, sizeof (temp));
1210 temp.type = gimple_call_fntype (call);
1211 temp.opcode = CALL_EXPR;
1212 temp.op0 = gimple_call_fn (call);
1213 temp.op1 = gimple_call_chain (call);
1214 if (stmt_could_throw_p (cfun, call) && (lr = lookup_stmt_eh_lp (call)) > 0)
1215 temp.op2 = size_int (lr);
1216 temp.off = -1;
1217 result->safe_push (temp);
1219 /* Copy the call arguments. As they can be references as well,
1220 just chain them together. */
1221 for (i = 0; i < gimple_call_num_args (call); ++i)
1223 tree callarg = gimple_call_arg (call, i);
1224 copy_reference_ops_from_ref (callarg, result);
1228 /* Fold *& at position *I_P in a vn_reference_op_s vector *OPS. Updates
1229 *I_P to point to the last element of the replacement. */
1230 static bool
1231 vn_reference_fold_indirect (vec<vn_reference_op_s> *ops,
1232 unsigned int *i_p)
1234 unsigned int i = *i_p;
1235 vn_reference_op_t op = &(*ops)[i];
1236 vn_reference_op_t mem_op = &(*ops)[i - 1];
1237 tree addr_base;
1238 poly_int64 addr_offset = 0;
1240 /* The only thing we have to do is from &OBJ.foo.bar add the offset
1241 from .foo.bar to the preceding MEM_REF offset and replace the
1242 address with &OBJ. */
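 /* E.g. if foo.bar sits at byte offset 8 within OBJ, the operand pair
    { MEM_REF <4>, ADDR_EXPR <&OBJ.foo.bar> } becomes
    { MEM_REF <12>, ADDR_EXPR <&OBJ> } (the offsets here are made up
    for illustration).  */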
1243 addr_base = get_addr_base_and_unit_offset (TREE_OPERAND (op->op0, 0),
1244 &addr_offset);
1245 gcc_checking_assert (addr_base && TREE_CODE (addr_base) != MEM_REF);
1246 if (addr_base != TREE_OPERAND (op->op0, 0))
1248 poly_offset_int off
1249 = (poly_offset_int::from (wi::to_poly_wide (mem_op->op0),
1250 SIGNED)
1251 + addr_offset);
1252 mem_op->op0 = wide_int_to_tree (TREE_TYPE (mem_op->op0), off);
1253 op->op0 = build_fold_addr_expr (addr_base);
1254 if (tree_fits_shwi_p (mem_op->op0))
1255 mem_op->off = tree_to_shwi (mem_op->op0);
1256 else
1257 mem_op->off = -1;
1258 return true;
1260 return false;
1263 /* Fold *& at position *I_P in a vn_reference_op_s vector *OPS. Updates
1264 *I_P to point to the last element of the replacement. */
1265 static bool
1266 vn_reference_maybe_forwprop_address (vec<vn_reference_op_s> *ops,
1267 unsigned int *i_p)
1269 unsigned int i = *i_p;
1270 vn_reference_op_t op = &(*ops)[i];
1271 vn_reference_op_t mem_op = &(*ops)[i - 1];
1272 gimple *def_stmt;
1273 enum tree_code code;
1274 poly_offset_int off;
1276 def_stmt = SSA_NAME_DEF_STMT (op->op0);
1277 if (!is_gimple_assign (def_stmt))
1278 return false;
1280 code = gimple_assign_rhs_code (def_stmt);
1281 if (code != ADDR_EXPR
1282 && code != POINTER_PLUS_EXPR)
1283 return false;
1285 off = poly_offset_int::from (wi::to_poly_wide (mem_op->op0), SIGNED);
1287 /* The only thing we have to do is from &OBJ.foo.bar add the offset
1288 from .foo.bar to the preceding MEM_REF offset and replace the
1289 address with &OBJ. */
1290 if (code == ADDR_EXPR)
1292 tree addr, addr_base;
1293 poly_int64 addr_offset;
1295 addr = gimple_assign_rhs1 (def_stmt);
1296 addr_base = get_addr_base_and_unit_offset (TREE_OPERAND (addr, 0),
1297 &addr_offset);
1298 /* If that didn't work because the address isn't invariant propagate
1299 the reference tree from the address operation in case the current
1300 dereference isn't offsetted. */
1301 if (!addr_base
1302 && *i_p == ops->length () - 1
1303 && known_eq (off, 0)
1304 /* This makes us disable this transform for PRE where the
1305 reference ops might be also used for code insertion which
1306 is invalid. */
1307 && default_vn_walk_kind == VN_WALKREWRITE)
1309 auto_vec<vn_reference_op_s, 32> tem;
1310 copy_reference_ops_from_ref (TREE_OPERAND (addr, 0), &tem);
1311 /* Make sure to preserve TBAA info. The only objects not
1312 wrapped in MEM_REFs that can have their address taken are
1313 STRING_CSTs. */
1314 if (tem.length () >= 2
1315 && tem[tem.length () - 2].opcode == MEM_REF)
1317 vn_reference_op_t new_mem_op = &tem[tem.length () - 2];
1318 new_mem_op->op0
1319 = wide_int_to_tree (TREE_TYPE (mem_op->op0),
1320 wi::to_poly_wide (new_mem_op->op0));
1322 else
1323 gcc_assert (tem.last ().opcode == STRING_CST);
1324 ops->pop ();
1325 ops->pop ();
1326 ops->safe_splice (tem);
1327 --*i_p;
1328 return true;
1330 if (!addr_base
1331 || TREE_CODE (addr_base) != MEM_REF
1332 || (TREE_CODE (TREE_OPERAND (addr_base, 0)) == SSA_NAME
1333 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (TREE_OPERAND (addr_base, 0))))
1334 return false;
1336 off += addr_offset;
1337 off += mem_ref_offset (addr_base);
1338 op->op0 = TREE_OPERAND (addr_base, 0);
1340 else
1342 tree ptr, ptroff;
1343 ptr = gimple_assign_rhs1 (def_stmt);
1344 ptroff = gimple_assign_rhs2 (def_stmt);
1345 if (TREE_CODE (ptr) != SSA_NAME
1346 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (ptr)
1347 /* Make sure to not endlessly recurse.
1348 See gcc.dg/tree-ssa/20040408-1.c for an example. Can easily
1349 happen when we value-number a PHI to its backedge value. */
1350 || SSA_VAL (ptr) == op->op0
1351 || !poly_int_tree_p (ptroff))
1352 return false;
1354 off += wi::to_poly_offset (ptroff);
1355 op->op0 = ptr;
1358 mem_op->op0 = wide_int_to_tree (TREE_TYPE (mem_op->op0), off);
1359 if (tree_fits_shwi_p (mem_op->op0))
1360 mem_op->off = tree_to_shwi (mem_op->op0);
1361 else
1362 mem_op->off = -1;
1363 /* ??? Can end up with endless recursion here!?
1364 gcc.c-torture/execute/strcmp-1.c */
1365 if (TREE_CODE (op->op0) == SSA_NAME)
1366 op->op0 = SSA_VAL (op->op0);
1367 if (TREE_CODE (op->op0) != SSA_NAME)
1368 op->opcode = TREE_CODE (op->op0);
1370 /* And recurse. */
1371 if (TREE_CODE (op->op0) == SSA_NAME)
1372 vn_reference_maybe_forwprop_address (ops, i_p);
1373 else if (TREE_CODE (op->op0) == ADDR_EXPR)
1374 vn_reference_fold_indirect (ops, i_p);
1375 return true;
1378 /* Optimize the reference REF to a constant if possible or return
1379 NULL_TREE if not. */
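/* For example, a load such as

     static const int tab[4] = { 1, 2, 3, 4 };
     ... = tab[2];

   can be replaced by the constant 3, either via fold_ctor_reference when the
   base decl is known or via native_encode_expr / native_interpret_expr on the
   constructor.  */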
1381 tree
1382 fully_constant_vn_reference_p (vn_reference_t ref)
1384 vec<vn_reference_op_s> operands = ref->operands;
1385 vn_reference_op_t op;
1387 /* Try to simplify the translated expression if it is
1388 a call to a builtin function with at most two arguments. */
1389 op = &operands[0];
1390 if (op->opcode == CALL_EXPR
1391 && TREE_CODE (op->op0) == ADDR_EXPR
1392 && TREE_CODE (TREE_OPERAND (op->op0, 0)) == FUNCTION_DECL
1393 && fndecl_built_in_p (TREE_OPERAND (op->op0, 0))
1394 && operands.length () >= 2
1395 && operands.length () <= 3)
1397 vn_reference_op_t arg0, arg1 = NULL;
1398 bool anyconst = false;
1399 arg0 = &operands[1];
1400 if (operands.length () > 2)
1401 arg1 = &operands[2];
1402 if (TREE_CODE_CLASS (arg0->opcode) == tcc_constant
1403 || (arg0->opcode == ADDR_EXPR
1404 && is_gimple_min_invariant (arg0->op0)))
1405 anyconst = true;
1406 if (arg1
1407 && (TREE_CODE_CLASS (arg1->opcode) == tcc_constant
1408 || (arg1->opcode == ADDR_EXPR
1409 && is_gimple_min_invariant (arg1->op0))))
1410 anyconst = true;
1411 if (anyconst)
1413 tree folded = build_call_expr (TREE_OPERAND (op->op0, 0),
1414 arg1 ? 2 : 1,
1415 arg0->op0,
1416 arg1 ? arg1->op0 : NULL);
1417 if (folded
1418 && TREE_CODE (folded) == NOP_EXPR)
1419 folded = TREE_OPERAND (folded, 0);
1420 if (folded
1421 && is_gimple_min_invariant (folded))
1422 return folded;
1426 /* Simplify reads from constants or constant initializers. */
1427 else if (BITS_PER_UNIT == 8
1428 && COMPLETE_TYPE_P (ref->type)
1429 && is_gimple_reg_type (ref->type))
1431 poly_int64 off = 0;
1432 HOST_WIDE_INT size;
1433 if (INTEGRAL_TYPE_P (ref->type))
1434 size = TYPE_PRECISION (ref->type);
1435 else if (tree_fits_shwi_p (TYPE_SIZE (ref->type)))
1436 size = tree_to_shwi (TYPE_SIZE (ref->type));
1437 else
1438 return NULL_TREE;
1439 if (size % BITS_PER_UNIT != 0
1440 || size > MAX_BITSIZE_MODE_ANY_MODE)
1441 return NULL_TREE;
1442 size /= BITS_PER_UNIT;
1443 unsigned i;
1444 for (i = 0; i < operands.length (); ++i)
1446 if (TREE_CODE_CLASS (operands[i].opcode) == tcc_constant)
1448 ++i;
1449 break;
1451 if (known_eq (operands[i].off, -1))
1452 return NULL_TREE;
1453 off += operands[i].off;
1454 if (operands[i].opcode == MEM_REF)
1456 ++i;
1457 break;
1460 vn_reference_op_t base = &operands[--i];
1461 tree ctor = error_mark_node;
1462 tree decl = NULL_TREE;
1463 if (TREE_CODE_CLASS (base->opcode) == tcc_constant)
1464 ctor = base->op0;
1465 else if (base->opcode == MEM_REF
1466 && base[1].opcode == ADDR_EXPR
1467 && (TREE_CODE (TREE_OPERAND (base[1].op0, 0)) == VAR_DECL
1468 || TREE_CODE (TREE_OPERAND (base[1].op0, 0)) == CONST_DECL
1469 || TREE_CODE (TREE_OPERAND (base[1].op0, 0)) == STRING_CST))
1471 decl = TREE_OPERAND (base[1].op0, 0);
1472 if (TREE_CODE (decl) == STRING_CST)
1473 ctor = decl;
1474 else
1475 ctor = ctor_for_folding (decl);
1477 if (ctor == NULL_TREE)
1478 return build_zero_cst (ref->type);
1479 else if (ctor != error_mark_node)
1481 HOST_WIDE_INT const_off;
1482 if (decl)
1484 tree res = fold_ctor_reference (ref->type, ctor,
1485 off * BITS_PER_UNIT,
1486 size * BITS_PER_UNIT, decl);
1487 if (res)
1489 STRIP_USELESS_TYPE_CONVERSION (res);
1490 if (is_gimple_min_invariant (res))
1491 return res;
1494 else if (off.is_constant (&const_off))
1496 unsigned char buf[MAX_BITSIZE_MODE_ANY_MODE / BITS_PER_UNIT];
1497 int len = native_encode_expr (ctor, buf, size, const_off);
1498 if (len > 0)
1499 return native_interpret_expr (ref->type, buf, len);
1504 return NULL_TREE;
1507 /* Return true if OPS contain a storage order barrier. */
1509 static bool
1510 contains_storage_order_barrier_p (vec<vn_reference_op_s> ops)
1512 vn_reference_op_t op;
1513 unsigned i;
1515 FOR_EACH_VEC_ELT (ops, i, op)
1516 if (op->opcode == VIEW_CONVERT_EXPR && op->reverse)
1517 return true;
1519 return false;
1522 /* Transform any SSA_NAME's in a vector of vn_reference_op_s
1523 structures into their value numbers. This is done in-place, and
1524 the vector passed in is returned. *VALUEIZED_ANYTHING will specify
1525 whether any operands were valueized. */
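/* For instance (hypothetical SSA names), if the index i_1 of an ARRAY_REF
   has the constant 3 as its value number, op0 is replaced by 3 and the
   now-constant offset of the access is recomputed; see the ARRAY_REF
   handling below.  */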
1527 static vec<vn_reference_op_s>
1528 valueize_refs_1 (vec<vn_reference_op_s> orig, bool *valueized_anything,
1529 bool with_avail = false)
1531 vn_reference_op_t vro;
1532 unsigned int i;
1534 *valueized_anything = false;
1536 FOR_EACH_VEC_ELT (orig, i, vro)
1538 if (vro->opcode == SSA_NAME
1539 || (vro->op0 && TREE_CODE (vro->op0) == SSA_NAME))
1541 tree tem = with_avail ? vn_valueize (vro->op0) : SSA_VAL (vro->op0);
1542 if (tem != vro->op0)
1544 *valueized_anything = true;
1545 vro->op0 = tem;
1547 /* If it transforms from an SSA_NAME to a constant, update
1548 the opcode. */
1549 if (TREE_CODE (vro->op0) != SSA_NAME && vro->opcode == SSA_NAME)
1550 vro->opcode = TREE_CODE (vro->op0);
1552 if (vro->op1 && TREE_CODE (vro->op1) == SSA_NAME)
1554 tree tem = with_avail ? vn_valueize (vro->op1) : SSA_VAL (vro->op1);
1555 if (tem != vro->op1)
1557 *valueized_anything = true;
1558 vro->op1 = tem;
1561 if (vro->op2 && TREE_CODE (vro->op2) == SSA_NAME)
1563 tree tem = with_avail ? vn_valueize (vro->op2) : SSA_VAL (vro->op2);
1564 if (tem != vro->op2)
1566 *valueized_anything = true;
1567 vro->op2 = tem;
1570 /* If it transforms from an SSA_NAME to an address, fold with
1571 a preceding indirect reference. */
1572 if (i > 0
1573 && vro->op0
1574 && TREE_CODE (vro->op0) == ADDR_EXPR
1575 && orig[i - 1].opcode == MEM_REF)
1577 if (vn_reference_fold_indirect (&orig, &i))
1578 *valueized_anything = true;
1580 else if (i > 0
1581 && vro->opcode == SSA_NAME
1582 && orig[i - 1].opcode == MEM_REF)
1584 if (vn_reference_maybe_forwprop_address (&orig, &i))
1585 *valueized_anything = true;
1587 /* If it transforms a non-constant ARRAY_REF into a constant
1588 one, adjust the constant offset. */
1589 else if (vro->opcode == ARRAY_REF
1590 && known_eq (vro->off, -1)
1591 && poly_int_tree_p (vro->op0)
1592 && poly_int_tree_p (vro->op1)
1593 && TREE_CODE (vro->op2) == INTEGER_CST)
1595 poly_offset_int off = ((wi::to_poly_offset (vro->op0)
1596 - wi::to_poly_offset (vro->op1))
1597 * wi::to_offset (vro->op2)
1598 * vn_ref_op_align_unit (vro));
1599 off.to_shwi (&vro->off);
1603 return orig;
1606 static vec<vn_reference_op_s>
1607 valueize_refs (vec<vn_reference_op_s> orig)
1609 bool tem;
1610 return valueize_refs_1 (orig, &tem);
1613 static vec<vn_reference_op_s> shared_lookup_references;
1615 /* Create a vector of vn_reference_op_s structures from REF, a
1616 REFERENCE_CLASS_P tree. The vector is shared among all callers of
1617 this function. *VALUEIZED_ANYTHING will specify whether any
1618 operands were valueized. */
1620 static vec<vn_reference_op_s>
1621 valueize_shared_reference_ops_from_ref (tree ref, bool *valueized_anything)
1623 if (!ref)
1624 return vNULL;
1625 shared_lookup_references.truncate (0);
1626 copy_reference_ops_from_ref (ref, &shared_lookup_references);
1627 shared_lookup_references = valueize_refs_1 (shared_lookup_references,
1628 valueized_anything);
1629 return shared_lookup_references;
1632 /* Create a vector of vn_reference_op_s structures from CALL, a
1633 call statement. The vector is shared among all callers of
1634 this function. */
1636 static vec<vn_reference_op_s>
1637 valueize_shared_reference_ops_from_call (gcall *call)
1639 if (!call)
1640 return vNULL;
1641 shared_lookup_references.truncate (0);
1642 copy_reference_ops_from_call (call, &shared_lookup_references);
1643 shared_lookup_references = valueize_refs (shared_lookup_references);
1644 return shared_lookup_references;
1647 /* Lookup a SCCVN reference operation VR in the current hash table.
1648 Returns the resulting value number if it exists in the hash table,
1649 NULL_TREE otherwise. VNRESULT will be filled in with the actual
1650 vn_reference_t stored in the hashtable if something is found. */
1652 static tree
1653 vn_reference_lookup_1 (vn_reference_t vr, vn_reference_t *vnresult)
1655 vn_reference_s **slot;
1656 hashval_t hash;
1658 hash = vr->hashcode;
1659 slot = valid_info->references->find_slot_with_hash (vr, hash, NO_INSERT);
1660 if (slot)
1662 if (vnresult)
1663 *vnresult = (vn_reference_t)*slot;
1664 return ((vn_reference_t)*slot)->result;
1667 return NULL_TREE;
1670 /* Callback for walk_non_aliased_vuses. Adjusts the vn_reference_t VR_
1671 with the current VUSE and performs the expression lookup. */
1673 static void *
1674 vn_reference_lookup_2 (ao_ref *op ATTRIBUTE_UNUSED, tree vuse,
1675 unsigned int cnt, void *vr_)
1677 vn_reference_t vr = (vn_reference_t)vr_;
1678 vn_reference_s **slot;
1679 hashval_t hash;
1681 /* This bounds the stmt walks we perform on reference lookups
1682 to O(1) instead of O(N) where N is the number of dominating
1683 stores. */
1684 if (cnt > (unsigned) PARAM_VALUE (PARAM_SCCVN_MAX_ALIAS_QUERIES_PER_ACCESS))
1685 return (void *)-1;
1687 if (last_vuse_ptr)
1688 *last_vuse_ptr = vuse;
1690 /* Fixup vuse and hash. */
1691 if (vr->vuse)
1692 vr->hashcode = vr->hashcode - SSA_NAME_VERSION (vr->vuse);
1693 vr->vuse = vuse_ssa_val (vuse);
1694 if (vr->vuse)
1695 vr->hashcode = vr->hashcode + SSA_NAME_VERSION (vr->vuse);
1697 hash = vr->hashcode;
1698 slot = valid_info->references->find_slot_with_hash (vr, hash, NO_INSERT);
1699 if (slot)
1700 return *slot;
1702 return NULL;
1705 /* Lookup an existing or insert a new vn_reference entry into the
1706 value table for the VUSE, SET, TYPE, OPERANDS reference which
1707 has the value VALUE which is either a constant or an SSA name. */
1709 static vn_reference_t
1710 vn_reference_lookup_or_insert_for_pieces (tree vuse,
1711 alias_set_type set,
1712 tree type,
1713 vec<vn_reference_op_s,
1714 va_heap> operands,
1715 tree value)
1717 vn_reference_s vr1;
1718 vn_reference_t result;
1719 unsigned value_id;
1720 vr1.vuse = vuse ? SSA_VAL (vuse) : NULL_TREE;
1721 vr1.operands = operands;
1722 vr1.type = type;
1723 vr1.set = set;
1724 vr1.hashcode = vn_reference_compute_hash (&vr1);
1725 if (vn_reference_lookup_1 (&vr1, &result))
1726 return result;
1727 if (TREE_CODE (value) == SSA_NAME)
1728 value_id = VN_INFO (value)->value_id;
1729 else
1730 value_id = get_or_alloc_constant_value_id (value);
1731 return vn_reference_insert_pieces (vuse, set, type,
1732 operands.copy (), value, value_id);
1735 /* Return a value-number for RCODE OPS... either by looking up an existing
1736 value-number for the simplified result or by inserting the operation if
1737 INSERT is true. */
1739 static tree
1740 vn_nary_build_or_lookup_1 (gimple_match_op *res_op, bool insert)
1742 tree result = NULL_TREE;
1743 /* We will be creating a value number for
1744 RCODE (OPS...).
1745 So first simplify and lookup this expression to see if it
1746 is already available. */
1747 mprts_hook = vn_lookup_simplify_result;
1748 bool res = false;
1749 switch (TREE_CODE_LENGTH ((tree_code) res_op->code))
1751 case 1:
1752 res = gimple_resimplify1 (NULL, res_op, vn_valueize);
1753 break;
1754 case 2:
1755 res = gimple_resimplify2 (NULL, res_op, vn_valueize);
1756 break;
1757 case 3:
1758 res = gimple_resimplify3 (NULL, res_op, vn_valueize);
1759 break;
1761 mprts_hook = NULL;
1762 gimple *new_stmt = NULL;
1763 if (res
1764 && gimple_simplified_result_is_gimple_val (res_op))
1766 /* The expression is already available. */
1767 result = res_op->ops[0];
 1768 /* Valueize it, simplification returns something in AVAIL only. */
1769 if (TREE_CODE (result) == SSA_NAME)
1770 result = SSA_VAL (result);
1772 else
1774 tree val = vn_lookup_simplify_result (res_op);
1775 if (!val && insert)
1777 gimple_seq stmts = NULL;
1778 result = maybe_push_res_to_seq (res_op, &stmts);
1779 if (result)
1781 gcc_assert (gimple_seq_singleton_p (stmts));
1782 new_stmt = gimple_seq_first_stmt (stmts);
1785 else
1786 /* The expression is already available. */
1787 result = val;
1789 if (new_stmt)
1791 /* The expression is not yet available, value-number lhs to
1792 the new SSA_NAME we created. */
1793 /* Initialize value-number information properly. */
1794 vn_ssa_aux_t result_info = VN_INFO (result);
1795 result_info->valnum = result;
1796 result_info->value_id = get_next_value_id ();
1797 result_info->visited = 1;
1798 gimple_seq_add_stmt_without_update (&VN_INFO (result)->expr,
1799 new_stmt);
1800 result_info->needs_insertion = true;
1801 /* ??? PRE phi-translation inserts NARYs without corresponding
1802 SSA name result. Re-use those but set their result according
1803 to the stmt we just built. */
1804 vn_nary_op_t nary = NULL;
1805 vn_nary_op_lookup_stmt (new_stmt, &nary);
1806 if (nary)
1808 gcc_assert (! nary->predicated_values && nary->u.result == NULL_TREE);
1809 nary->u.result = gimple_assign_lhs (new_stmt);
1811 /* As all "inserted" statements are singleton SCCs, insert
1812 to the valid table. This is strictly needed to
1813 avoid re-generating new value SSA_NAMEs for the same
1814 expression during SCC iteration over and over (the
1815 optimistic table gets cleared after each iteration).
1816 We do not need to insert into the optimistic table, as
1817 lookups there will fall back to the valid table. */
1818 else
1820 unsigned int length = vn_nary_length_from_stmt (new_stmt);
1821 vn_nary_op_t vno1
1822 = alloc_vn_nary_op_noinit (length, &vn_tables_insert_obstack);
1823 vno1->value_id = result_info->value_id;
1824 vno1->length = length;
1825 vno1->predicated_values = 0;
1826 vno1->u.result = result;
1827 init_vn_nary_op_from_stmt (vno1, new_stmt);
1828 vn_nary_op_insert_into (vno1, valid_info->nary, true);
1829 /* Also do not link it into the undo chain. */
1830 last_inserted_nary = vno1->next;
1831 vno1->next = (vn_nary_op_t)(void *)-1;
1833 if (dump_file && (dump_flags & TDF_DETAILS))
1835 fprintf (dump_file, "Inserting name ");
1836 print_generic_expr (dump_file, result);
1837 fprintf (dump_file, " for expression ");
1838 print_gimple_expr (dump_file, new_stmt, 0, TDF_SLIM);
1839 fprintf (dump_file, "\n");
1842 return result;
1845 /* Return a value-number for RCODE OPS... either by looking up an existing
1846 value-number for the simplified result or by inserting the operation. */
1848 static tree
1849 vn_nary_build_or_lookup (gimple_match_op *res_op)
1851 return vn_nary_build_or_lookup_1 (res_op, true);
1854 /* Try to simplify the expression RCODE OPS... of type TYPE and return
1855 its value if present. */
1857 tree
1858 vn_nary_simplify (vn_nary_op_t nary)
1860 if (nary->length > gimple_match_op::MAX_NUM_OPS)
1861 return NULL_TREE;
1862 gimple_match_op op (gimple_match_cond::UNCOND, nary->opcode,
1863 nary->type, nary->length);
1864 memcpy (op.ops, nary->op, sizeof (tree) * nary->length);
1865 return vn_nary_build_or_lookup_1 (&op, false);
1868 /* Elimination engine. */
1870 class eliminate_dom_walker : public dom_walker
1872 public:
1873 eliminate_dom_walker (cdi_direction, bitmap);
1874 ~eliminate_dom_walker ();
1876 virtual edge before_dom_children (basic_block);
1877 virtual void after_dom_children (basic_block);
1879 virtual tree eliminate_avail (basic_block, tree op);
1880 virtual void eliminate_push_avail (basic_block, tree op);
1881 tree eliminate_insert (basic_block, gimple_stmt_iterator *gsi, tree val);
1883 void eliminate_stmt (basic_block, gimple_stmt_iterator *);
1885 unsigned eliminate_cleanup (bool region_p = false);
1887 bool do_pre;
1888 unsigned int el_todo;
1889 unsigned int eliminations;
1890 unsigned int insertions;
1892 /* SSA names that had their defs inserted by PRE if do_pre. */
1893 bitmap inserted_exprs;
1895 /* Blocks with statements that have had their EH properties changed. */
1896 bitmap need_eh_cleanup;
1898 /* Blocks with statements that have had their AB properties changed. */
1899 bitmap need_ab_cleanup;
1901 /* Local state for the eliminate domwalk. */
1902 auto_vec<gimple *> to_remove;
1903 auto_vec<gimple *> to_fixup;
1904 auto_vec<tree> avail;
1905 auto_vec<tree> avail_stack;
1908 /* Adaptor to the elimination engine using RPO availability. */
1910 class rpo_elim : public eliminate_dom_walker
1912 public:
1913 rpo_elim(basic_block entry_)
1914 : eliminate_dom_walker (CDI_DOMINATORS, NULL), entry (entry_) {}
1915 ~rpo_elim();
1917 virtual tree eliminate_avail (basic_block, tree op);
1919 virtual void eliminate_push_avail (basic_block, tree);
1921 basic_block entry;
1922 /* Instead of having a local availability lattice for each
1923 basic-block and availability at X defined as union of
1924 the local availabilities at X and its dominators we're
 1925 turning this upside down and tracking availability per
 1926 value, given that values are usually made available at
 1927 very few points (at least one).
1928 So we have a value -> vec<location, leader> map where
1929 LOCATION is specifying the basic-block LEADER is made
1930 available for VALUE. We push to this vector in RPO
1931 order thus for iteration we can simply pop the last
1932 entries.
1933 LOCATION is the basic-block index and LEADER is its
1934 SSA name version. */
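 1935 /* For example, if the value of _7 is made available by _7 itself in
    basic block 3 and by the equivalent name _9 in basic block 5, the map
    contains _7 -> { (3, 7), (5, 9) }, pushed in RPO order (the block
    numbers and SSA names here are hypothetical).  */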
1935 /* ??? We'd like to use auto_vec here with embedded storage
1936 but that doesn't play well until we can provide move
1937 constructors and use std::move on hash-table expansion.
1938 So for now this is a bit more expensive than necessary.
1939 We eventually want to switch to a chaining scheme like
 1940 for hashtable entries for unwinding, which would make it
 1941 possible to make the vector part of the vn_ssa_aux structure. */
1942 typedef hash_map<tree, vec<std::pair<int, int> > > rpo_avail_t;
1943 rpo_avail_t m_rpo_avail;
1946 /* Global RPO state for access from hooks. */
1947 static rpo_elim *rpo_avail;
1948 basic_block vn_context_bb;
1950 /* Callback for walk_non_aliased_vuses. Tries to perform a lookup
1951 from the statement defining VUSE and if not successful tries to
1952 translate *REF and VR_ through an aggregate copy at the definition
1953 of VUSE. If *DISAMBIGUATE_ONLY is true then do not perform translation
1954 of *REF and *VR. If only disambiguation was performed then
1955 *DISAMBIGUATE_ONLY is set to true. */
1957 static void *
1958 vn_reference_lookup_3 (ao_ref *ref, tree vuse, void *vr_,
1959 bool *disambiguate_only)
1961 vn_reference_t vr = (vn_reference_t)vr_;
1962 gimple *def_stmt = SSA_NAME_DEF_STMT (vuse);
1963 tree base = ao_ref_base (ref);
1964 HOST_WIDE_INT offseti, maxsizei;
1965 static vec<vn_reference_op_s> lhs_ops;
1966 ao_ref lhs_ref;
1967 bool lhs_ref_ok = false;
1968 poly_int64 copy_size;
1970 /* First try to disambiguate after value-replacing in the definition's LHS. */
1971 if (is_gimple_assign (def_stmt))
1973 tree lhs = gimple_assign_lhs (def_stmt);
1974 bool valueized_anything = false;
1975 /* Avoid re-allocation overhead. */
1976 lhs_ops.truncate (0);
1977 basic_block saved_rpo_bb = vn_context_bb;
1978 vn_context_bb = gimple_bb (def_stmt);
1979 copy_reference_ops_from_ref (lhs, &lhs_ops);
1980 lhs_ops = valueize_refs_1 (lhs_ops, &valueized_anything, true);
1981 vn_context_bb = saved_rpo_bb;
1982 if (valueized_anything)
1984 lhs_ref_ok = ao_ref_init_from_vn_reference (&lhs_ref,
1985 get_alias_set (lhs),
1986 TREE_TYPE (lhs), lhs_ops);
1987 if (lhs_ref_ok
1988 && !refs_may_alias_p_1 (ref, &lhs_ref, true))
1990 *disambiguate_only = true;
1991 return NULL;
1994 else
1996 ao_ref_init (&lhs_ref, lhs);
1997 lhs_ref_ok = true;
2000 /* If we reach a clobbering statement try to skip it and see if
2001 we find a VN result with exactly the same value as the
2002 possible clobber. In this case we can ignore the clobber
2003 and return the found value.
2004 Note that we don't need to worry about partial overlapping
2005 accesses as we then can use TBAA to disambiguate against the
2006 clobbering statement when looking up a load (thus the
2007 VN_WALKREWRITE guard). */
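/* E.g. for
     *p_1 = x_2;
     ...
     *p_1 = x_2;   <- clobber storing the same value
     ... = *p_1;
   the second store can be skipped because looking up the load from
   just before it yields x_2 again.  */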
2008 if (vn_walk_kind == VN_WALKREWRITE
2009 && is_gimple_reg_type (TREE_TYPE (lhs))
2010 && types_compatible_p (TREE_TYPE (lhs), vr->type)
2011 /* The overlap restriction breaks down when either access
2012 alias-set is zero. Still for accesses of the size of
2013 an addressable unit there can be no overlaps. Overlaps
2014 between different union members are not an issue since
2015 activation of a union member via a store makes the
2016 values of untouched bytes unspecified. */
2017 && (known_eq (ref->size, BITS_PER_UNIT)
2018 || (get_alias_set (lhs) != 0
2019 && ao_ref_alias_set (ref) != 0)))
2021 tree *saved_last_vuse_ptr = last_vuse_ptr;
2022 /* Do not update last_vuse_ptr in vn_reference_lookup_2. */
2023 last_vuse_ptr = NULL;
2024 tree saved_vuse = vr->vuse;
2025 hashval_t saved_hashcode = vr->hashcode;
2026 void *res = vn_reference_lookup_2 (ref,
2027 gimple_vuse (def_stmt), 0, vr);
2028 /* Need to restore vr->vuse and vr->hashcode. */
2029 vr->vuse = saved_vuse;
2030 vr->hashcode = saved_hashcode;
2031 last_vuse_ptr = saved_last_vuse_ptr;
2032 if (res && res != (void *)-1)
2034 vn_reference_t vnresult = (vn_reference_t) res;
2035 if (vnresult->result
2036 && operand_equal_p (vnresult->result,
2037 gimple_assign_rhs1 (def_stmt), 0))
2038 return res;
2042 else if (gimple_call_builtin_p (def_stmt, BUILT_IN_NORMAL)
2043 && gimple_call_num_args (def_stmt) <= 4)
2045 /* For builtin calls, valueize their arguments and call the
2046 alias oracle again. Valueization may improve points-to
2047 info of pointers and constify size and position arguments.
2048 Originally this was motivated by PR61034 which has
2049 conditional calls to free falsely clobbering ref because
2050 of imprecise points-to info of the argument. */
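/* E.g. a guarded free (p_1) need not clobber *q_2 once p_1 is
   valueized to a pointer with more precise points-to information.  */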
2051 tree oldargs[4];
2052 bool valueized_anything = false;
2053 for (unsigned i = 0; i < gimple_call_num_args (def_stmt); ++i)
2055 oldargs[i] = gimple_call_arg (def_stmt, i);
2056 tree val = vn_valueize (oldargs[i]);
2057 if (val != oldargs[i])
2059 gimple_call_set_arg (def_stmt, i, val);
2060 valueized_anything = true;
2063 if (valueized_anything)
2065 bool res = call_may_clobber_ref_p_1 (as_a <gcall *> (def_stmt),
2066 ref);
2067 for (unsigned i = 0; i < gimple_call_num_args (def_stmt); ++i)
2068 gimple_call_set_arg (def_stmt, i, oldargs[i]);
2069 if (!res)
2071 *disambiguate_only = true;
2072 return NULL;
2077 if (*disambiguate_only)
2078 return (void *)-1;
2080 /* If we cannot constrain the size of the reference we cannot
2081 test if anything kills it. */
2082 if (!ref->max_size_known_p ())
2083 return (void *)-1;
2085 poly_int64 offset = ref->offset;
2086 poly_int64 maxsize = ref->max_size;
2088 /* We can't deduce anything useful from clobbers. */
2089 if (gimple_clobber_p (def_stmt))
2090 return (void *)-1;
2092 /* def_stmt may-defs *ref. See if we can derive a value for *ref
2093 from that definition.
2094 1) Memset. */
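/* E.g. after
     memset (&a, 0, sizeof (a));
   a load from within the cleared region is value-numbered to zero;
   for a non-zero byte pattern the replicated bytes are interpreted
   in the type of the load.  */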
2095 if (is_gimple_reg_type (vr->type)
2096 && gimple_call_builtin_p (def_stmt, BUILT_IN_MEMSET)
2097 && (integer_zerop (gimple_call_arg (def_stmt, 1))
2098 || ((TREE_CODE (gimple_call_arg (def_stmt, 1)) == INTEGER_CST
2099 || (INTEGRAL_TYPE_P (vr->type) && known_eq (ref->size, 8)))
2100 && CHAR_BIT == 8 && BITS_PER_UNIT == 8
2101 && offset.is_constant (&offseti)
2102 && offseti % BITS_PER_UNIT == 0))
2103 && poly_int_tree_p (gimple_call_arg (def_stmt, 2))
2104 && (TREE_CODE (gimple_call_arg (def_stmt, 0)) == ADDR_EXPR
2105 || TREE_CODE (gimple_call_arg (def_stmt, 0)) == SSA_NAME))
2107 tree base2;
2108 poly_int64 offset2, size2, maxsize2;
2109 bool reverse;
2110 tree ref2 = gimple_call_arg (def_stmt, 0);
2111 if (TREE_CODE (ref2) == SSA_NAME)
2113 ref2 = SSA_VAL (ref2);
2114 if (TREE_CODE (ref2) == SSA_NAME
2115 && (TREE_CODE (base) != MEM_REF
2116 || TREE_OPERAND (base, 0) != ref2))
2118 gimple *def_stmt = SSA_NAME_DEF_STMT (ref2);
2119 if (gimple_assign_single_p (def_stmt)
2120 && gimple_assign_rhs_code (def_stmt) == ADDR_EXPR)
2121 ref2 = gimple_assign_rhs1 (def_stmt);
2124 if (TREE_CODE (ref2) == ADDR_EXPR)
2126 ref2 = TREE_OPERAND (ref2, 0);
2127 base2 = get_ref_base_and_extent (ref2, &offset2, &size2, &maxsize2,
2128 &reverse);
2129 if (!known_size_p (maxsize2)
2130 || !known_eq (maxsize2, size2)
2131 || !operand_equal_p (base, base2, OEP_ADDRESS_OF))
2132 return (void *)-1;
2134 else if (TREE_CODE (ref2) == SSA_NAME)
2136 poly_int64 soff;
2137 if (TREE_CODE (base) != MEM_REF
2138 || !(mem_ref_offset (base) << LOG2_BITS_PER_UNIT).to_shwi (&soff))
2139 return (void *)-1;
2140 offset += soff;
2141 offset2 = 0;
2142 if (TREE_OPERAND (base, 0) != ref2)
2144 gimple *def = SSA_NAME_DEF_STMT (ref2);
2145 if (is_gimple_assign (def)
2146 && gimple_assign_rhs_code (def) == POINTER_PLUS_EXPR
2147 && gimple_assign_rhs1 (def) == TREE_OPERAND (base, 0)
2148 && poly_int_tree_p (gimple_assign_rhs2 (def))
2149 && (wi::to_poly_offset (gimple_assign_rhs2 (def))
2150 << LOG2_BITS_PER_UNIT).to_shwi (&offset2))
2152 ref2 = gimple_assign_rhs1 (def);
2153 if (TREE_CODE (ref2) == SSA_NAME)
2154 ref2 = SSA_VAL (ref2);
2156 else
2157 return (void *)-1;
2160 else
2161 return (void *)-1;
2162 tree len = gimple_call_arg (def_stmt, 2);
2163 if (known_subrange_p (offset, maxsize, offset2,
2164 wi::to_poly_offset (len) << LOG2_BITS_PER_UNIT))
2166 tree val;
2167 if (integer_zerop (gimple_call_arg (def_stmt, 1)))
2168 val = build_zero_cst (vr->type);
2169 else if (INTEGRAL_TYPE_P (vr->type)
2170 && known_eq (ref->size, 8))
2172 gimple_match_op res_op (gimple_match_cond::UNCOND, NOP_EXPR,
2173 vr->type, gimple_call_arg (def_stmt, 1));
2174 val = vn_nary_build_or_lookup (&res_op);
2175 if (!val
2176 || (TREE_CODE (val) == SSA_NAME
2177 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (val)))
2178 return (void *)-1;
2180 else
2182 unsigned len = TREE_INT_CST_LOW (TYPE_SIZE_UNIT (vr->type));
2183 unsigned char *buf = XALLOCAVEC (unsigned char, len);
2184 memset (buf, TREE_INT_CST_LOW (gimple_call_arg (def_stmt, 1)),
2185 len);
2186 val = native_interpret_expr (vr->type, buf, len);
2187 if (!val)
2188 return (void *)-1;
2190 return vn_reference_lookup_or_insert_for_pieces
2191 (vuse, vr->set, vr->type, vr->operands, val);
2195 /* 2) Assignment from an empty CONSTRUCTOR. */
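/* E.g. after
     a = (struct S){};
   a load from within A is value-numbered to zero.  */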
2196 else if (is_gimple_reg_type (vr->type)
2197 && gimple_assign_single_p (def_stmt)
2198 && gimple_assign_rhs_code (def_stmt) == CONSTRUCTOR
2199 && CONSTRUCTOR_NELTS (gimple_assign_rhs1 (def_stmt)) == 0)
2201 tree base2;
2202 poly_int64 offset2, size2, maxsize2;
2203 bool reverse;
2204 base2 = get_ref_base_and_extent (gimple_assign_lhs (def_stmt),
2205 &offset2, &size2, &maxsize2, &reverse);
2206 if (known_size_p (maxsize2)
2207 && known_eq (maxsize2, size2)
2208 && operand_equal_p (base, base2, 0)
2209 && known_subrange_p (offset, maxsize, offset2, size2))
2211 tree val = build_zero_cst (vr->type);
2212 return vn_reference_lookup_or_insert_for_pieces
2213 (vuse, vr->set, vr->type, vr->operands, val);
2217 /* 3) Assignment from a constant. We can use fold's native encode/interpret
2218 routines to extract the assigned bits. */
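/* E.g. after
     x = 0x01020304;
   a load of a single byte of X is computed by encoding the constant
   into its memory representation and interpreting the covered bytes
   in the type of the load.  */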
2219 else if (known_eq (ref->size, maxsize)
2220 && is_gimple_reg_type (vr->type)
2221 && !contains_storage_order_barrier_p (vr->operands)
2222 && gimple_assign_single_p (def_stmt)
2223 && CHAR_BIT == 8 && BITS_PER_UNIT == 8
2224 /* native_encode and native_decode operate on arrays of bytes
2225 and so fundamentally need a compile-time size and offset. */
2226 && maxsize.is_constant (&maxsizei)
2227 && maxsizei % BITS_PER_UNIT == 0
2228 && offset.is_constant (&offseti)
2229 && offseti % BITS_PER_UNIT == 0
2230 && (is_gimple_min_invariant (gimple_assign_rhs1 (def_stmt))
2231 || (TREE_CODE (gimple_assign_rhs1 (def_stmt)) == SSA_NAME
2232 && is_gimple_min_invariant (SSA_VAL (gimple_assign_rhs1 (def_stmt))))))
2234 tree base2;
2235 HOST_WIDE_INT offset2, size2;
2236 bool reverse;
2237 base2 = get_ref_base_and_extent_hwi (gimple_assign_lhs (def_stmt),
2238 &offset2, &size2, &reverse);
2239 if (base2
2240 && !reverse
2241 && size2 % BITS_PER_UNIT == 0
2242 && offset2 % BITS_PER_UNIT == 0
2243 && operand_equal_p (base, base2, 0)
2244 && known_subrange_p (offseti, maxsizei, offset2, size2))
2246 /* We support up to 512-bit values (for V8DFmode). */
2247 unsigned char buffer[64];
2248 int len;
2250 tree rhs = gimple_assign_rhs1 (def_stmt);
2251 if (TREE_CODE (rhs) == SSA_NAME)
2252 rhs = SSA_VAL (rhs);
2253 len = native_encode_expr (rhs,
2254 buffer, sizeof (buffer),
2255 (offseti - offset2) / BITS_PER_UNIT);
2256 if (len > 0 && len * BITS_PER_UNIT >= maxsizei)
2258 tree type = vr->type;
2259 /* Make sure to interpret in a type that has a range
2260 covering the whole access size. */
2261 if (INTEGRAL_TYPE_P (vr->type)
2262 && maxsizei != TYPE_PRECISION (vr->type))
2263 type = build_nonstandard_integer_type (maxsizei,
2264 TYPE_UNSIGNED (type));
2265 tree val = native_interpret_expr (type, buffer,
2266 maxsizei / BITS_PER_UNIT);
2267 /* If we chop off bits because the type's precision doesn't
2268 match the memory access size this is ok when optimizing
2269 reads but not when called from the DSE code during
2270 elimination. */
2271 if (val
2272 && type != vr->type)
2274 if (! int_fits_type_p (val, vr->type))
2275 val = NULL_TREE;
2276 else
2277 val = fold_convert (vr->type, val);
2280 if (val)
2281 return vn_reference_lookup_or_insert_for_pieces
2282 (vuse, vr->set, vr->type, vr->operands, val);
2287 /* 4) Assignment from an SSA name whose definition we may be able
2288 to access pieces from. */
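/* E.g. after
     x = y_1;
   a load of part of X can be expressed as a BIT_FIELD_REF of y_1
   at the corresponding offset within the store.  */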
2289 else if (known_eq (ref->size, maxsize)
2290 && is_gimple_reg_type (vr->type)
2291 && !contains_storage_order_barrier_p (vr->operands)
2292 && gimple_assign_single_p (def_stmt)
2293 && TREE_CODE (gimple_assign_rhs1 (def_stmt)) == SSA_NAME)
2295 tree base2;
2296 poly_int64 offset2, size2, maxsize2;
2297 bool reverse;
2298 base2 = get_ref_base_and_extent (gimple_assign_lhs (def_stmt),
2299 &offset2, &size2, &maxsize2,
2300 &reverse);
2301 tree def_rhs = gimple_assign_rhs1 (def_stmt);
2302 if (!reverse
2303 && known_size_p (maxsize2)
2304 && known_eq (maxsize2, size2)
2305 && operand_equal_p (base, base2, 0)
2306 && known_subrange_p (offset, maxsize, offset2, size2)
2307 /* ??? We can't handle bitfield precision extracts without
2308 either using an alternate type for the BIT_FIELD_REF and
2309 then doing a conversion or possibly adjusting the offset
2310 according to endianness. */
2311 && (! INTEGRAL_TYPE_P (vr->type)
2312 || known_eq (ref->size, TYPE_PRECISION (vr->type)))
2313 && multiple_p (ref->size, BITS_PER_UNIT)
2314 && (! INTEGRAL_TYPE_P (TREE_TYPE (def_rhs))
2315 || type_has_mode_precision_p (TREE_TYPE (def_rhs))))
2317 gimple_match_op op (gimple_match_cond::UNCOND,
2318 BIT_FIELD_REF, vr->type,
2319 vn_valueize (def_rhs),
2320 bitsize_int (ref->size),
2321 bitsize_int (offset - offset2));
2322 tree val = vn_nary_build_or_lookup (&op);
2323 if (val
2324 && (TREE_CODE (val) != SSA_NAME
2325 || ! SSA_NAME_OCCURS_IN_ABNORMAL_PHI (val)))
2327 vn_reference_t res = vn_reference_lookup_or_insert_for_pieces
2328 (vuse, vr->set, vr->type, vr->operands, val);
2329 return res;
2334 /* 5) For aggregate copies translate the reference through them if
2335 the copy kills ref. */
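/* E.g. for
     a = b;
     ... = a.x;
   the lookup of a.x is rewritten into a lookup of b.x and continued
   at the VUSE of the copy.  */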
2336 else if (vn_walk_kind == VN_WALKREWRITE
2337 && gimple_assign_single_p (def_stmt)
2338 && (DECL_P (gimple_assign_rhs1 (def_stmt))
2339 || TREE_CODE (gimple_assign_rhs1 (def_stmt)) == MEM_REF
2340 || handled_component_p (gimple_assign_rhs1 (def_stmt))))
2342 tree base2;
2343 int i, j, k;
2344 auto_vec<vn_reference_op_s> rhs;
2345 vn_reference_op_t vro;
2346 ao_ref r;
2348 if (!lhs_ref_ok)
2349 return (void *)-1;
2351 /* See if the assignment kills REF. */
2352 base2 = ao_ref_base (&lhs_ref);
2353 if (!lhs_ref.max_size_known_p ()
2354 || (base != base2
2355 && (TREE_CODE (base) != MEM_REF
2356 || TREE_CODE (base2) != MEM_REF
2357 || TREE_OPERAND (base, 0) != TREE_OPERAND (base2, 0)
2358 || !tree_int_cst_equal (TREE_OPERAND (base, 1),
2359 TREE_OPERAND (base2, 1))))
2360 || !stmt_kills_ref_p (def_stmt, ref))
2361 return (void *)-1;
2363 /* Find the common base of ref and the lhs. lhs_ops already
2364 contains valueized operands for the lhs. */
2365 i = vr->operands.length () - 1;
2366 j = lhs_ops.length () - 1;
2367 while (j >= 0 && i >= 0
2368 && vn_reference_op_eq (&vr->operands[i], &lhs_ops[j]))
2370 i--;
2371 j--;
2374 /* ??? The innermost op should always be a MEM_REF and we already
2375 checked that the assignment to the lhs kills vr. Thus for
2376 aggregate copies using char[] types the vn_reference_op_eq
2377 may fail when comparing types for compatibility. But we really
2378 don't care here - further lookups with the rewritten operands
2379 will simply fail if we messed up types too badly. */
2380 poly_int64 extra_off = 0;
2381 if (j == 0 && i >= 0
2382 && lhs_ops[0].opcode == MEM_REF
2383 && maybe_ne (lhs_ops[0].off, -1))
2385 if (known_eq (lhs_ops[0].off, vr->operands[i].off))
2386 i--, j--;
2387 else if (vr->operands[i].opcode == MEM_REF
2388 && maybe_ne (vr->operands[i].off, -1))
2390 extra_off = vr->operands[i].off - lhs_ops[0].off;
2391 i--, j--;
2395 /* i now points to the first additional op.
2396 ??? LHS may not be completely contained in VR, one or more
2397 VIEW_CONVERT_EXPRs could be in its way. We could at least
2398 try handling outermost VIEW_CONVERT_EXPRs. */
2399 if (j != -1)
2400 return (void *)-1;
2402 /* Punt if the additional ops contain a storage order barrier. */
2403 for (k = i; k >= 0; k--)
2405 vro = &vr->operands[k];
2406 if (vro->opcode == VIEW_CONVERT_EXPR && vro->reverse)
2407 return (void *)-1;
2410 /* Now re-write REF to be based on the rhs of the assignment. */
2411 copy_reference_ops_from_ref (gimple_assign_rhs1 (def_stmt), &rhs);
2413 /* Apply an extra offset to the inner MEM_REF of the RHS. */
2414 if (maybe_ne (extra_off, 0))
2416 if (rhs.length () < 2)
2417 return (void *)-1;
2418 int ix = rhs.length () - 2;
2419 if (rhs[ix].opcode != MEM_REF
2420 || known_eq (rhs[ix].off, -1))
2421 return (void *)-1;
2422 rhs[ix].off += extra_off;
2423 rhs[ix].op0 = int_const_binop (PLUS_EXPR, rhs[ix].op0,
2424 build_int_cst (TREE_TYPE (rhs[ix].op0),
2425 extra_off));
2428 /* We need to pre-pend vr->operands[0..i] to rhs. */
2429 vec<vn_reference_op_s> old = vr->operands;
2430 if (i + 1 + rhs.length () > vr->operands.length ())
2431 vr->operands.safe_grow (i + 1 + rhs.length ());
2432 else
2433 vr->operands.truncate (i + 1 + rhs.length ());
2434 FOR_EACH_VEC_ELT (rhs, j, vro)
2435 vr->operands[i + 1 + j] = *vro;
2436 vr->operands = valueize_refs (vr->operands);
2437 if (old == shared_lookup_references)
2438 shared_lookup_references = vr->operands;
2439 vr->hashcode = vn_reference_compute_hash (vr);
2441 /* Try folding the new reference to a constant. */
2442 tree val = fully_constant_vn_reference_p (vr);
2443 if (val)
2444 return vn_reference_lookup_or_insert_for_pieces
2445 (vuse, vr->set, vr->type, vr->operands, val);
2447 /* Adjust *ref from the new operands. */
2448 if (!ao_ref_init_from_vn_reference (&r, vr->set, vr->type, vr->operands))
2449 return (void *)-1;
2450 /* This can happen with bitfields. */
2451 if (maybe_ne (ref->size, r.size))
2452 return (void *)-1;
2453 *ref = r;
2455 /* Do not update last seen VUSE after translating. */
2456 last_vuse_ptr = NULL;
2458 /* Keep looking for the adjusted *REF / VR pair. */
2459 return NULL;
2462 /* 6) For memcpy copies translate the reference through them if
2463 the copy kills ref. */
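/* E.g. for
     memcpy (&a, &b, sizeof (a));
     ... = a.x;
   the lookup continues as a lookup of a MEM_REF based on &b at the
   corresponding offset.  */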
2464 else if (vn_walk_kind == VN_WALKREWRITE
2465 && is_gimple_reg_type (vr->type)
2466 /* ??? Handle BCOPY as well. */
2467 && (gimple_call_builtin_p (def_stmt, BUILT_IN_MEMCPY)
2468 || gimple_call_builtin_p (def_stmt, BUILT_IN_MEMPCPY)
2469 || gimple_call_builtin_p (def_stmt, BUILT_IN_MEMMOVE))
2470 && (TREE_CODE (gimple_call_arg (def_stmt, 0)) == ADDR_EXPR
2471 || TREE_CODE (gimple_call_arg (def_stmt, 0)) == SSA_NAME)
2472 && (TREE_CODE (gimple_call_arg (def_stmt, 1)) == ADDR_EXPR
2473 || TREE_CODE (gimple_call_arg (def_stmt, 1)) == SSA_NAME)
2474 && poly_int_tree_p (gimple_call_arg (def_stmt, 2), &copy_size))
2476 tree lhs, rhs;
2477 ao_ref r;
2478 poly_int64 rhs_offset, lhs_offset;
2479 vn_reference_op_s op;
2480 poly_uint64 mem_offset;
2481 poly_int64 at, byte_maxsize;
2483 /* Only handle non-variable, addressable refs. */
2484 if (maybe_ne (ref->size, maxsize)
2485 || !multiple_p (offset, BITS_PER_UNIT, &at)
2486 || !multiple_p (maxsize, BITS_PER_UNIT, &byte_maxsize))
2487 return (void *)-1;
2489 /* Extract a pointer base and an offset for the destination. */
2490 lhs = gimple_call_arg (def_stmt, 0);
2491 lhs_offset = 0;
2492 if (TREE_CODE (lhs) == SSA_NAME)
2494 lhs = vn_valueize (lhs);
2495 if (TREE_CODE (lhs) == SSA_NAME)
2497 gimple *def_stmt = SSA_NAME_DEF_STMT (lhs);
2498 if (gimple_assign_single_p (def_stmt)
2499 && gimple_assign_rhs_code (def_stmt) == ADDR_EXPR)
2500 lhs = gimple_assign_rhs1 (def_stmt);
2503 if (TREE_CODE (lhs) == ADDR_EXPR)
2505 tree tem = get_addr_base_and_unit_offset (TREE_OPERAND (lhs, 0),
2506 &lhs_offset);
2507 if (!tem)
2508 return (void *)-1;
2509 if (TREE_CODE (tem) == MEM_REF
2510 && poly_int_tree_p (TREE_OPERAND (tem, 1), &mem_offset))
2512 lhs = TREE_OPERAND (tem, 0);
2513 if (TREE_CODE (lhs) == SSA_NAME)
2514 lhs = vn_valueize (lhs);
2515 lhs_offset += mem_offset;
2517 else if (DECL_P (tem))
2518 lhs = build_fold_addr_expr (tem);
2519 else
2520 return (void *)-1;
2522 if (TREE_CODE (lhs) != SSA_NAME
2523 && TREE_CODE (lhs) != ADDR_EXPR)
2524 return (void *)-1;
2526 /* Extract a pointer base and an offset for the source. */
2527 rhs = gimple_call_arg (def_stmt, 1);
2528 rhs_offset = 0;
2529 if (TREE_CODE (rhs) == SSA_NAME)
2530 rhs = vn_valueize (rhs);
2531 if (TREE_CODE (rhs) == ADDR_EXPR)
2533 tree tem = get_addr_base_and_unit_offset (TREE_OPERAND (rhs, 0),
2534 &rhs_offset);
2535 if (!tem)
2536 return (void *)-1;
2537 if (TREE_CODE (tem) == MEM_REF
2538 && poly_int_tree_p (TREE_OPERAND (tem, 1), &mem_offset))
2540 rhs = TREE_OPERAND (tem, 0);
2541 rhs_offset += mem_offset;
2543 else if (DECL_P (tem)
2544 || TREE_CODE (tem) == STRING_CST)
2545 rhs = build_fold_addr_expr (tem);
2546 else
2547 return (void *)-1;
2549 if (TREE_CODE (rhs) != SSA_NAME
2550 && TREE_CODE (rhs) != ADDR_EXPR)
2551 return (void *)-1;
2553 /* The bases of the destination and the reference have to agree. */
2554 if (TREE_CODE (base) == MEM_REF)
2556 if (TREE_OPERAND (base, 0) != lhs
2557 || !poly_int_tree_p (TREE_OPERAND (base, 1), &mem_offset))
2558 return (void *) -1;
2559 at += mem_offset;
2561 else if (!DECL_P (base)
2562 || TREE_CODE (lhs) != ADDR_EXPR
2563 || TREE_OPERAND (lhs, 0) != base)
2564 return (void *)-1;
2566 /* If the access is completely outside of the memcpy destination
2567 area there is no aliasing. */
2568 if (!ranges_maybe_overlap_p (lhs_offset, copy_size, at, byte_maxsize))
2569 return NULL;
2570 /* And the access has to be contained within the memcpy destination. */
2571 if (!known_subrange_p (at, byte_maxsize, lhs_offset, copy_size))
2572 return (void *)-1;
2574 /* Make room for 2 operands in the new reference. */
2575 if (vr->operands.length () < 2)
2577 vec<vn_reference_op_s> old = vr->operands;
2578 vr->operands.safe_grow_cleared (2);
2579 if (old == shared_lookup_references)
2580 shared_lookup_references = vr->operands;
2582 else
2583 vr->operands.truncate (2);
2585 /* The looked-through reference is a simple MEM_REF. */
2586 memset (&op, 0, sizeof (op));
2587 op.type = vr->type;
2588 op.opcode = MEM_REF;
2589 op.op0 = build_int_cst (ptr_type_node, at - lhs_offset + rhs_offset);
2590 op.off = at - lhs_offset + rhs_offset;
2591 vr->operands[0] = op;
2592 op.type = TREE_TYPE (rhs);
2593 op.opcode = TREE_CODE (rhs);
2594 op.op0 = rhs;
2595 op.off = -1;
2596 vr->operands[1] = op;
2597 vr->hashcode = vn_reference_compute_hash (vr);
2599 /* Try folding the new reference to a constant. */
2600 tree val = fully_constant_vn_reference_p (vr);
2601 if (val)
2602 return vn_reference_lookup_or_insert_for_pieces
2603 (vuse, vr->set, vr->type, vr->operands, val);
2605 /* Adjust *ref from the new operands. */
2606 if (!ao_ref_init_from_vn_reference (&r, vr->set, vr->type, vr->operands))
2607 return (void *)-1;
2608 /* This can happen with bitfields. */
2609 if (maybe_ne (ref->size, r.size))
2610 return (void *)-1;
2611 *ref = r;
2613 /* Do not update last seen VUSE after translating. */
2614 last_vuse_ptr = NULL;
2616 /* Keep looking for the adjusted *REF / VR pair. */
2617 return NULL;
2620 /* Bail out and stop walking. */
2621 return (void *)-1;
2624 /* Return a reference op vector from OP that can be used for
2625 vn_reference_lookup_pieces. The caller is responsible for releasing
2626 the vector. */
2628 vec<vn_reference_op_s>
2629 vn_reference_operands_for_lookup (tree op)
2631 bool valueized;
2632 return valueize_shared_reference_ops_from_ref (op, &valueized).copy ();
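/* Example use (a sketch; REF, VUSE and RES stand for the caller's
   reference tree, VUSE SSA name and result slot):
     vn_reference_t res;
     vec<vn_reference_op_s> ops = vn_reference_operands_for_lookup (ref);
     tree val = vn_reference_lookup_pieces (vuse, get_alias_set (ref),
					    TREE_TYPE (ref), ops, &res,
					    VN_WALK);
     ops.release ();  */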
2635 /* Lookup a reference operation by its parts, in the current hash table.
2636 Returns the resulting value number if it exists in the hash table,
2637 NULL_TREE otherwise. VNRESULT will be filled in with the actual
2638 vn_reference_t stored in the hashtable if something is found. */
2640 tree
2641 vn_reference_lookup_pieces (tree vuse, alias_set_type set, tree type,
2642 vec<vn_reference_op_s> operands,
2643 vn_reference_t *vnresult, vn_lookup_kind kind)
2645 struct vn_reference_s vr1;
2646 vn_reference_t tmp;
2647 tree cst;
2649 if (!vnresult)
2650 vnresult = &tmp;
2651 *vnresult = NULL;
2653 vr1.vuse = vuse_ssa_val (vuse);
2654 shared_lookup_references.truncate (0);
2655 shared_lookup_references.safe_grow (operands.length ());
2656 memcpy (shared_lookup_references.address (),
2657 operands.address (),
2658 sizeof (vn_reference_op_s)
2659 * operands.length ());
2660 vr1.operands = operands = shared_lookup_references
2661 = valueize_refs (shared_lookup_references);
2662 vr1.type = type;
2663 vr1.set = set;
2664 vr1.hashcode = vn_reference_compute_hash (&vr1);
2665 if ((cst = fully_constant_vn_reference_p (&vr1)))
2666 return cst;
2668 vn_reference_lookup_1 (&vr1, vnresult);
2669 if (!*vnresult
2670 && kind != VN_NOWALK
2671 && vr1.vuse)
2673 ao_ref r;
2674 vn_walk_kind = kind;
2675 if (ao_ref_init_from_vn_reference (&r, set, type, vr1.operands))
2676 *vnresult =
2677 (vn_reference_t)walk_non_aliased_vuses (&r, vr1.vuse,
2678 vn_reference_lookup_2,
2679 vn_reference_lookup_3,
2680 vuse_valueize, &vr1);
2681 gcc_checking_assert (vr1.operands == shared_lookup_references);
2684 if (*vnresult)
2685 return (*vnresult)->result;
2687 return NULL_TREE;
2690 /* Lookup OP in the current hash table, and return the resulting value
2691 number if it exists in the hash table. Return NULL_TREE if it does
2692 not exist in the hash table or if the result field of the structure
2693 was NULL. VNRESULT will be filled in with the vn_reference_t
2694 stored in the hashtable if one exists. When TBAA_P is false assume
2695 we are looking up a store and treat it as having alias-set zero. */
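/* E.g. value-numbering a load could use (sketch):
     vn_reference_t res;
     tree val = vn_reference_lookup (op, gimple_vuse (stmt),
				     VN_WALKREWRITE, &res, true);
   where OP is the loaded reference and STMT the load statement.  */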
2697 tree
2698 vn_reference_lookup (tree op, tree vuse, vn_lookup_kind kind,
2699 vn_reference_t *vnresult, bool tbaa_p)
2701 vec<vn_reference_op_s> operands;
2702 struct vn_reference_s vr1;
2703 tree cst;
2704 bool valueized_anything;
2706 if (vnresult)
2707 *vnresult = NULL;
2709 vr1.vuse = vuse_ssa_val (vuse);
2710 vr1.operands = operands
2711 = valueize_shared_reference_ops_from_ref (op, &valueized_anything);
2712 vr1.type = TREE_TYPE (op);
2713 vr1.set = tbaa_p ? get_alias_set (op) : 0;
2714 vr1.hashcode = vn_reference_compute_hash (&vr1);
2715 if ((cst = fully_constant_vn_reference_p (&vr1)))
2716 return cst;
2718 if (kind != VN_NOWALK
2719 && vr1.vuse)
2721 vn_reference_t wvnresult;
2722 ao_ref r;
2723 /* Make sure to use a valueized reference if we valueized anything.
2724 Otherwise preserve the full reference for advanced TBAA. */
2725 if (!valueized_anything
2726 || !ao_ref_init_from_vn_reference (&r, vr1.set, vr1.type,
2727 vr1.operands))
2728 ao_ref_init (&r, op);
2729 if (! tbaa_p)
2730 r.ref_alias_set = r.base_alias_set = 0;
2731 vn_walk_kind = kind;
2732 wvnresult =
2733 (vn_reference_t)walk_non_aliased_vuses (&r, vr1.vuse,
2734 vn_reference_lookup_2,
2735 vn_reference_lookup_3,
2736 vuse_valueize, &vr1);
2737 gcc_checking_assert (vr1.operands == shared_lookup_references);
2738 if (wvnresult)
2740 if (vnresult)
2741 *vnresult = wvnresult;
2742 return wvnresult->result;
2745 return NULL_TREE;
2748 return vn_reference_lookup_1 (&vr1, vnresult);
2751 /* Lookup CALL in the current hash table and return the entry in
2752 *VNRESULT if found. Populates *VR for the hashtable lookup. */
2754 void
2755 vn_reference_lookup_call (gcall *call, vn_reference_t *vnresult,
2756 vn_reference_t vr)
2758 if (vnresult)
2759 *vnresult = NULL;
2761 tree vuse = gimple_vuse (call);
2763 vr->vuse = vuse ? SSA_VAL (vuse) : NULL_TREE;
2764 vr->operands = valueize_shared_reference_ops_from_call (call);
2765 vr->type = gimple_expr_type (call);
2766 vr->set = 0;
2767 vr->hashcode = vn_reference_compute_hash (vr);
2768 vn_reference_lookup_1 (vr, vnresult);
2771 /* Insert OP into the current hash table with a value number of RESULT. */
2773 static void
2774 vn_reference_insert (tree op, tree result, tree vuse, tree vdef)
2776 vn_reference_s **slot;
2777 vn_reference_t vr1;
2778 bool tem;
2780 vr1 = XOBNEW (&vn_tables_obstack, vn_reference_s);
2781 if (TREE_CODE (result) == SSA_NAME)
2782 vr1->value_id = VN_INFO (result)->value_id;
2783 else
2784 vr1->value_id = get_or_alloc_constant_value_id (result);
2785 vr1->vuse = vuse_ssa_val (vuse);
2786 vr1->operands = valueize_shared_reference_ops_from_ref (op, &tem).copy ();
2787 vr1->type = TREE_TYPE (op);
2788 vr1->set = get_alias_set (op);
2789 vr1->hashcode = vn_reference_compute_hash (vr1);
2790 vr1->result = TREE_CODE (result) == SSA_NAME ? SSA_VAL (result) : result;
2791 vr1->result_vdef = vdef;
2793 slot = valid_info->references->find_slot_with_hash (vr1, vr1->hashcode,
2794 INSERT);
2796 /* Because IL walking on reference lookup can end up visiting
2797 a def that is only to be visited later in iteration order
2798 when we are about to make an irreducible region reducible,
2799 the def can be effectively processed and its ref already inserted
2800 by vn_reference_lookup_3. So we cannot assert (!*slot)
2801 but save a lookup if we deal with already inserted refs here. */
2802 if (*slot)
2804 /* We cannot assert that we have the same value either because
2805 when disentangling an irreducible region we may end up visiting
2806 a use before the corresponding def. That's a missed optimization
2807 only though. See gcc.dg/tree-ssa/pr87126.c for example. */
2808 if (dump_file && (dump_flags & TDF_DETAILS)
2809 && !operand_equal_p ((*slot)->result, vr1->result, 0))
2811 fprintf (dump_file, "Keeping old value ");
2812 print_generic_expr (dump_file, (*slot)->result);
2813 fprintf (dump_file, " because of collision\n");
2815 free_reference (vr1);
2816 obstack_free (&vn_tables_obstack, vr1);
2817 return;
2820 *slot = vr1;
2821 vr1->next = last_inserted_ref;
2822 last_inserted_ref = vr1;
2825 /* Insert a reference by its pieces into the current hash table with
2826 a value number of RESULT. Return the resulting reference
2827 structure we created. */
2829 vn_reference_t
2830 vn_reference_insert_pieces (tree vuse, alias_set_type set, tree type,
2831 vec<vn_reference_op_s> operands,
2832 tree result, unsigned int value_id)
2835 vn_reference_s **slot;
2836 vn_reference_t vr1;
2838 vr1 = XOBNEW (&vn_tables_obstack, vn_reference_s);
2839 vr1->value_id = value_id;
2840 vr1->vuse = vuse_ssa_val (vuse);
2841 vr1->operands = valueize_refs (operands);
2842 vr1->type = type;
2843 vr1->set = set;
2844 vr1->hashcode = vn_reference_compute_hash (vr1);
2845 if (result && TREE_CODE (result) == SSA_NAME)
2846 result = SSA_VAL (result);
2847 vr1->result = result;
2849 slot = valid_info->references->find_slot_with_hash (vr1, vr1->hashcode,
2850 INSERT);
2852 /* At this point we should have all the things inserted that we have
2853 seen before, and we should never try inserting something that
2854 already exists. */
2855 gcc_assert (!*slot);
2857 *slot = vr1;
2858 vr1->next = last_inserted_ref;
2859 last_inserted_ref = vr1;
2860 return vr1;
2863 /* Compute and return the hash value for nary operation VNO1. */
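/* Operands are canonicalized as part of computing the hash so that,
   e.g., a_1 + b_2 and b_2 + a_1 receive the same hash, as do
   a_1 < b_2 and b_2 > a_1 (with the comparison code swapped).  */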
2865 static hashval_t
2866 vn_nary_op_compute_hash (const vn_nary_op_t vno1)
2868 inchash::hash hstate;
2869 unsigned i;
2871 for (i = 0; i < vno1->length; ++i)
2872 if (TREE_CODE (vno1->op[i]) == SSA_NAME)
2873 vno1->op[i] = SSA_VAL (vno1->op[i]);
2875 if (((vno1->length == 2
2876 && commutative_tree_code (vno1->opcode))
2877 || (vno1->length == 3
2878 && commutative_ternary_tree_code (vno1->opcode)))
2879 && tree_swap_operands_p (vno1->op[0], vno1->op[1]))
2880 std::swap (vno1->op[0], vno1->op[1]);
2881 else if (TREE_CODE_CLASS (vno1->opcode) == tcc_comparison
2882 && tree_swap_operands_p (vno1->op[0], vno1->op[1]))
2884 std::swap (vno1->op[0], vno1->op[1]);
2885 vno1->opcode = swap_tree_comparison (vno1->opcode);
2888 hstate.add_int (vno1->opcode);
2889 for (i = 0; i < vno1->length; ++i)
2890 inchash::add_expr (vno1->op[i], hstate);
2892 return hstate.end ();
2895 /* Compare nary operations VNO1 and VNO2 and return true if they are
2896 equivalent. */
2898 bool
2899 vn_nary_op_eq (const_vn_nary_op_t const vno1, const_vn_nary_op_t const vno2)
2901 unsigned i;
2903 if (vno1->hashcode != vno2->hashcode)
2904 return false;
2906 if (vno1->length != vno2->length)
2907 return false;
2909 if (vno1->opcode != vno2->opcode
2910 || !types_compatible_p (vno1->type, vno2->type))
2911 return false;
2913 for (i = 0; i < vno1->length; ++i)
2914 if (!expressions_equal_p (vno1->op[i], vno2->op[i]))
2915 return false;
2917 /* BIT_INSERT_EXPR has an implicit operand as the type precision
2918 of op1. Need to check to make sure they are the same. */
2919 if (vno1->opcode == BIT_INSERT_EXPR
2920 && TREE_CODE (vno1->op[1]) == INTEGER_CST
2921 && TYPE_PRECISION (TREE_TYPE (vno1->op[1]))
2922 != TYPE_PRECISION (TREE_TYPE (vno2->op[1])))
2923 return false;
2925 return true;
2928 /* Initialize VNO from the pieces provided. */
2930 static void
2931 init_vn_nary_op_from_pieces (vn_nary_op_t vno, unsigned int length,
2932 enum tree_code code, tree type, tree *ops)
2934 vno->opcode = code;
2935 vno->length = length;
2936 vno->type = type;
2937 memcpy (&vno->op[0], ops, sizeof (tree) * length);
2940 /* Initialize VNO from OP. */
2942 static void
2943 init_vn_nary_op_from_op (vn_nary_op_t vno, tree op)
2945 unsigned i;
2947 vno->opcode = TREE_CODE (op);
2948 vno->length = TREE_CODE_LENGTH (TREE_CODE (op));
2949 vno->type = TREE_TYPE (op);
2950 for (i = 0; i < vno->length; ++i)
2951 vno->op[i] = TREE_OPERAND (op, i);
2954 /* Return the number of operands for a vn_nary ops structure from STMT. */
2956 static unsigned int
2957 vn_nary_length_from_stmt (gimple *stmt)
2959 switch (gimple_assign_rhs_code (stmt))
2961 case REALPART_EXPR:
2962 case IMAGPART_EXPR:
2963 case VIEW_CONVERT_EXPR:
2964 return 1;
2966 case BIT_FIELD_REF:
2967 return 3;
2969 case CONSTRUCTOR:
2970 return CONSTRUCTOR_NELTS (gimple_assign_rhs1 (stmt));
2972 default:
2973 return gimple_num_ops (stmt) - 1;
2977 /* Initialize VNO from STMT. */
2979 static void
2980 init_vn_nary_op_from_stmt (vn_nary_op_t vno, gimple *stmt)
2982 unsigned i;
2984 vno->opcode = gimple_assign_rhs_code (stmt);
2985 vno->type = gimple_expr_type (stmt);
2986 switch (vno->opcode)
2988 case REALPART_EXPR:
2989 case IMAGPART_EXPR:
2990 case VIEW_CONVERT_EXPR:
2991 vno->length = 1;
2992 vno->op[0] = TREE_OPERAND (gimple_assign_rhs1 (stmt), 0);
2993 break;
2995 case BIT_FIELD_REF:
2996 vno->length = 3;
2997 vno->op[0] = TREE_OPERAND (gimple_assign_rhs1 (stmt), 0);
2998 vno->op[1] = TREE_OPERAND (gimple_assign_rhs1 (stmt), 1);
2999 vno->op[2] = TREE_OPERAND (gimple_assign_rhs1 (stmt), 2);
3000 break;
3002 case CONSTRUCTOR:
3003 vno->length = CONSTRUCTOR_NELTS (gimple_assign_rhs1 (stmt));
3004 for (i = 0; i < vno->length; ++i)
3005 vno->op[i] = CONSTRUCTOR_ELT (gimple_assign_rhs1 (stmt), i)->value;
3006 break;
3008 default:
3009 gcc_checking_assert (!gimple_assign_single_p (stmt));
3010 vno->length = gimple_num_ops (stmt) - 1;
3011 for (i = 0; i < vno->length; ++i)
3012 vno->op[i] = gimple_op (stmt, i + 1);
3016 /* Compute the hashcode for VNO and look for it in the hash table;
3017 return the resulting value number if it exists in the hash table.
3018 Return NULL_TREE if it does not exist in the hash table or if the
3019 result field of the operation is NULL. VNRESULT will contain the
3020 vn_nary_op_t from the hashtable if it exists. */
3022 static tree
3023 vn_nary_op_lookup_1 (vn_nary_op_t vno, vn_nary_op_t *vnresult)
3025 vn_nary_op_s **slot;
3027 if (vnresult)
3028 *vnresult = NULL;
3030 vno->hashcode = vn_nary_op_compute_hash (vno);
3031 slot = valid_info->nary->find_slot_with_hash (vno, vno->hashcode, NO_INSERT);
3032 if (!slot)
3033 return NULL_TREE;
3034 if (vnresult)
3035 *vnresult = *slot;
3036 return (*slot)->predicated_values ? NULL_TREE : (*slot)->u.result;
3039 /* Lookup an n-ary operation by its pieces and return the resulting value
3040 number if it exists in the hash table. Return NULL_TREE if it does
3041 not exist in the hash table or if the result field of the operation
3042 is NULL. VNRESULT will contain the vn_nary_op_t from the hashtable
3043 if it exists. */
3045 tree
3046 vn_nary_op_lookup_pieces (unsigned int length, enum tree_code code,
3047 tree type, tree *ops, vn_nary_op_t *vnresult)
3049 vn_nary_op_t vno1 = XALLOCAVAR (struct vn_nary_op_s,
3050 sizeof_vn_nary_op (length));
3051 init_vn_nary_op_from_pieces (vno1, length, code, type, ops);
3052 return vn_nary_op_lookup_1 (vno1, vnresult);
3055 /* Lookup OP in the current hash table, and return the resulting value
3056 number if it exists in the hash table. Return NULL_TREE if it does
3057 not exist in the hash table or if the result field of the operation
3058 is NULL. VNRESULT will contain the vn_nary_op_t from the hashtable
3059 if it exists. */
3061 tree
3062 vn_nary_op_lookup (tree op, vn_nary_op_t *vnresult)
3064 vn_nary_op_t vno1
3065 = XALLOCAVAR (struct vn_nary_op_s,
3066 sizeof_vn_nary_op (TREE_CODE_LENGTH (TREE_CODE (op))));
3067 init_vn_nary_op_from_op (vno1, op);
3068 return vn_nary_op_lookup_1 (vno1, vnresult);
3071 /* Lookup the rhs of STMT in the current hash table, and return the resulting
3072 value number if it exists in the hash table. Return NULL_TREE if
3073 it does not exist in the hash table. VNRESULT will contain the
3074 vn_nary_op_t from the hashtable if it exists. */
3076 tree
3077 vn_nary_op_lookup_stmt (gimple *stmt, vn_nary_op_t *vnresult)
3079 vn_nary_op_t vno1
3080 = XALLOCAVAR (struct vn_nary_op_s,
3081 sizeof_vn_nary_op (vn_nary_length_from_stmt (stmt)));
3082 init_vn_nary_op_from_stmt (vno1, stmt);
3083 return vn_nary_op_lookup_1 (vno1, vnresult);
3086 /* Allocate a vn_nary_op_t with LENGTH operands on STACK. */
3088 static vn_nary_op_t
3089 alloc_vn_nary_op_noinit (unsigned int length, struct obstack *stack)
3091 return (vn_nary_op_t) obstack_alloc (stack, sizeof_vn_nary_op (length));
3094 /* Allocate and initialize a vn_nary_op_t on the
3095 vn_tables_obstack. */
3097 static vn_nary_op_t
3098 alloc_vn_nary_op (unsigned int length, tree result, unsigned int value_id)
3100 vn_nary_op_t vno1 = alloc_vn_nary_op_noinit (length, &vn_tables_obstack);
3102 vno1->value_id = value_id;
3103 vno1->length = length;
3104 vno1->predicated_values = 0;
3105 vno1->u.result = result;
3107 return vno1;
3110 /* Insert VNO into TABLE. If COMPUTE_HASH is true, then compute
3111 VNO->HASHCODE first. */
3113 static vn_nary_op_t
3114 vn_nary_op_insert_into (vn_nary_op_t vno, vn_nary_op_table_type *table,
3115 bool compute_hash)
3117 vn_nary_op_s **slot;
3119 if (compute_hash)
3121 vno->hashcode = vn_nary_op_compute_hash (vno);
3122 gcc_assert (! vno->predicated_values
3123 || (! vno->u.values->next
3124 && vno->u.values->n == 1));
3127 slot = table->find_slot_with_hash (vno, vno->hashcode, INSERT);
3128 vno->unwind_to = *slot;
3129 if (*slot)
3131 /* Prefer non-predicated values.
3132 ??? Only if those are constant, otherwise, with constant predicated
3133 value, turn them into predicated values with entry-block validity
3134 (??? but we always find the first valid result currently). */
3135 if ((*slot)->predicated_values
3136 && ! vno->predicated_values)
3138 /* ??? We cannot remove *slot from the unwind stack list.
3139 For the moment we deal with this by skipping not found
3140 entries but this isn't ideal ... */
3141 *slot = vno;
3142 /* ??? Maintain a stack of states we can unwind in
3143 vn_nary_op_s? But how far do we unwind? In reality
3144 we need to push change records somewhere... Or not
3145 unwind vn_nary_op_s and linking them but instead
3146 unwind the results "list", linking that, which also
3147 doesn't move on hashtable resize. */
3148 /* We can also have a ->unwind_to recording *slot there.
3149 That way we can make u.values a fixed size array with
3150 recording the number of entries but of course we then
3151 have always N copies for each unwind_to-state. Or we
3152 make sure to only ever append and each unwinding will
3153 pop off one entry (but how to deal with predicated
3154 replaced with non-predicated here?) */
3155 vno->next = last_inserted_nary;
3156 last_inserted_nary = vno;
3157 return vno;
3159 else if (vno->predicated_values
3160 && ! (*slot)->predicated_values)
3161 return *slot;
3162 else if (vno->predicated_values
3163 && (*slot)->predicated_values)
3165 /* ??? Factor this all into a insert_single_predicated_value
3166 routine. */
3167 gcc_assert (!vno->u.values->next && vno->u.values->n == 1);
3168 basic_block vno_bb
3169 = BASIC_BLOCK_FOR_FN (cfun, vno->u.values->valid_dominated_by_p[0]);
3170 vn_pval *nval = vno->u.values;
3171 vn_pval **next = &vno->u.values;
3172 bool found = false;
3173 for (vn_pval *val = (*slot)->u.values; val; val = val->next)
3175 if (expressions_equal_p (val->result, vno->u.values->result))
3177 found = true;
3178 for (unsigned i = 0; i < val->n; ++i)
3180 basic_block val_bb
3181 = BASIC_BLOCK_FOR_FN (cfun,
3182 val->valid_dominated_by_p[i]);
3183 if (dominated_by_p (CDI_DOMINATORS, vno_bb, val_bb))
3184 /* Value registered with more generic predicate. */
3185 return *slot;
3186 else if (dominated_by_p (CDI_DOMINATORS, val_bb, vno_bb))
3187 /* Shouldn't happen, we insert in RPO order. */
3188 gcc_unreachable ();
3190 /* Append value. */
3191 *next = (vn_pval *) obstack_alloc (&vn_tables_obstack,
3192 sizeof (vn_pval)
3193 + val->n * sizeof (int));
3194 (*next)->next = NULL;
3195 (*next)->result = val->result;
3196 (*next)->n = val->n + 1;
3197 memcpy ((*next)->valid_dominated_by_p,
3198 val->valid_dominated_by_p,
3199 val->n * sizeof (int));
3200 (*next)->valid_dominated_by_p[val->n] = vno_bb->index;
3201 next = &(*next)->next;
3202 if (dump_file && (dump_flags & TDF_DETAILS))
3203 fprintf (dump_file, "Appending predicate to value.\n");
3204 continue;
3206 /* Copy other predicated values. */
3207 *next = (vn_pval *) obstack_alloc (&vn_tables_obstack,
3208 sizeof (vn_pval)
3209 + (val->n-1) * sizeof (int));
3210 memcpy (*next, val, sizeof (vn_pval) + (val->n-1) * sizeof (int));
3211 (*next)->next = NULL;
3212 next = &(*next)->next;
3214 if (!found)
3215 *next = nval;
3217 *slot = vno;
3218 vno->next = last_inserted_nary;
3219 last_inserted_nary = vno;
3220 return vno;
3223 /* While we do not want to insert things twice it's awkward to
3224 avoid it in the case where visit_nary_op pattern-matches stuff
3225 and ends up simplifying the replacement to itself. We then
3226 get two inserts, one from visit_nary_op and one from
3227 vn_nary_build_or_lookup.
3228 So allow inserts with the same value number. */
3229 if ((*slot)->u.result == vno->u.result)
3230 return *slot;
3233 /* ??? There's also optimistic vs. previous committed state merging
3234 that is problematic for the case of unwinding. */
3236 /* ??? We should return NULL if we do not use 'vno' and have the
3237 caller release it. */
3238 gcc_assert (!*slot);
3240 *slot = vno;
3241 vno->next = last_inserted_nary;
3242 last_inserted_nary = vno;
3243 return vno;
3246 /* Insert an n-ary operation into the current hash table using its
3247 pieces. Return the vn_nary_op_t structure we created and put in
3248 the hashtable. */
3250 vn_nary_op_t
3251 vn_nary_op_insert_pieces (unsigned int length, enum tree_code code,
3252 tree type, tree *ops,
3253 tree result, unsigned int value_id)
3255 vn_nary_op_t vno1 = alloc_vn_nary_op (length, result, value_id);
3256 init_vn_nary_op_from_pieces (vno1, length, code, type, ops);
3257 return vn_nary_op_insert_into (vno1, valid_info->nary, true);
3260 static vn_nary_op_t
3261 vn_nary_op_insert_pieces_predicated (unsigned int length, enum tree_code code,
3262 tree type, tree *ops,
3263 tree result, unsigned int value_id,
3264 edge pred_e)
3266 /* ??? Currently tracking BBs. */
3267 if (! single_pred_p (pred_e->dest))
3269 /* Never record for backedges. */
3270 if (pred_e->flags & EDGE_DFS_BACK)
3271 return NULL;
3272 edge_iterator ei;
3273 edge e;
3274 int cnt = 0;
3275 /* Ignore backedges. */
3276 FOR_EACH_EDGE (e, ei, pred_e->dest->preds)
3277 if (! dominated_by_p (CDI_DOMINATORS, e->src, e->dest))
3278 cnt++;
3279 if (cnt != 1)
3280 return NULL;
3282 if (dump_file && (dump_flags & TDF_DETAILS)
3283 /* ??? Fix dumping, but currently we only get comparisons. */
3284 && TREE_CODE_CLASS (code) == tcc_comparison)
3286 fprintf (dump_file, "Recording on edge %d->%d ", pred_e->src->index,
3287 pred_e->dest->index);
3288 print_generic_expr (dump_file, ops[0], TDF_SLIM);
3289 fprintf (dump_file, " %s ", get_tree_code_name (code));
3290 print_generic_expr (dump_file, ops[1], TDF_SLIM);
3291 fprintf (dump_file, " == %s\n",
3292 integer_zerop (result) ? "false" : "true");
3294 vn_nary_op_t vno1 = alloc_vn_nary_op (length, NULL_TREE, value_id);
3295 init_vn_nary_op_from_pieces (vno1, length, code, type, ops);
3296 vno1->predicated_values = 1;
3297 vno1->u.values = (vn_pval *) obstack_alloc (&vn_tables_obstack,
3298 sizeof (vn_pval));
3299 vno1->u.values->next = NULL;
3300 vno1->u.values->result = result;
3301 vno1->u.values->n = 1;
3302 vno1->u.values->valid_dominated_by_p[0] = pred_e->dest->index;
3303 return vn_nary_op_insert_into (vno1, valid_info->nary, true);
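/* For example, when processing the true edge out of
     if (a_1 != 0)
   we record the predicated value a_1 != 0 == true, valid in blocks
   dominated by the destination of that edge.  */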
3306 static bool
3307 dominated_by_p_w_unex (basic_block bb1, basic_block bb2);
3309 static tree
3310 vn_nary_op_get_predicated_value (vn_nary_op_t vno, basic_block bb)
3312 if (! vno->predicated_values)
3313 return vno->u.result;
3314 for (vn_pval *val = vno->u.values; val; val = val->next)
3315 for (unsigned i = 0; i < val->n; ++i)
3316 if (dominated_by_p_w_unex (bb,
3317 BASIC_BLOCK_FOR_FN
3318 (cfun, val->valid_dominated_by_p[i])))
3319 return val->result;
3320 return NULL_TREE;
3323 /* Insert OP into the current hash table with a value number of
3324 RESULT. Return the vn_nary_op_t structure we created and put in
3325 the hashtable. */
3327 vn_nary_op_t
3328 vn_nary_op_insert (tree op, tree result)
3330 unsigned length = TREE_CODE_LENGTH (TREE_CODE (op));
3331 vn_nary_op_t vno1;
3333 vno1 = alloc_vn_nary_op (length, result, VN_INFO (result)->value_id);
3334 init_vn_nary_op_from_op (vno1, op);
3335 return vn_nary_op_insert_into (vno1, valid_info->nary, true);
3338 /* Insert the rhs of STMT into the current hash table with a value number of
3339 RESULT. */
3341 static vn_nary_op_t
3342 vn_nary_op_insert_stmt (gimple *stmt, tree result)
3344 vn_nary_op_t vno1
3345 = alloc_vn_nary_op (vn_nary_length_from_stmt (stmt),
3346 result, VN_INFO (result)->value_id);
3347 init_vn_nary_op_from_stmt (vno1, stmt);
3348 return vn_nary_op_insert_into (vno1, valid_info->nary, true);
3351 /* Compute a hashcode for PHI operation VP1 and return it. */
3353 static inline hashval_t
3354 vn_phi_compute_hash (vn_phi_t vp1)
3356 inchash::hash hstate (EDGE_COUNT (vp1->block->preds) > 2
3357 ? vp1->block->index : EDGE_COUNT (vp1->block->preds));
3358 tree phi1op;
3359 tree type;
3360 edge e;
3361 edge_iterator ei;
3363 /* If all PHI arguments are constants we need to distinguish
3364 the PHI node via its type. */
3365 type = vp1->type;
3366 hstate.merge_hash (vn_hash_type (type));
3368 FOR_EACH_EDGE (e, ei, vp1->block->preds)
3370 /* Don't hash backedge values; they need to be handled as VN_TOP
3371 for optimistic value-numbering. */
3372 if (e->flags & EDGE_DFS_BACK)
3373 continue;
3375 phi1op = vp1->phiargs[e->dest_idx];
3376 if (phi1op == VN_TOP)
3377 continue;
3378 inchash::add_expr (phi1op, hstate);
3381 return hstate.end ();
3385 /* Return true if COND1 and COND2 represent the same condition, set
3386 *INVERTED_P if one needs to be inverted to make it the same as
3387 the other. */
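/* E.g. a_1 < b_2 and b_2 > a_1 represent the same condition while
   a_1 < b_2 and a_1 >= b_2 are inverses of each other (NaN handling
   permitting).  */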
3389 static bool
3390 cond_stmts_equal_p (gcond *cond1, tree lhs1, tree rhs1,
3391 gcond *cond2, tree lhs2, tree rhs2, bool *inverted_p)
3393 enum tree_code code1 = gimple_cond_code (cond1);
3394 enum tree_code code2 = gimple_cond_code (cond2);
3396 *inverted_p = false;
3397 if (code1 == code2)
3399 else if (code1 == swap_tree_comparison (code2))
3400 std::swap (lhs2, rhs2);
3401 else if (code1 == invert_tree_comparison (code2, HONOR_NANS (lhs2)))
3402 *inverted_p = true;
3403 else if (code1 == invert_tree_comparison
3404 (swap_tree_comparison (code2), HONOR_NANS (lhs2)))
3406 std::swap (lhs2, rhs2);
3407 *inverted_p = true;
3409 else
3410 return false;
3412 return ((expressions_equal_p (lhs1, lhs2)
3413 && expressions_equal_p (rhs1, rhs2))
3414 || (commutative_tree_code (code1)
3415 && expressions_equal_p (lhs1, rhs2)
3416 && expressions_equal_p (rhs1, lhs2)));
3419 /* Compare two phi entries for equality, ignoring VN_TOP arguments. */
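/* In particular, for the two-predecessor case PHIs in different
   blocks merging the same values under the same (or inverted)
   controlling condition compare equal, with arguments matched via
   the true/false controlled edges.  */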
3421 static int
3422 vn_phi_eq (const_vn_phi_t const vp1, const_vn_phi_t const vp2)
3424 if (vp1->hashcode != vp2->hashcode)
3425 return false;
3427 if (vp1->block != vp2->block)
3429 if (EDGE_COUNT (vp1->block->preds) != EDGE_COUNT (vp2->block->preds))
3430 return false;
3432 switch (EDGE_COUNT (vp1->block->preds))
3434 case 1:
3435 /* Single-arg PHIs are just copies. */
3436 break;
3438 case 2:
3440 /* Rule out backedges into the PHI. */
3441 if (vp1->block->loop_father->header == vp1->block
3442 || vp2->block->loop_father->header == vp2->block)
3443 return false;
3445 /* If the PHI nodes do not have compatible types
3446 they are not the same. */
3447 if (!types_compatible_p (vp1->type, vp2->type))
3448 return false;
3450 basic_block idom1
3451 = get_immediate_dominator (CDI_DOMINATORS, vp1->block);
3452 basic_block idom2
3453 = get_immediate_dominator (CDI_DOMINATORS, vp2->block);
3454 /* If the immediate dominators end in switch stmts, multiple
3455 values may end up in the same PHI arg via intermediate
3456 CFG merges. */
3457 if (EDGE_COUNT (idom1->succs) != 2
3458 || EDGE_COUNT (idom2->succs) != 2)
3459 return false;
3461 /* Verify the controlling stmt is the same. */
3462 gcond *last1 = safe_dyn_cast <gcond *> (last_stmt (idom1));
3463 gcond *last2 = safe_dyn_cast <gcond *> (last_stmt (idom2));
3464 if (! last1 || ! last2)
3465 return false;
3466 bool inverted_p;
3467 if (! cond_stmts_equal_p (last1, vp1->cclhs, vp1->ccrhs,
3468 last2, vp2->cclhs, vp2->ccrhs,
3469 &inverted_p))
3470 return false;
3472 /* Get at true/false controlled edges into the PHI. */
3473 edge te1, te2, fe1, fe2;
3474 if (! extract_true_false_controlled_edges (idom1, vp1->block,
3475 &te1, &fe1)
3476 || ! extract_true_false_controlled_edges (idom2, vp2->block,
3477 &te2, &fe2))
3478 return false;
3480 /* Swap edges if the second condition is the inverted of the
3481 first. */
3482 if (inverted_p)
3483 std::swap (te2, fe2);
3485 /* ??? Handle VN_TOP specially. */
3486 if (! expressions_equal_p (vp1->phiargs[te1->dest_idx],
3487 vp2->phiargs[te2->dest_idx])
3488 || ! expressions_equal_p (vp1->phiargs[fe1->dest_idx],
3489 vp2->phiargs[fe2->dest_idx]))
3490 return false;
3492 return true;
3495 default:
3496 return false;
3500 /* If the PHI nodes do not have compatible types
3501 they are not the same. */
3502 if (!types_compatible_p (vp1->type, vp2->type))
3503 return false;
3505 /* Any phi in the same block will have its arguments in the
3506 same edge order, because of how we store phi nodes. */
3507 for (unsigned i = 0; i < EDGE_COUNT (vp1->block->preds); ++i)
3509 tree phi1op = vp1->phiargs[i];
3510 tree phi2op = vp2->phiargs[i];
3511 if (phi1op == VN_TOP || phi2op == VN_TOP)
3512 continue;
3513 if (!expressions_equal_p (phi1op, phi2op))
3514 return false;
3517 return true;
3520 /* Lookup PHI in the current hash table, and return the resulting
3521 value number if it exists in the hash table. Return NULL_TREE if
3522 it does not exist in the hash table. */
3524 static tree
3525 vn_phi_lookup (gimple *phi, bool backedges_varying_p)
3527 vn_phi_s **slot;
3528 struct vn_phi_s *vp1;
3529 edge e;
3530 edge_iterator ei;
3532 vp1 = XALLOCAVAR (struct vn_phi_s,
3533 sizeof (struct vn_phi_s)
3534 + (gimple_phi_num_args (phi) - 1) * sizeof (tree));
3536 /* Canonicalize the SSA_NAME's to their value number. */
3537 FOR_EACH_EDGE (e, ei, gimple_bb (phi)->preds)
3539 tree def = PHI_ARG_DEF_FROM_EDGE (phi, e);
3540 if (TREE_CODE (def) == SSA_NAME
3541 && (!backedges_varying_p || !(e->flags & EDGE_DFS_BACK)))
3542 def = SSA_VAL (def);
3543 vp1->phiargs[e->dest_idx] = def;
3545 vp1->type = TREE_TYPE (gimple_phi_result (phi));
3546 vp1->block = gimple_bb (phi);
3547 /* Extract values of the controlling condition. */
3548 vp1->cclhs = NULL_TREE;
3549 vp1->ccrhs = NULL_TREE;
3550 basic_block idom1 = get_immediate_dominator (CDI_DOMINATORS, vp1->block);
3551 if (EDGE_COUNT (idom1->succs) == 2)
3552 if (gcond *last1 = safe_dyn_cast <gcond *> (last_stmt (idom1)))
3554 /* ??? We want to use SSA_VAL here. But possibly not
3555 allow VN_TOP. */
3556 vp1->cclhs = vn_valueize (gimple_cond_lhs (last1));
3557 vp1->ccrhs = vn_valueize (gimple_cond_rhs (last1));
3559 vp1->hashcode = vn_phi_compute_hash (vp1);
3560 slot = valid_info->phis->find_slot_with_hash (vp1, vp1->hashcode, NO_INSERT);
3561 if (!slot)
3562 return NULL_TREE;
3563 return (*slot)->result;
3566 /* Insert PHI into the current hash table with a value number of
3567 RESULT. */
3569 static vn_phi_t
3570 vn_phi_insert (gimple *phi, tree result, bool backedges_varying_p)
3572 vn_phi_s **slot;
3573 vn_phi_t vp1 = (vn_phi_t) obstack_alloc (&vn_tables_obstack,
3574 sizeof (vn_phi_s)
3575 + ((gimple_phi_num_args (phi) - 1)
3576 * sizeof (tree)));
3577 edge e;
3578 edge_iterator ei;
3580 /* Canonicalize the SSA_NAME's to their value number. */
3581 FOR_EACH_EDGE (e, ei, gimple_bb (phi)->preds)
3583 tree def = PHI_ARG_DEF_FROM_EDGE (phi, e);
3584 if (TREE_CODE (def) == SSA_NAME
3585 && (!backedges_varying_p || !(e->flags & EDGE_DFS_BACK)))
3586 def = SSA_VAL (def);
3587 vp1->phiargs[e->dest_idx] = def;
3589 vp1->value_id = VN_INFO (result)->value_id;
3590 vp1->type = TREE_TYPE (gimple_phi_result (phi));
3591 vp1->block = gimple_bb (phi);
3592 /* Extract values of the controlling condition. */
3593 vp1->cclhs = NULL_TREE;
3594 vp1->ccrhs = NULL_TREE;
3595 basic_block idom1 = get_immediate_dominator (CDI_DOMINATORS, vp1->block);
3596 if (EDGE_COUNT (idom1->succs) == 2)
3597 if (gcond *last1 = safe_dyn_cast <gcond *> (last_stmt (idom1)))
3599 /* ??? We want to use SSA_VAL here. But possibly not
3600 allow VN_TOP. */
3601 vp1->cclhs = vn_valueize (gimple_cond_lhs (last1));
3602 vp1->ccrhs = vn_valueize (gimple_cond_rhs (last1));
3604 vp1->result = result;
3605 vp1->hashcode = vn_phi_compute_hash (vp1);
3607 slot = valid_info->phis->find_slot_with_hash (vp1, vp1->hashcode, INSERT);
3608 gcc_assert (!*slot);
3610 *slot = vp1;
3611 vp1->next = last_inserted_phi;
3612 last_inserted_phi = vp1;
3613 return vp1;
3617 /* Return true if BB1 is dominated by BB2 taking into account edges
3618 that are not executable. */
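/* E.g. when the edge into the else arm of an if is not executable,
   the join block after the if is, for value-numbering purposes,
   treated as dominated by the then arm.  */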
3620 static bool
3621 dominated_by_p_w_unex (basic_block bb1, basic_block bb2)
3623 edge_iterator ei;
3624 edge e;
3626 if (dominated_by_p (CDI_DOMINATORS, bb1, bb2))
3627 return true;
3629 /* Before iterating we'd like to know if there exists an
3630 (executable) path from bb2 to bb1 at all; if not we can
3631 directly return false. For now simply iterate once. */
3633 /* Iterate to the single executable bb1 predecessor. */
3634 if (EDGE_COUNT (bb1->preds) > 1)
3636 edge prede = NULL;
3637 FOR_EACH_EDGE (e, ei, bb1->preds)
3638 if (e->flags & EDGE_EXECUTABLE)
3640 if (prede)
3642 prede = NULL;
3643 break;
3645 prede = e;
3647 if (prede)
3649 bb1 = prede->src;
3651 /* Re-do the dominance check with changed bb1. */
3652 if (dominated_by_p (CDI_DOMINATORS, bb1, bb2))
3653 return true;
3657 /* Iterate to the single executable bb2 successor. */
3658 edge succe = NULL;
3659 FOR_EACH_EDGE (e, ei, bb2->succs)
3660 if (e->flags & EDGE_EXECUTABLE)
3662 if (succe)
3664 succe = NULL;
3665 break;
3667 succe = e;
3669 if (succe)
3671 /* Verify the reached block is only reached through succe.
3672 If there is only one edge we can spare us the dominator
3673 check and iterate directly. */
3674 if (EDGE_COUNT (succe->dest->preds) > 1)
3676 FOR_EACH_EDGE (e, ei, succe->dest->preds)
3677 if (e != succe
3678 && (e->flags & EDGE_EXECUTABLE))
3680 succe = NULL;
3681 break;
3684 if (succe)
3686 bb2 = succe->dest;
3688 /* Re-do the dominance check with changed bb2. */
3689 if (dominated_by_p (CDI_DOMINATORS, bb1, bb2))
3690 return true;
3694 /* We could now iterate updating bb1 / bb2. */
3695 return false;
3698 /* Set the value number of FROM to TO, return true if it has changed
3699 as a result. */
3701 static inline bool
3702 set_ssa_val_to (tree from, tree to)
3704 vn_ssa_aux_t from_info = VN_INFO (from);
3705 tree currval = from_info->valnum; // SSA_VAL (from)
3706 poly_int64 toff, coff;
3708 /* The only things we allow as value numbers are ssa_names
3709 and invariants. So assert that here. We don't allow VN_TOP
3710 as visiting a stmt should produce a value-number other than
3711 that.
3712 ??? Still VN_TOP can happen for unreachable code, so force
3713 it to varying in that case. Not all code is prepared to
3714 get VN_TOP on valueization. */
3715 if (to == VN_TOP)
3717 /* ??? When iterating and visiting PHI <undef, backedge-value>
3718 for the first time we rightfully get VN_TOP and we need to
3719 preserve that to optimize for example gcc.dg/tree-ssa/ssa-sccvn-2.c.
3720 With SCCVN we were simply lucky we iterated the other PHI
3721 cycles first and thus visited the backedge-value DEF. */
3722 if (currval == VN_TOP)
3723 goto set_and_exit;
3724 if (dump_file && (dump_flags & TDF_DETAILS))
3725 fprintf (dump_file, "Forcing value number to varying on "
3726 "receiving VN_TOP\n");
3727 to = from;
3730 gcc_checking_assert (to != NULL_TREE
3731 && ((TREE_CODE (to) == SSA_NAME
3732 && (to == from || SSA_VAL (to) == to))
3733 || is_gimple_min_invariant (to)));
3735 if (from != to)
3737 if (currval == from)
3739 if (dump_file && (dump_flags & TDF_DETAILS))
3741 fprintf (dump_file, "Not changing value number of ");
3742 print_generic_expr (dump_file, from);
3743 fprintf (dump_file, " from VARYING to ");
3744 print_generic_expr (dump_file, to);
3745 fprintf (dump_file, "\n");
3747 return false;
3749 else if (currval != VN_TOP
3750 && ! is_gimple_min_invariant (currval)
3751 && ! ssa_undefined_value_p (currval, false)
3752 && is_gimple_min_invariant (to))
3754 if (dump_file && (dump_flags & TDF_DETAILS))
3756 fprintf (dump_file, "Forcing VARYING instead of changing "
3757 "value number of ");
3758 print_generic_expr (dump_file, from);
3759 fprintf (dump_file, " from ");
3760 print_generic_expr (dump_file, currval);
3761 fprintf (dump_file, " (non-constant) to ");
3762 print_generic_expr (dump_file, to);
3763 fprintf (dump_file, " (constant)\n");
3765 to = from;
3767 else if (TREE_CODE (to) == SSA_NAME
3768 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (to))
3769 to = from;
3772 set_and_exit:
3773 if (dump_file && (dump_flags & TDF_DETAILS))
3775 fprintf (dump_file, "Setting value number of ");
3776 print_generic_expr (dump_file, from);
3777 fprintf (dump_file, " to ");
3778 print_generic_expr (dump_file, to);
3781 if (currval != to
3782 && !operand_equal_p (currval, to, 0)
3783 /* Different undefined SSA names are not actually different. See
3784 PR82320 for a testcase where we'd otherwise not terminate iteration. */
3785 && !(TREE_CODE (currval) == SSA_NAME
3786 && TREE_CODE (to) == SSA_NAME
3787 && ssa_undefined_value_p (currval, false)
3788 && ssa_undefined_value_p (to, false))
3789 /* ??? For addresses involving volatile objects or types operand_equal_p
3790 does not reliably detect ADDR_EXPRs as equal. We know we are only
3791 getting invariant gimple addresses here, so can use
3792 get_addr_base_and_unit_offset to do this comparison. */
3793 && !(TREE_CODE (currval) == ADDR_EXPR
3794 && TREE_CODE (to) == ADDR_EXPR
3795 && (get_addr_base_and_unit_offset (TREE_OPERAND (currval, 0), &coff)
3796 == get_addr_base_and_unit_offset (TREE_OPERAND (to, 0), &toff))
3797 && known_eq (coff, toff)))
3799 if (dump_file && (dump_flags & TDF_DETAILS))
3800 fprintf (dump_file, " (changed)\n");
3801 from_info->valnum = to;
3802 return true;
3804 if (dump_file && (dump_flags & TDF_DETAILS))
3805 fprintf (dump_file, "\n");
3806 return false;
3809 /* Set all definitions in STMT to value number to themselves.
3810 Return true if a value number changed. */
3812 static bool
3813 defs_to_varying (gimple *stmt)
3815 bool changed = false;
3816 ssa_op_iter iter;
3817 def_operand_p defp;
3819 FOR_EACH_SSA_DEF_OPERAND (defp, stmt, iter, SSA_OP_ALL_DEFS)
3821 tree def = DEF_FROM_PTR (defp);
3822 changed |= set_ssa_val_to (def, def);
3824 return changed;
3827 /* Visit a copy between LHS and RHS, return true if the value number
3828 changed. */
3830 static bool
3831 visit_copy (tree lhs, tree rhs)
3833 /* Valueize. */
3834 rhs = SSA_VAL (rhs);
3836 return set_ssa_val_to (lhs, rhs);
3839 /* Lookup a value for OP in type WIDE_TYPE where the value in the type
3840 of OP is the same. */
3842 static tree
3843 valueized_wider_op (tree wide_type, tree op)
3845 if (TREE_CODE (op) == SSA_NAME)
3846 op = vn_valueize (op);
3848 /* Either we have the op widened available. */
3849 tree ops[3] = {};
3850 ops[0] = op;
3851 tree tem = vn_nary_op_lookup_pieces (1, NOP_EXPR,
3852 wide_type, ops, NULL);
3853 if (tem)
3854 return tem;
3856 /* Or the op is truncated from some existing value. */
3857 if (TREE_CODE (op) == SSA_NAME)
3859 gimple *def = SSA_NAME_DEF_STMT (op);
3860 if (is_gimple_assign (def)
3861 && CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (def)))
3863 tem = gimple_assign_rhs1 (def);
3864 if (useless_type_conversion_p (wide_type, TREE_TYPE (tem)))
3866 if (TREE_CODE (tem) == SSA_NAME)
3867 tem = vn_valueize (tem);
3868 return tem;
3873 /* For constants simply extend it. */
3874 if (TREE_CODE (op) == INTEGER_CST)
3875 return wide_int_to_tree (wide_type, wi::to_wide (op));
3877 return NULL_TREE;
3880 /* Visit a nary operator RHS, value number it, and return true if the
3881 value number of LHS has changed as a result. */
3883 static bool
3884 visit_nary_op (tree lhs, gassign *stmt)
3886 vn_nary_op_t vnresult;
3887 tree result = vn_nary_op_lookup_stmt (stmt, &vnresult);
3888 if (! result && vnresult)
3889 result = vn_nary_op_get_predicated_value (vnresult, gimple_bb (stmt));
3890 if (result)
3891 return set_ssa_val_to (lhs, result);
3893 /* Do some special pattern matching for redundancies of operations
3894 in different types. */
3895 enum tree_code code = gimple_assign_rhs_code (stmt);
3896 tree type = TREE_TYPE (lhs);
3897 tree rhs1 = gimple_assign_rhs1 (stmt);
3898 switch (code)
3900 CASE_CONVERT:
3901 /* Match arithmetic done in a different type where we can easily
3902 substitute the result from some earlier sign-changed or widened
3903 operation. */
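/* For example (illustrative GIMPLE, names made up):

     unsigned short _1 = _2 + _3;
     unsigned int _4 = (unsigned int) _1;

   If a wider addition of the zero-extended values of _2 and _3 is
   already available as, say, _5, then _4 can be valued as
   _5 & 0xffff; for a pure sign-change the result is just (type) _5.  */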
3904 if (INTEGRAL_TYPE_P (type)
3905 && TREE_CODE (rhs1) == SSA_NAME
3906 /* We only handle sign-changes or zero-extension -> & mask. */
3907 && ((TYPE_UNSIGNED (TREE_TYPE (rhs1))
3908 && TYPE_PRECISION (type) > TYPE_PRECISION (TREE_TYPE (rhs1)))
3909 || TYPE_PRECISION (type) == TYPE_PRECISION (TREE_TYPE (rhs1))))
3911 gassign *def = dyn_cast <gassign *> (SSA_NAME_DEF_STMT (rhs1));
3912 if (def
3913 && (gimple_assign_rhs_code (def) == PLUS_EXPR
3914 || gimple_assign_rhs_code (def) == MINUS_EXPR
3915 || gimple_assign_rhs_code (def) == MULT_EXPR))
3917 tree ops[3] = {};
3918 /* Either we have the op widened available. */
3919 ops[0] = valueized_wider_op (type,
3920 gimple_assign_rhs1 (def));
3921 if (ops[0])
3922 ops[1] = valueized_wider_op (type,
3923 gimple_assign_rhs2 (def));
3924 if (ops[0] && ops[1])
3926 ops[0] = vn_nary_op_lookup_pieces
3927 (2, gimple_assign_rhs_code (def), type, ops, NULL);
3928 /* We have wider operation available. */
3929 if (ops[0]
3930 /* If the leader is a wrapping operation we can
3931 insert it for code hoisting w/o introducing
3932 undefined overflow. If it is not it has to
3933 be available. See PR86554. */
3934 && (TYPE_OVERFLOW_WRAPS (TREE_TYPE (ops[0]))
3935 || (rpo_avail && vn_context_bb
3936 && rpo_avail->eliminate_avail (vn_context_bb,
3937 ops[0]))))
3939 unsigned lhs_prec = TYPE_PRECISION (type);
3940 unsigned rhs_prec = TYPE_PRECISION (TREE_TYPE (rhs1));
3941 if (lhs_prec == rhs_prec)
3943 gimple_match_op match_op (gimple_match_cond::UNCOND,
3944 NOP_EXPR, type, ops[0]);
3945 result = vn_nary_build_or_lookup (&match_op);
3946 if (result)
3948 bool changed = set_ssa_val_to (lhs, result);
3949 vn_nary_op_insert_stmt (stmt, result);
3950 return changed;
3953 else
3955 tree mask = wide_int_to_tree
3956 (type, wi::mask (rhs_prec, false, lhs_prec));
3957 gimple_match_op match_op (gimple_match_cond::UNCOND,
3958 BIT_AND_EXPR,
3959 TREE_TYPE (lhs),
3960 ops[0], mask);
3961 result = vn_nary_build_or_lookup (&match_op);
3962 if (result)
3964 bool changed = set_ssa_val_to (lhs, result);
3965 vn_nary_op_insert_stmt (stmt, result);
3966 return changed;
3973 default:;
3976 bool changed = set_ssa_val_to (lhs, lhs);
3977 vn_nary_op_insert_stmt (stmt, lhs);
3978 return changed;
3981 /* Visit a call STMT storing into LHS. Return true if the value number
3982 of the LHS has changed as a result. */
3984 static bool
3985 visit_reference_op_call (tree lhs, gcall *stmt)
3987 bool changed = false;
3988 struct vn_reference_s vr1;
3989 vn_reference_t vnresult = NULL;
3990 tree vdef = gimple_vdef (stmt);
3992 /* Non-ssa lhs is handled in copy_reference_ops_from_call. */
3993 if (lhs && TREE_CODE (lhs) != SSA_NAME)
3994 lhs = NULL_TREE;
3996 vn_reference_lookup_call (stmt, &vnresult, &vr1);
3997 if (vnresult)
3999 if (vnresult->result_vdef && vdef)
4000 changed |= set_ssa_val_to (vdef, vnresult->result_vdef);
4001 else if (vdef)
4002 /* If the call was discovered to be pure or const reflect
4003 that as far as possible. */
4004 changed |= set_ssa_val_to (vdef, vuse_ssa_val (gimple_vuse (stmt)));
4006 if (!vnresult->result && lhs)
4007 vnresult->result = lhs;
4009 if (vnresult->result && lhs)
4010 changed |= set_ssa_val_to (lhs, vnresult->result);
4012 else
4014 vn_reference_t vr2;
4015 vn_reference_s **slot;
4016 tree vdef_val = vdef;
4017 if (vdef)
4019 /* If we value numbered the function of an indirect call to
4020 one not clobbering memory, value number its VDEF to its
4021 VUSE. */
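/* E.g. if the called SSA name was value numbered to &foo where foo is
   const or pure, the call does not clobber memory and its VDEF can be
   given the value of its VUSE (illustrative scenario).  */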
4022 tree fn = gimple_call_fn (stmt);
4023 if (fn && TREE_CODE (fn) == SSA_NAME)
4025 fn = SSA_VAL (fn);
4026 if (TREE_CODE (fn) == ADDR_EXPR
4027 && TREE_CODE (TREE_OPERAND (fn, 0)) == FUNCTION_DECL
4028 && (flags_from_decl_or_type (TREE_OPERAND (fn, 0))
4029 & (ECF_CONST | ECF_PURE)))
4030 vdef_val = vuse_ssa_val (gimple_vuse (stmt));
4032 changed |= set_ssa_val_to (vdef, vdef_val);
4034 if (lhs)
4035 changed |= set_ssa_val_to (lhs, lhs);
4036 vr2 = XOBNEW (&vn_tables_obstack, vn_reference_s);
4037 vr2->vuse = vr1.vuse;
4038 /* As we are not walking the virtual operand chain we know the
4039 shared_lookup_references are still original so we can re-use
4040 them here. */
4041 vr2->operands = vr1.operands.copy ();
4042 vr2->type = vr1.type;
4043 vr2->set = vr1.set;
4044 vr2->hashcode = vr1.hashcode;
4045 vr2->result = lhs;
4046 vr2->result_vdef = vdef_val;
4047 slot = valid_info->references->find_slot_with_hash (vr2, vr2->hashcode,
4048 INSERT);
4049 gcc_assert (!*slot);
4050 *slot = vr2;
4051 vr2->next = last_inserted_ref;
4052 last_inserted_ref = vr2;
4055 return changed;
4058 /* Visit a load from a reference operator RHS, part of STMT, value number it,
4059 and return true if the value number of the LHS has changed as a result. */
4061 static bool
4062 visit_reference_op_load (tree lhs, tree op, gimple *stmt)
4064 bool changed = false;
4065 tree last_vuse;
4066 tree result;
4068 last_vuse = gimple_vuse (stmt);
4069 last_vuse_ptr = &last_vuse;
4070 result = vn_reference_lookup (op, gimple_vuse (stmt),
4071 default_vn_walk_kind, NULL, true);
4072 last_vuse_ptr = NULL;
4074 /* We handle type-punning through unions by value-numbering based
4075 on offset and size of the access. Be prepared to handle a
4076 type-mismatch here via creating a VIEW_CONVERT_EXPR. */
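/* For instance, reading the float member of a union { int i; float f; }
   right after a store to the int member can be valued to the stored
   int value wrapped in VIEW_CONVERT_EXPR <float> (illustrative
   example only).  */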
4077 if (result
4078 && !useless_type_conversion_p (TREE_TYPE (result), TREE_TYPE (op)))
4080 /* We will be setting the value number of lhs to the value number
4081 of VIEW_CONVERT_EXPR <TREE_TYPE (result)> (result).
4082 So first simplify and lookup this expression to see if it
4083 is already available. */
4084 gimple_match_op res_op (gimple_match_cond::UNCOND,
4085 VIEW_CONVERT_EXPR, TREE_TYPE (op), result);
4086 result = vn_nary_build_or_lookup (&res_op);
4087 /* When building the conversion fails avoid inserting the reference
4088 again. */
4089 if (!result)
4090 return set_ssa_val_to (lhs, lhs);
4093 if (result)
4094 changed = set_ssa_val_to (lhs, result);
4095 else
4097 changed = set_ssa_val_to (lhs, lhs);
4098 vn_reference_insert (op, lhs, last_vuse, NULL_TREE);
4101 return changed;
4105 /* Visit a store to a reference operator LHS, part of STMT, value number it,
4106 and return true if the value number of the LHS has changed as a result. */
4108 static bool
4109 visit_reference_op_store (tree lhs, tree op, gimple *stmt)
4111 bool changed = false;
4112 vn_reference_t vnresult = NULL;
4113 tree assign;
4114 bool resultsame = false;
4115 tree vuse = gimple_vuse (stmt);
4116 tree vdef = gimple_vdef (stmt);
4118 if (TREE_CODE (op) == SSA_NAME)
4119 op = SSA_VAL (op);
4121 /* First we want to lookup using the *vuses* from the store and see
4122 if the last store to this location with the same address
4123 had the same value.
4125 The vuses represent the memory state before the store. If the
4126 memory state, address, and value of the store are the same as the
4127 last store to this location, then this store will produce the
4128 same memory state as that store.
4130 In this case the vdef versions for this store are value numbered to those
4131 vuse versions, since they represent the same memory state after
4132 this store.
4134 Otherwise, the vdefs for the store are used when inserting into
4135 the table, since the store generates a new memory state. */
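/* A rough illustration (made-up GIMPLE):

     # .MEM_2 = VDEF <.MEM_1>
     *p_3 = x_4;
     ...
     # .MEM_6 = VDEF <.MEM_5>
     *p_3 = x_4;

   If the lookup with vuse .MEM_5 shows the location already holds the
   value x_4, the second store is redundant and .MEM_6 is value
   numbered to the value of .MEM_5.  */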
4137 vn_reference_lookup (lhs, vuse, VN_NOWALK, &vnresult, false);
4138 if (vnresult
4139 && vnresult->result)
4141 tree result = vnresult->result;
4142 gcc_checking_assert (TREE_CODE (result) != SSA_NAME
4143 || result == SSA_VAL (result));
4144 resultsame = expressions_equal_p (result, op);
4145 if (resultsame)
4147 /* If the TBAA state isn't compatible for downstream reads
4148 we cannot value-number the VDEFs the same. */
4149 alias_set_type set = get_alias_set (lhs);
4150 if (vnresult->set != set
4151 && ! alias_set_subset_of (set, vnresult->set))
4152 resultsame = false;
4156 if (!resultsame)
4158 /* Only perform the following when being called from PRE
4159 which embeds tail merging. */
4160 if (default_vn_walk_kind == VN_WALK)
4162 assign = build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, op);
4163 vn_reference_lookup (assign, vuse, VN_NOWALK, &vnresult, false);
4164 if (vnresult)
4166 VN_INFO (vdef)->visited = true;
4167 return set_ssa_val_to (vdef, vnresult->result_vdef);
4171 if (dump_file && (dump_flags & TDF_DETAILS))
4173 fprintf (dump_file, "No store match\n");
4174 fprintf (dump_file, "Value numbering store ");
4175 print_generic_expr (dump_file, lhs);
4176 fprintf (dump_file, " to ");
4177 print_generic_expr (dump_file, op);
4178 fprintf (dump_file, "\n");
4180 /* Have to set value numbers before insert, since insert is
4181 going to valueize the references in-place. */
4182 if (vdef)
4183 changed |= set_ssa_val_to (vdef, vdef);
4185 /* Do not insert structure copies into the tables. */
4186 if (is_gimple_min_invariant (op)
4187 || is_gimple_reg (op))
4188 vn_reference_insert (lhs, op, vdef, NULL);
4190 /* Only perform the following when being called from PRE
4191 which embeds tail merging. */
4192 if (default_vn_walk_kind == VN_WALK)
4194 assign = build2 (MODIFY_EXPR, TREE_TYPE (lhs), lhs, op);
4195 vn_reference_insert (assign, lhs, vuse, vdef);
4198 else
4200 /* We had a match, so value number the vdef to have the value
4201 number of the vuse it came from. */
4203 if (dump_file && (dump_flags & TDF_DETAILS))
4204 fprintf (dump_file, "Store matched earlier value, "
4205 "value numbering store vdefs to matching vuses.\n");
4207 changed |= set_ssa_val_to (vdef, SSA_VAL (vuse));
4210 return changed;
4213 /* Visit and value number PHI, return true if the value number
4214 changed. When BACKEDGES_VARYING_P is true then assume all
4215 backedge values are varying. When INSERTED is not NULL then
4216 this is just an ahead query for a possible iteration, set INSERTED
4217 to true if we'd insert into the hashtable. */
4219 static bool
4220 visit_phi (gimple *phi, bool *inserted, bool backedges_varying_p)
4222 tree result, sameval = VN_TOP, seen_undef = NULL_TREE;
4223 tree backedge_val = NULL_TREE;
4224 bool seen_non_backedge = false;
4225 tree sameval_base = NULL_TREE;
4226 poly_int64 soff, doff;
4227 unsigned n_executable = 0;
4228 edge_iterator ei;
4229 edge e;
4231 /* TODO: We could check for this in initialization, and replace this
4232 with a gcc_assert. */
4233 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi)))
4234 return set_ssa_val_to (PHI_RESULT (phi), PHI_RESULT (phi));
4236 /* We track whether a PHI was CSEd to, to avoid excessive iterations
4237 that would be necessary only because the PHI changed arguments
4238 but not value. */
4239 if (!inserted)
4240 gimple_set_plf (phi, GF_PLF_1, false);
4242 /* See if all non-TOP arguments have the same value. TOP is
4243 equivalent to everything, so we can ignore it. */
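/* E.g. for x_4 = PHI <x_1(2), x_1(3), x_2(5)> where the edge from
   block 5 is not executable, both remaining arguments have value x_1
   and the PHI result can be valued to x_1 (illustrative numbers).  */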
4244 FOR_EACH_EDGE (e, ei, gimple_bb (phi)->preds)
4245 if (e->flags & EDGE_EXECUTABLE)
4247 tree def = PHI_ARG_DEF_FROM_EDGE (phi, e);
4249 ++n_executable;
4250 if (TREE_CODE (def) == SSA_NAME)
4252 if (!backedges_varying_p || !(e->flags & EDGE_DFS_BACK))
4253 def = SSA_VAL (def);
4254 if (e->flags & EDGE_DFS_BACK)
4255 backedge_val = def;
4257 if (!(e->flags & EDGE_DFS_BACK))
4258 seen_non_backedge = true;
4259 if (def == VN_TOP)
4261 /* Ignore undefined defs for sameval but record one. */
4262 else if (TREE_CODE (def) == SSA_NAME
4263 && ! virtual_operand_p (def)
4264 && ssa_undefined_value_p (def, false))
4265 seen_undef = def;
4266 else if (sameval == VN_TOP)
4267 sameval = def;
4268 else if (!expressions_equal_p (def, sameval))
4270 /* We know we're arriving only with invariant addresses here,
4271 try harder comparing them. We can do some caching here
4272 which we cannot do in expressions_equal_p. */
4273 if (TREE_CODE (def) == ADDR_EXPR
4274 && TREE_CODE (sameval) == ADDR_EXPR
4275 && sameval_base != (void *)-1)
4277 if (!sameval_base)
4278 sameval_base = get_addr_base_and_unit_offset
4279 (TREE_OPERAND (sameval, 0), &soff);
4280 if (!sameval_base)
4281 sameval_base = (tree)(void *)-1;
4282 else if ((get_addr_base_and_unit_offset
4283 (TREE_OPERAND (def, 0), &doff) == sameval_base)
4284 && known_eq (soff, doff))
4285 continue;
4287 sameval = NULL_TREE;
4288 break;
4292 /* If the value we want to use is flowing over the backedge and we
4293 should take it as VARYING but it has a non-VARYING value drop to
4294 VARYING.
4295 If we value-number a virtual operand, never value-number to the
4296 value from the backedge as that confuses the alias-walking code.
4297 See gcc.dg/torture/pr87176.c. If the value is the same on a
4298 non-backedge everything is OK though. */
4299 bool visited_p;
4300 if ((backedge_val
4301 && !seen_non_backedge
4302 && TREE_CODE (backedge_val) == SSA_NAME
4303 && sameval == backedge_val
4304 && (SSA_NAME_IS_VIRTUAL_OPERAND (backedge_val)
4305 || SSA_VAL (backedge_val) != backedge_val))
4306 /* Do not value-number a virtual operand to sth not visited though
4307 given that allows us to escape a region in alias walking. */
4308 || (sameval
4309 && TREE_CODE (sameval) == SSA_NAME
4310 && !SSA_NAME_IS_DEFAULT_DEF (sameval)
4311 && SSA_NAME_IS_VIRTUAL_OPERAND (sameval)
4312 && (SSA_VAL (sameval, &visited_p), !visited_p)))
4313 /* Note this just drops to VARYING without inserting the PHI into
4314 the hashes. */
4315 result = PHI_RESULT (phi);
4316 /* If none of the edges was executable keep the value-number at VN_TOP,
4317 if only a single edge is executable use its value. */
4318 else if (n_executable <= 1)
4319 result = seen_undef ? seen_undef : sameval;
4320 /* If we saw only undefined values and VN_TOP use one of the
4321 undefined values. */
4322 else if (sameval == VN_TOP)
4323 result = seen_undef ? seen_undef : sameval;
4324 /* First see if it is equivalent to a phi node in this block. We prefer
4325 this as it allows IV elimination - see PRs 66502 and 67167. */
4326 else if ((result = vn_phi_lookup (phi, backedges_varying_p)))
4328 if (!inserted
4329 && TREE_CODE (result) == SSA_NAME
4330 && gimple_code (SSA_NAME_DEF_STMT (result)) == GIMPLE_PHI)
4332 gimple_set_plf (SSA_NAME_DEF_STMT (result), GF_PLF_1, true);
4333 if (dump_file && (dump_flags & TDF_DETAILS))
4335 fprintf (dump_file, "Marking CSEd to PHI node ");
4336 print_gimple_expr (dump_file, SSA_NAME_DEF_STMT (result),
4337 0, TDF_SLIM);
4338 fprintf (dump_file, "\n");
4342 /* If all values are the same use that, unless we've seen undefined
4343 values as well and the value isn't constant.
4344 CCP/copyprop have the same restriction to not remove uninit warnings. */
4345 else if (sameval
4346 && (! seen_undef || is_gimple_min_invariant (sameval)))
4347 result = sameval;
4348 else
4350 result = PHI_RESULT (phi);
4351 /* Only insert PHIs that are varying, for constant value numbers
4352 we mess up equivalences otherwise as we are only comparing
4353 the immediate controlling predicates. */
4354 vn_phi_insert (phi, result, backedges_varying_p);
4355 if (inserted)
4356 *inserted = true;
4359 return set_ssa_val_to (PHI_RESULT (phi), result);
4362 /* Try to simplify RHS using equivalences and constant folding. */
4364 static tree
4365 try_to_simplify (gassign *stmt)
4367 enum tree_code code = gimple_assign_rhs_code (stmt);
4368 tree tem;
4370 /* For stores we can end up simplifying a SSA_NAME rhs. Just return
4371 in this case, there is no point in doing extra work. */
4372 if (code == SSA_NAME)
4373 return NULL_TREE;
4375 /* First try constant folding based on our current lattice. */
4376 mprts_hook = vn_lookup_simplify_result;
4377 tem = gimple_fold_stmt_to_constant_1 (stmt, vn_valueize, vn_valueize);
4378 mprts_hook = NULL;
4379 if (tem
4380 && (TREE_CODE (tem) == SSA_NAME
4381 || is_gimple_min_invariant (tem)))
4382 return tem;
4384 return NULL_TREE;
4387 /* Visit and value number STMT, return true if the value number
4388 changed. */
4390 static bool
4391 visit_stmt (gimple *stmt, bool backedges_varying_p = false)
4393 bool changed = false;
4395 if (dump_file && (dump_flags & TDF_DETAILS))
4397 fprintf (dump_file, "Value numbering stmt = ");
4398 print_gimple_stmt (dump_file, stmt, 0);
4401 if (gimple_code (stmt) == GIMPLE_PHI)
4402 changed = visit_phi (stmt, NULL, backedges_varying_p);
4403 else if (gimple_has_volatile_ops (stmt))
4404 changed = defs_to_varying (stmt);
4405 else if (gassign *ass = dyn_cast <gassign *> (stmt))
4407 enum tree_code code = gimple_assign_rhs_code (ass);
4408 tree lhs = gimple_assign_lhs (ass);
4409 tree rhs1 = gimple_assign_rhs1 (ass);
4410 tree simplified;
4412 /* Shortcut for copies. Simplifying copies is pointless,
4413 since we copy the expression and value they represent. */
4414 if (code == SSA_NAME
4415 && TREE_CODE (lhs) == SSA_NAME)
4417 changed = visit_copy (lhs, rhs1);
4418 goto done;
4420 simplified = try_to_simplify (ass);
4421 if (simplified)
4423 if (dump_file && (dump_flags & TDF_DETAILS))
4425 fprintf (dump_file, "RHS ");
4426 print_gimple_expr (dump_file, ass, 0);
4427 fprintf (dump_file, " simplified to ");
4428 print_generic_expr (dump_file, simplified);
4429 fprintf (dump_file, "\n");
4432 /* Setting value numbers to constants will occasionally
4433 screw up phi congruence because constants are not
4434 uniquely associated with a single ssa name that can be
4435 looked up. */
4436 if (simplified
4437 && is_gimple_min_invariant (simplified)
4438 && TREE_CODE (lhs) == SSA_NAME)
4440 changed = set_ssa_val_to (lhs, simplified);
4441 goto done;
4443 else if (simplified
4444 && TREE_CODE (simplified) == SSA_NAME
4445 && TREE_CODE (lhs) == SSA_NAME)
4447 changed = visit_copy (lhs, simplified);
4448 goto done;
4451 if ((TREE_CODE (lhs) == SSA_NAME
4452 /* We can substitute SSA_NAMEs that are live over
4453 abnormal edges with their constant value. */
4454 && !(gimple_assign_copy_p (ass)
4455 && is_gimple_min_invariant (rhs1))
4456 && !(simplified
4457 && is_gimple_min_invariant (simplified))
4458 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs))
4459 /* Stores or copies from SSA_NAMEs that are live over
4460 abnormal edges are a problem. */
4461 || (code == SSA_NAME
4462 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (rhs1)))
4463 changed = defs_to_varying (ass);
4464 else if (REFERENCE_CLASS_P (lhs)
4465 || DECL_P (lhs))
4466 changed = visit_reference_op_store (lhs, rhs1, ass);
4467 else if (TREE_CODE (lhs) == SSA_NAME)
4469 if ((gimple_assign_copy_p (ass)
4470 && is_gimple_min_invariant (rhs1))
4471 || (simplified
4472 && is_gimple_min_invariant (simplified)))
4474 if (simplified)
4475 changed = set_ssa_val_to (lhs, simplified);
4476 else
4477 changed = set_ssa_val_to (lhs, rhs1);
4479 else
4481 /* Visit the original statement. */
4482 switch (vn_get_stmt_kind (ass))
4484 case VN_NARY:
4485 changed = visit_nary_op (lhs, ass);
4486 break;
4487 case VN_REFERENCE:
4488 changed = visit_reference_op_load (lhs, rhs1, ass);
4489 break;
4490 default:
4491 changed = defs_to_varying (ass);
4492 break;
4496 else
4497 changed = defs_to_varying (ass);
4499 else if (gcall *call_stmt = dyn_cast <gcall *> (stmt))
4501 tree lhs = gimple_call_lhs (call_stmt);
4502 if (lhs && TREE_CODE (lhs) == SSA_NAME)
4504 /* Try constant folding based on our current lattice. */
4505 tree simplified = gimple_fold_stmt_to_constant_1 (call_stmt,
4506 vn_valueize);
4507 if (simplified)
4509 if (dump_file && (dump_flags & TDF_DETAILS))
4511 fprintf (dump_file, "call ");
4512 print_gimple_expr (dump_file, call_stmt, 0);
4513 fprintf (dump_file, " simplified to ");
4514 print_generic_expr (dump_file, simplified);
4515 fprintf (dump_file, "\n");
4518 /* Setting value numbers to constants will occasionally
4519 screw up phi congruence because constants are not
4520 uniquely associated with a single ssa name that can be
4521 looked up. */
4522 if (simplified
4523 && is_gimple_min_invariant (simplified))
4525 changed = set_ssa_val_to (lhs, simplified);
4526 if (gimple_vdef (call_stmt))
4527 changed |= set_ssa_val_to (gimple_vdef (call_stmt),
4528 SSA_VAL (gimple_vuse (call_stmt)));
4529 goto done;
4531 else if (simplified
4532 && TREE_CODE (simplified) == SSA_NAME)
4534 changed = visit_copy (lhs, simplified);
4535 if (gimple_vdef (call_stmt))
4536 changed |= set_ssa_val_to (gimple_vdef (call_stmt),
4537 SSA_VAL (gimple_vuse (call_stmt)));
4538 goto done;
4540 else if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs))
4542 changed = defs_to_varying (call_stmt);
4543 goto done;
4547 /* Pick up flags from a devirtualization target. */
4548 tree fn = gimple_call_fn (stmt);
4549 int extra_fnflags = 0;
4550 if (fn && TREE_CODE (fn) == SSA_NAME)
4552 fn = SSA_VAL (fn);
4553 if (TREE_CODE (fn) == ADDR_EXPR
4554 && TREE_CODE (TREE_OPERAND (fn, 0)) == FUNCTION_DECL)
4555 extra_fnflags = flags_from_decl_or_type (TREE_OPERAND (fn, 0));
4557 if (!gimple_call_internal_p (call_stmt)
4558 && (/* Calls to the same function with the same vuse
4559 and the same operands do not necessarily return the same
4560 value, unless they're pure or const. */
4561 ((gimple_call_flags (call_stmt) | extra_fnflags)
4562 & (ECF_PURE | ECF_CONST))
4563 /* If calls have a vdef, subsequent calls won't have
4564 the same incoming vuse. So, if 2 calls with vdef have the
4565 same vuse, we know they're not subsequent.
4566 We can give 2 calls to the same function with the same
4567 vuse and the same operands, which are not subsequent, the
4568 same value number, because there is no code in the program
4569 that can compare the 2 values...
4570 || (gimple_vdef (call_stmt)
4571 /* ... unless the call returns a pointer which does
4572 not alias with anything else. In which case the
4573 information that the values are distinct is encoded
4574 in the IL. */
4575 && !(gimple_call_return_flags (call_stmt) & ERF_NOALIAS)
4576 /* Only perform the following when being called from PRE
4577 which embeds tail merging. */
4578 && default_vn_walk_kind == VN_WALK)))
4579 changed = visit_reference_op_call (lhs, call_stmt);
4580 else
4581 changed = defs_to_varying (call_stmt);
4583 else
4584 changed = defs_to_varying (stmt);
4585 done:
4586 return changed;
4590 /* Allocate a value number table. */
4592 static void
4593 allocate_vn_table (vn_tables_t table, unsigned size)
4595 table->phis = new vn_phi_table_type (size);
4596 table->nary = new vn_nary_op_table_type (size);
4597 table->references = new vn_reference_table_type (size);
4600 /* Free a value number table. */
4602 static void
4603 free_vn_table (vn_tables_t table)
4605 /* Walk over elements and release vectors. */
4606 vn_reference_iterator_type hir;
4607 vn_reference_t vr;
4608 FOR_EACH_HASH_TABLE_ELEMENT (*table->references, vr, vn_reference_t, hir)
4609 vr->operands.release ();
4610 delete table->phis;
4611 table->phis = NULL;
4612 delete table->nary;
4613 table->nary = NULL;
4614 delete table->references;
4615 table->references = NULL;
4618 /* Set *ID according to RESULT. */
4620 static void
4621 set_value_id_for_result (tree result, unsigned int *id)
4623 if (result && TREE_CODE (result) == SSA_NAME)
4624 *id = VN_INFO (result)->value_id;
4625 else if (result && is_gimple_min_invariant (result))
4626 *id = get_or_alloc_constant_value_id (result);
4627 else
4628 *id = get_next_value_id ();
4631 /* Set the value ids in the valid hash tables. */
4633 static void
4634 set_hashtable_value_ids (void)
4636 vn_nary_op_iterator_type hin;
4637 vn_phi_iterator_type hip;
4638 vn_reference_iterator_type hir;
4639 vn_nary_op_t vno;
4640 vn_reference_t vr;
4641 vn_phi_t vp;
4643 /* Now set the value ids of the things we had put in the hash
4644 table. */
4646 FOR_EACH_HASH_TABLE_ELEMENT (*valid_info->nary, vno, vn_nary_op_t, hin)
4647 if (! vno->predicated_values)
4648 set_value_id_for_result (vno->u.result, &vno->value_id);
4650 FOR_EACH_HASH_TABLE_ELEMENT (*valid_info->phis, vp, vn_phi_t, hip)
4651 set_value_id_for_result (vp->result, &vp->value_id);
4653 FOR_EACH_HASH_TABLE_ELEMENT (*valid_info->references, vr, vn_reference_t,
4654 hir)
4655 set_value_id_for_result (vr->result, &vr->value_id);
4658 /* Return the maximum value id we have ever seen. */
4660 unsigned int
4661 get_max_value_id (void)
4663 return next_value_id;
4666 /* Return the next unique value id. */
4668 unsigned int
4669 get_next_value_id (void)
4671 return next_value_id++;
4675 /* Compare two expressions E1 and E2 and return true if they are equal. */
4677 bool
4678 expressions_equal_p (tree e1, tree e2)
4680 /* The obvious case. */
4681 if (e1 == e2)
4682 return true;
4684 /* If either one is VN_TOP consider them equal. */
4685 if (e1 == VN_TOP || e2 == VN_TOP)
4686 return true;
4688 /* If only one of them is null, they cannot be equal. */
4689 if (!e1 || !e2)
4690 return false;
4692 /* Now perform the actual comparison. */
4693 if (TREE_CODE (e1) == TREE_CODE (e2)
4694 && operand_equal_p (e1, e2, OEP_PURE_SAME))
4695 return true;
4697 return false;
4701 /* Return true if the nary operation NARY may trap. This is a copy
4702 of stmt_could_throw_1_p adjusted to the SCCVN IL. */
4704 bool
4705 vn_nary_may_trap (vn_nary_op_t nary)
4707 tree type;
4708 tree rhs2 = NULL_TREE;
4709 bool honor_nans = false;
4710 bool honor_snans = false;
4711 bool fp_operation = false;
4712 bool honor_trapv = false;
4713 bool handled, ret;
4714 unsigned i;
4716 if (TREE_CODE_CLASS (nary->opcode) == tcc_comparison
4717 || TREE_CODE_CLASS (nary->opcode) == tcc_unary
4718 || TREE_CODE_CLASS (nary->opcode) == tcc_binary)
4720 type = nary->type;
4721 fp_operation = FLOAT_TYPE_P (type);
4722 if (fp_operation)
4724 honor_nans = flag_trapping_math && !flag_finite_math_only;
4725 honor_snans = flag_signaling_nans != 0;
4727 else if (INTEGRAL_TYPE_P (type)
4728 && TYPE_OVERFLOW_TRAPS (type))
4729 honor_trapv = true;
4731 if (nary->length >= 2)
4732 rhs2 = nary->op[1];
4733 ret = operation_could_trap_helper_p (nary->opcode, fp_operation,
4734 honor_trapv,
4735 honor_nans, honor_snans, rhs2,
4736 &handled);
4737 if (handled
4738 && ret)
4739 return true;
4741 for (i = 0; i < nary->length; ++i)
4742 if (tree_could_trap_p (nary->op[i]))
4743 return true;
4745 return false;
4748 eliminate_dom_walker::eliminate_dom_walker (cdi_direction direction,
4749 bitmap inserted_exprs_)
4750 : dom_walker (direction), do_pre (inserted_exprs_ != NULL),
4751 el_todo (0), eliminations (0), insertions (0),
4752 inserted_exprs (inserted_exprs_)
4754 need_eh_cleanup = BITMAP_ALLOC (NULL);
4755 need_ab_cleanup = BITMAP_ALLOC (NULL);
4758 eliminate_dom_walker::~eliminate_dom_walker ()
4760 BITMAP_FREE (need_eh_cleanup);
4761 BITMAP_FREE (need_ab_cleanup);
4764 /* Return a leader for OP that is available at the current point of the
4765 eliminate domwalk. */
4767 tree
4768 eliminate_dom_walker::eliminate_avail (basic_block, tree op)
4770 tree valnum = VN_INFO (op)->valnum;
4771 if (TREE_CODE (valnum) == SSA_NAME)
4773 if (SSA_NAME_IS_DEFAULT_DEF (valnum))
4774 return valnum;
4775 if (avail.length () > SSA_NAME_VERSION (valnum))
4776 return avail[SSA_NAME_VERSION (valnum)];
4778 else if (is_gimple_min_invariant (valnum))
4779 return valnum;
4780 return NULL_TREE;
4783 /* At the current point of the eliminate domwalk make OP available. */
4785 void
4786 eliminate_dom_walker::eliminate_push_avail (basic_block, tree op)
4788 tree valnum = VN_INFO (op)->valnum;
4789 if (TREE_CODE (valnum) == SSA_NAME)
4791 if (avail.length () <= SSA_NAME_VERSION (valnum))
4792 avail.safe_grow_cleared (SSA_NAME_VERSION (valnum) + 1);
4793 tree pushop = op;
4794 if (avail[SSA_NAME_VERSION (valnum)])
4795 pushop = avail[SSA_NAME_VERSION (valnum)];
4796 avail_stack.safe_push (pushop);
4797 avail[SSA_NAME_VERSION (valnum)] = op;
4801 /* Insert the expression recorded by SCCVN for VAL at *GSI. Returns
4802 the leader for the expression if insertion was successful. */
4804 tree
4805 eliminate_dom_walker::eliminate_insert (basic_block bb,
4806 gimple_stmt_iterator *gsi, tree val)
4808 /* We can insert a sequence with a single assignment only. */
4809 gimple_seq stmts = VN_INFO (val)->expr;
4810 if (!gimple_seq_singleton_p (stmts))
4811 return NULL_TREE;
4812 gassign *stmt = dyn_cast <gassign *> (gimple_seq_first_stmt (stmts));
4813 if (!stmt
4814 || (!CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt))
4815 && gimple_assign_rhs_code (stmt) != VIEW_CONVERT_EXPR
4816 && gimple_assign_rhs_code (stmt) != BIT_FIELD_REF
4817 && (gimple_assign_rhs_code (stmt) != BIT_AND_EXPR
4818 || TREE_CODE (gimple_assign_rhs2 (stmt)) != INTEGER_CST)))
4819 return NULL_TREE;
4821 tree op = gimple_assign_rhs1 (stmt);
4822 if (gimple_assign_rhs_code (stmt) == VIEW_CONVERT_EXPR
4823 || gimple_assign_rhs_code (stmt) == BIT_FIELD_REF)
4824 op = TREE_OPERAND (op, 0);
4825 tree leader = TREE_CODE (op) == SSA_NAME ? eliminate_avail (bb, op) : op;
4826 if (!leader)
4827 return NULL_TREE;
4829 tree res;
4830 stmts = NULL;
4831 if (gimple_assign_rhs_code (stmt) == BIT_FIELD_REF)
4832 res = gimple_build (&stmts, BIT_FIELD_REF,
4833 TREE_TYPE (val), leader,
4834 TREE_OPERAND (gimple_assign_rhs1 (stmt), 1),
4835 TREE_OPERAND (gimple_assign_rhs1 (stmt), 2));
4836 else if (gimple_assign_rhs_code (stmt) == BIT_AND_EXPR)
4837 res = gimple_build (&stmts, BIT_AND_EXPR,
4838 TREE_TYPE (val), leader, gimple_assign_rhs2 (stmt));
4839 else
4840 res = gimple_build (&stmts, gimple_assign_rhs_code (stmt),
4841 TREE_TYPE (val), leader);
4842 if (TREE_CODE (res) != SSA_NAME
4843 || SSA_NAME_IS_DEFAULT_DEF (res)
4844 || gimple_bb (SSA_NAME_DEF_STMT (res)))
4846 gimple_seq_discard (stmts);
4848 /* During propagation we have to treat SSA info conservatively
4849 and thus we can end up simplifying the inserted expression
4850 at elimination time to sth not defined in stmts. */
4851 /* But then this is a redundancy we failed to detect. Which means
4852 res now has two values. That doesn't play well with how
4853 we track availability here, so give up. */
4854 if (dump_file && (dump_flags & TDF_DETAILS))
4856 if (TREE_CODE (res) == SSA_NAME)
4857 res = eliminate_avail (bb, res);
4858 if (res)
4860 fprintf (dump_file, "Failed to insert expression for value ");
4861 print_generic_expr (dump_file, val);
4862 fprintf (dump_file, " which is really fully redundant to ");
4863 print_generic_expr (dump_file, res);
4864 fprintf (dump_file, "\n");
4868 return NULL_TREE;
4870 else
4872 gsi_insert_seq_before (gsi, stmts, GSI_SAME_STMT);
4873 VN_INFO (res)->valnum = val;
4874 VN_INFO (res)->visited = true;
4877 insertions++;
4878 if (dump_file && (dump_flags & TDF_DETAILS))
4880 fprintf (dump_file, "Inserted ");
4881 print_gimple_stmt (dump_file, SSA_NAME_DEF_STMT (res), 0);
4884 return res;
4887 void
4888 eliminate_dom_walker::eliminate_stmt (basic_block b, gimple_stmt_iterator *gsi)
4890 tree sprime = NULL_TREE;
4891 gimple *stmt = gsi_stmt (*gsi);
4892 tree lhs = gimple_get_lhs (stmt);
4893 if (lhs && TREE_CODE (lhs) == SSA_NAME
4894 && !gimple_has_volatile_ops (stmt)
4895 /* See PR43491. Do not replace a global register variable when
4896 it is the RHS of an assignment. Do replace local register
4897 variables since gcc does not guarantee a local variable will
4898 be allocated in register.
4899 ??? The fix isn't effective here. This should instead
4900 be ensured by not value-numbering them the same but treating
4901 them like volatiles? */
4902 && !(gimple_assign_single_p (stmt)
4903 && (TREE_CODE (gimple_assign_rhs1 (stmt)) == VAR_DECL
4904 && DECL_HARD_REGISTER (gimple_assign_rhs1 (stmt))
4905 && is_global_var (gimple_assign_rhs1 (stmt)))))
4907 sprime = eliminate_avail (b, lhs);
4908 if (!sprime)
4910 /* If there is no existing usable leader but SCCVN thinks
4911 it has an expression it wants to use as replacement,
4912 insert that. */
4913 tree val = VN_INFO (lhs)->valnum;
4914 if (val != VN_TOP
4915 && TREE_CODE (val) == SSA_NAME
4916 && VN_INFO (val)->needs_insertion
4917 && VN_INFO (val)->expr != NULL
4918 && (sprime = eliminate_insert (b, gsi, val)) != NULL_TREE)
4919 eliminate_push_avail (b, sprime);
4922 /* If this now constitutes a copy duplicate points-to
4923 and range info appropriately. This is especially
4924 important for inserted code. See tree-ssa-copy.c
4925 for similar code. */
4926 if (sprime
4927 && TREE_CODE (sprime) == SSA_NAME)
4929 basic_block sprime_b = gimple_bb (SSA_NAME_DEF_STMT (sprime));
4930 if (POINTER_TYPE_P (TREE_TYPE (lhs))
4931 && SSA_NAME_PTR_INFO (lhs)
4932 && ! SSA_NAME_PTR_INFO (sprime))
4934 duplicate_ssa_name_ptr_info (sprime,
4935 SSA_NAME_PTR_INFO (lhs));
4936 if (b != sprime_b)
4937 mark_ptr_info_alignment_unknown
4938 (SSA_NAME_PTR_INFO (sprime));
4940 else if (INTEGRAL_TYPE_P (TREE_TYPE (lhs))
4941 && SSA_NAME_RANGE_INFO (lhs)
4942 && ! SSA_NAME_RANGE_INFO (sprime)
4943 && b == sprime_b)
4944 duplicate_ssa_name_range_info (sprime,
4945 SSA_NAME_RANGE_TYPE (lhs),
4946 SSA_NAME_RANGE_INFO (lhs));
4949 /* Inhibit the use of an inserted PHI on a loop header when
4950 the address of the memory reference is a simple induction
4951 variable. In other cases the vectorizer won't do anything
4952 anyway (either it's loop invariant or a complicated
4953 expression). */
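/* E.g. replacing a load from a[i_1] in the loop body with a PHI that
   PRE inserted on the loop header would turn an independent,
   vectorizable load into a loop-carried dependence (illustrative
   scenario).  */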
4954 if (sprime
4955 && TREE_CODE (sprime) == SSA_NAME
4956 && do_pre
4957 && (flag_tree_loop_vectorize || flag_tree_parallelize_loops > 1)
4958 && loop_outer (b->loop_father)
4959 && has_zero_uses (sprime)
4960 && bitmap_bit_p (inserted_exprs, SSA_NAME_VERSION (sprime))
4961 && gimple_assign_load_p (stmt))
4963 gimple *def_stmt = SSA_NAME_DEF_STMT (sprime);
4964 basic_block def_bb = gimple_bb (def_stmt);
4965 if (gimple_code (def_stmt) == GIMPLE_PHI
4966 && def_bb->loop_father->header == def_bb)
4968 loop_p loop = def_bb->loop_father;
4969 ssa_op_iter iter;
4970 tree op;
4971 bool found = false;
4972 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
4974 affine_iv iv;
4975 def_bb = gimple_bb (SSA_NAME_DEF_STMT (op));
4976 if (def_bb
4977 && flow_bb_inside_loop_p (loop, def_bb)
4978 && simple_iv (loop, loop, op, &iv, true))
4980 found = true;
4981 break;
4984 if (found)
4986 if (dump_file && (dump_flags & TDF_DETAILS))
4988 fprintf (dump_file, "Not replacing ");
4989 print_gimple_expr (dump_file, stmt, 0);
4990 fprintf (dump_file, " with ");
4991 print_generic_expr (dump_file, sprime);
4992 fprintf (dump_file, " which would add a loop"
4993 " carried dependence to loop %d\n",
4994 loop->num);
4996 /* Don't keep sprime available. */
4997 sprime = NULL_TREE;
5002 if (sprime)
5004 /* If we can propagate the value computed for LHS into
5005 all uses don't bother doing anything with this stmt. */
5006 if (may_propagate_copy (lhs, sprime))
5008 /* Mark it for removal. */
5009 to_remove.safe_push (stmt);
5011 /* ??? Don't count copy/constant propagations. */
5012 if (gimple_assign_single_p (stmt)
5013 && (TREE_CODE (gimple_assign_rhs1 (stmt)) == SSA_NAME
5014 || gimple_assign_rhs1 (stmt) == sprime))
5015 return;
5017 if (dump_file && (dump_flags & TDF_DETAILS))
5019 fprintf (dump_file, "Replaced ");
5020 print_gimple_expr (dump_file, stmt, 0);
5021 fprintf (dump_file, " with ");
5022 print_generic_expr (dump_file, sprime);
5023 fprintf (dump_file, " in all uses of ");
5024 print_gimple_stmt (dump_file, stmt, 0);
5027 eliminations++;
5028 return;
5031 /* If this is an assignment from our leader (which
5032 happens in the case the value-number is a constant)
5033 then there is nothing to do. */
5034 if (gimple_assign_single_p (stmt)
5035 && sprime == gimple_assign_rhs1 (stmt))
5036 return;
5038 /* Else replace its RHS. */
5039 if (dump_file && (dump_flags & TDF_DETAILS))
5041 fprintf (dump_file, "Replaced ");
5042 print_gimple_expr (dump_file, stmt, 0);
5043 fprintf (dump_file, " with ");
5044 print_generic_expr (dump_file, sprime);
5045 fprintf (dump_file, " in ");
5046 print_gimple_stmt (dump_file, stmt, 0);
5048 eliminations++;
5050 bool can_make_abnormal_goto = (is_gimple_call (stmt)
5051 && stmt_can_make_abnormal_goto (stmt));
5052 gimple *orig_stmt = stmt;
5053 if (!useless_type_conversion_p (TREE_TYPE (lhs),
5054 TREE_TYPE (sprime)))
5056 /* We preserve conversions to but not from function or method
5057 types. This asymmetry makes it necessary to re-instantiate
5058 conversions here. */
5059 if (POINTER_TYPE_P (TREE_TYPE (lhs))
5060 && FUNC_OR_METHOD_TYPE_P (TREE_TYPE (TREE_TYPE (lhs))))
5061 sprime = fold_convert (TREE_TYPE (lhs), sprime);
5062 else
5063 gcc_unreachable ();
5065 tree vdef = gimple_vdef (stmt);
5066 tree vuse = gimple_vuse (stmt);
5067 propagate_tree_value_into_stmt (gsi, sprime);
5068 stmt = gsi_stmt (*gsi);
5069 update_stmt (stmt);
5070 /* In case the VDEF on the original stmt was released, value-number
5071 it to the VUSE. This is to make vuse_ssa_val able to skip
5072 released virtual operands. */
5073 if (vdef != gimple_vdef (stmt))
5075 gcc_assert (SSA_NAME_IN_FREE_LIST (vdef));
5076 VN_INFO (vdef)->valnum = vuse;
5079 /* If we removed EH side-effects from the statement, clean
5080 its EH information. */
5081 if (maybe_clean_or_replace_eh_stmt (orig_stmt, stmt))
5083 bitmap_set_bit (need_eh_cleanup,
5084 gimple_bb (stmt)->index);
5085 if (dump_file && (dump_flags & TDF_DETAILS))
5086 fprintf (dump_file, " Removed EH side-effects.\n");
5089 /* Likewise for AB side-effects. */
5090 if (can_make_abnormal_goto
5091 && !stmt_can_make_abnormal_goto (stmt))
5093 bitmap_set_bit (need_ab_cleanup,
5094 gimple_bb (stmt)->index);
5095 if (dump_file && (dump_flags & TDF_DETAILS))
5096 fprintf (dump_file, " Removed AB side-effects.\n");
5099 return;
5103 /* If the statement is a scalar store, see if the expression
5104 has the same value number as its rhs. If so, the store is
5105 dead. */
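/* E.g. (illustrative):

     x_1 = *p_2;
     ...
     *p_2 = x_1;

   stores the value the location is already known to hold, so the
   store can be deleted provided the alias-set check below succeeds.  */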
5106 if (gimple_assign_single_p (stmt)
5107 && !gimple_has_volatile_ops (stmt)
5108 && !is_gimple_reg (gimple_assign_lhs (stmt))
5109 && (TREE_CODE (gimple_assign_rhs1 (stmt)) == SSA_NAME
5110 || is_gimple_min_invariant (gimple_assign_rhs1 (stmt))))
5112 tree val;
5113 tree rhs = gimple_assign_rhs1 (stmt);
5114 vn_reference_t vnresult;
5115 val = vn_reference_lookup (lhs, gimple_vuse (stmt), VN_WALKREWRITE,
5116 &vnresult, false);
5117 if (TREE_CODE (rhs) == SSA_NAME)
5118 rhs = VN_INFO (rhs)->valnum;
5119 if (val
5120 && operand_equal_p (val, rhs, 0))
5122 /* We can only remove the later store if the former aliases
5123 at least all accesses the later one does or if the store
5124 was to readonly memory storing the same value. */
5125 alias_set_type set = get_alias_set (lhs);
5126 if (! vnresult
5127 || vnresult->set == set
5128 || alias_set_subset_of (set, vnresult->set))
5130 if (dump_file && (dump_flags & TDF_DETAILS))
5132 fprintf (dump_file, "Deleted redundant store ");
5133 print_gimple_stmt (dump_file, stmt, 0);
5136 /* Queue stmt for removal. */
5137 to_remove.safe_push (stmt);
5138 return;
5143 /* If this is a control statement for which value numbering left
5144 edges unexecuted, force the condition in a way consistent with
5145 that. */
5146 if (gcond *cond = dyn_cast <gcond *> (stmt))
5148 if ((EDGE_SUCC (b, 0)->flags & EDGE_EXECUTABLE)
5149 ^ (EDGE_SUCC (b, 1)->flags & EDGE_EXECUTABLE))
5151 if (dump_file && (dump_flags & TDF_DETAILS))
5153 fprintf (dump_file, "Removing unexecutable edge from ");
5154 print_gimple_stmt (dump_file, stmt, 0);
5156 if (((EDGE_SUCC (b, 0)->flags & EDGE_TRUE_VALUE) != 0)
5157 == ((EDGE_SUCC (b, 0)->flags & EDGE_EXECUTABLE) != 0))
5158 gimple_cond_make_true (cond);
5159 else
5160 gimple_cond_make_false (cond);
5161 update_stmt (cond);
5162 el_todo |= TODO_cleanup_cfg;
5163 return;
5167 bool can_make_abnormal_goto = stmt_can_make_abnormal_goto (stmt);
5168 bool was_noreturn = (is_gimple_call (stmt)
5169 && gimple_call_noreturn_p (stmt));
5170 tree vdef = gimple_vdef (stmt);
5171 tree vuse = gimple_vuse (stmt);
5173 /* If we didn't replace the whole stmt (or propagate the result
5174 into all uses), replace all uses on this stmt with their
5175 leaders. */
5176 bool modified = false;
5177 use_operand_p use_p;
5178 ssa_op_iter iter;
5179 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5181 tree use = USE_FROM_PTR (use_p);
5182 /* ??? The call code above leaves stmt operands un-updated. */
5183 if (TREE_CODE (use) != SSA_NAME)
5184 continue;
5185 tree sprime;
5186 if (SSA_NAME_IS_DEFAULT_DEF (use))
5187 /* ??? For default defs BB shouldn't matter, but we have to
5188 solve the inconsistency between rpo eliminate and
5189 dom eliminate avail valueization first. */
5190 sprime = eliminate_avail (b, use);
5191 else
5192 /* Look for sth available at the definition block of the argument.
5193 This avoids inconsistencies between availability there which
5194 decides if the stmt can be removed and availability at the
5195 use site. The SSA property ensures that things available
5196 at the definition are also available at uses. */
5197 sprime = eliminate_avail (gimple_bb (SSA_NAME_DEF_STMT (use)), use);
5198 if (sprime && sprime != use
5199 && may_propagate_copy (use, sprime)
5200 /* We substitute into debug stmts to avoid excessive
5201 debug temporaries created by removed stmts, but we need
5202 to avoid doing so for inserted sprimes as we never want
5203 to create debug temporaries for them. */
5204 && (!inserted_exprs
5205 || TREE_CODE (sprime) != SSA_NAME
5206 || !is_gimple_debug (stmt)
5207 || !bitmap_bit_p (inserted_exprs, SSA_NAME_VERSION (sprime))))
5209 propagate_value (use_p, sprime);
5210 modified = true;
5214 /* Fold the stmt if modified, this canonicalizes MEM_REFs we propagated
5215 into which is a requirement for the IPA devirt machinery. */
5216 gimple *old_stmt = stmt;
5217 if (modified)
5219 /* If a formerly non-invariant ADDR_EXPR is turned into an
5220 invariant one it was on a separate stmt. */
5221 if (gimple_assign_single_p (stmt)
5222 && TREE_CODE (gimple_assign_rhs1 (stmt)) == ADDR_EXPR)
5223 recompute_tree_invariant_for_addr_expr (gimple_assign_rhs1 (stmt));
5224 gimple_stmt_iterator prev = *gsi;
5225 gsi_prev (&prev);
5226 if (fold_stmt (gsi))
5228 /* fold_stmt may have created new stmts in between
5229 the previous stmt and the folded stmt. Mark
5230 all defs created there as varying to not confuse
5231 the SCCVN machinery as we're using that even during
5232 elimination. */
5233 if (gsi_end_p (prev))
5234 prev = gsi_start_bb (b);
5235 else
5236 gsi_next (&prev);
5237 if (gsi_stmt (prev) != gsi_stmt (*gsi))
5240 tree def;
5241 ssa_op_iter dit;
5242 FOR_EACH_SSA_TREE_OPERAND (def, gsi_stmt (prev),
5243 dit, SSA_OP_ALL_DEFS)
5244 /* As existing DEFs may move between stmts
5245 only process new ones. */
5246 if (! has_VN_INFO (def))
5248 VN_INFO (def)->valnum = def;
5249 VN_INFO (def)->visited = true;
5251 if (gsi_stmt (prev) == gsi_stmt (*gsi))
5252 break;
5253 gsi_next (&prev);
5255 while (1);
5257 stmt = gsi_stmt (*gsi);
5258 /* In case we folded the stmt away schedule the NOP for removal. */
5259 if (gimple_nop_p (stmt))
5260 to_remove.safe_push (stmt);
5263 /* Visit indirect calls and turn them into direct calls if
5264 possible using the devirtualization machinery. Do this before
5265 checking for required EH/abnormal/noreturn cleanup as devirt
5266 may expose more of those. */
5267 if (gcall *call_stmt = dyn_cast <gcall *> (stmt))
5269 tree fn = gimple_call_fn (call_stmt);
5270 if (fn
5271 && flag_devirtualize
5272 && virtual_method_call_p (fn))
5274 tree otr_type = obj_type_ref_class (fn);
5275 unsigned HOST_WIDE_INT otr_tok
5276 = tree_to_uhwi (OBJ_TYPE_REF_TOKEN (fn));
5277 tree instance;
5278 ipa_polymorphic_call_context context (current_function_decl,
5279 fn, stmt, &instance);
5280 context.get_dynamic_type (instance, OBJ_TYPE_REF_OBJECT (fn),
5281 otr_type, stmt, NULL);
5282 bool final;
5283 vec <cgraph_node *> targets
5284 = possible_polymorphic_call_targets (obj_type_ref_class (fn),
5285 otr_tok, context, &final);
5286 if (dump_file)
5287 dump_possible_polymorphic_call_targets (dump_file,
5288 obj_type_ref_class (fn),
5289 otr_tok, context);
5290 if (final && targets.length () <= 1 && dbg_cnt (devirt))
5292 tree fn;
5293 if (targets.length () == 1)
5294 fn = targets[0]->decl;
5295 else
5296 fn = builtin_decl_implicit (BUILT_IN_UNREACHABLE);
5297 if (dump_enabled_p ())
5299 dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, stmt,
5300 "converting indirect call to "
5301 "function %s\n",
5302 lang_hooks.decl_printable_name (fn, 2));
5304 gimple_call_set_fndecl (call_stmt, fn);
5305 /* If changing the call to __builtin_unreachable
5306 or similar noreturn function, adjust gimple_call_fntype
5307 too. */
5308 if (gimple_call_noreturn_p (call_stmt)
5309 && VOID_TYPE_P (TREE_TYPE (TREE_TYPE (fn)))
5310 && TYPE_ARG_TYPES (TREE_TYPE (fn))
5311 && (TREE_VALUE (TYPE_ARG_TYPES (TREE_TYPE (fn)))
5312 == void_type_node))
5313 gimple_call_set_fntype (call_stmt, TREE_TYPE (fn));
5314 maybe_remove_unused_call_args (cfun, call_stmt);
5315 modified = true;
5320 if (modified)
5322 /* When changing a call into a noreturn call, cfg cleanup
5323 is needed to fix up the noreturn call. */
5324 if (!was_noreturn
5325 && is_gimple_call (stmt) && gimple_call_noreturn_p (stmt))
5326 to_fixup.safe_push (stmt);
5327 /* When changing a condition or switch into one we know what
5328 edge will be executed, schedule a cfg cleanup. */
5329 if ((gimple_code (stmt) == GIMPLE_COND
5330 && (gimple_cond_true_p (as_a <gcond *> (stmt))
5331 || gimple_cond_false_p (as_a <gcond *> (stmt))))
5332 || (gimple_code (stmt) == GIMPLE_SWITCH
5333 && TREE_CODE (gimple_switch_index
5334 (as_a <gswitch *> (stmt))) == INTEGER_CST))
5335 el_todo |= TODO_cleanup_cfg;
5336 /* If we removed EH side-effects from the statement, clean
5337 its EH information. */
5338 if (maybe_clean_or_replace_eh_stmt (old_stmt, stmt))
5340 bitmap_set_bit (need_eh_cleanup,
5341 gimple_bb (stmt)->index);
5342 if (dump_file && (dump_flags & TDF_DETAILS))
5343 fprintf (dump_file, " Removed EH side-effects.\n");
5345 /* Likewise for AB side-effects. */
5346 if (can_make_abnormal_goto
5347 && !stmt_can_make_abnormal_goto (stmt))
5349 bitmap_set_bit (need_ab_cleanup,
5350 gimple_bb (stmt)->index);
5351 if (dump_file && (dump_flags & TDF_DETAILS))
5352 fprintf (dump_file, " Removed AB side-effects.\n");
5354 update_stmt (stmt);
5355 /* In case the VDEF on the original stmt was released, value-number
5356 it to the VUSE. This is to make vuse_ssa_val able to skip
5357 released virtual operands. */
5358 if (vdef && SSA_NAME_IN_FREE_LIST (vdef))
5359 VN_INFO (vdef)->valnum = vuse;
5362 /* Make new values available - for fully redundant LHS we
5363 continue with the next stmt above and skip this. */
5364 def_operand_p defp;
5365 FOR_EACH_SSA_DEF_OPERAND (defp, stmt, iter, SSA_OP_DEF)
5366 eliminate_push_avail (b, DEF_FROM_PTR (defp));
5369 /* Perform elimination for the basic-block B during the domwalk. */
5371 edge
5372 eliminate_dom_walker::before_dom_children (basic_block b)
5374 /* Mark new bb. */
5375 avail_stack.safe_push (NULL_TREE);
5377 /* Skip unreachable blocks marked unreachable during the SCCVN domwalk. */
5378 if (!(b->flags & BB_EXECUTABLE))
5379 return NULL;
5381 vn_context_bb = b;
5383 for (gphi_iterator gsi = gsi_start_phis (b); !gsi_end_p (gsi);)
5385 gphi *phi = gsi.phi ();
5386 tree res = PHI_RESULT (phi);
5388 if (virtual_operand_p (res))
5390 gsi_next (&gsi);
5391 continue;
5394 tree sprime = eliminate_avail (b, res);
5395 if (sprime
5396 && sprime != res)
5398 if (dump_file && (dump_flags & TDF_DETAILS))
5400 fprintf (dump_file, "Replaced redundant PHI node defining ");
5401 print_generic_expr (dump_file, res);
5402 fprintf (dump_file, " with ");
5403 print_generic_expr (dump_file, sprime);
5404 fprintf (dump_file, "\n");
5407 /* If we inserted this PHI node ourself, it's not an elimination. */
5408 if (! inserted_exprs
5409 || ! bitmap_bit_p (inserted_exprs, SSA_NAME_VERSION (res)))
5410 eliminations++;
5412 /* If we will propagate into all uses don't bother to do
5413 anything. */
5414 if (may_propagate_copy (res, sprime))
5416 /* Mark the PHI for removal. */
5417 to_remove.safe_push (phi);
5418 gsi_next (&gsi);
5419 continue;
5422 remove_phi_node (&gsi, false);
5424 if (!useless_type_conversion_p (TREE_TYPE (res), TREE_TYPE (sprime)))
5425 sprime = fold_convert (TREE_TYPE (res), sprime);
5426 gimple *stmt = gimple_build_assign (res, sprime);
5427 gimple_stmt_iterator gsi2 = gsi_after_labels (b);
5428 gsi_insert_before (&gsi2, stmt, GSI_NEW_STMT);
5429 continue;
5432 eliminate_push_avail (b, res);
5433 gsi_next (&gsi);
5436 for (gimple_stmt_iterator gsi = gsi_start_bb (b);
5437 !gsi_end_p (gsi);
5438 gsi_next (&gsi))
5439 eliminate_stmt (b, &gsi);
5441 /* Replace destination PHI arguments. */
5442 edge_iterator ei;
5443 edge e;
5444 FOR_EACH_EDGE (e, ei, b->succs)
5445 if (e->flags & EDGE_EXECUTABLE)
5446 for (gphi_iterator gsi = gsi_start_phis (e->dest);
5447 !gsi_end_p (gsi);
5448 gsi_next (&gsi))
5450 gphi *phi = gsi.phi ();
5451 use_operand_p use_p = PHI_ARG_DEF_PTR_FROM_EDGE (phi, e);
5452 tree arg = USE_FROM_PTR (use_p);
5453 if (TREE_CODE (arg) != SSA_NAME
5454 || virtual_operand_p (arg))
5455 continue;
5456 tree sprime = eliminate_avail (b, arg);
5457 if (sprime && may_propagate_copy (arg, sprime))
5458 propagate_value (use_p, sprime);
5461 vn_context_bb = NULL;
5463 return NULL;
5466 /* Make no longer available leaders no longer available. */
5468 void
5469 eliminate_dom_walker::after_dom_children (basic_block)
5471 tree entry;
5472 while ((entry = avail_stack.pop ()) != NULL_TREE)
5474 tree valnum = VN_INFO (entry)->valnum;
5475 tree old = avail[SSA_NAME_VERSION (valnum)];
5476 if (old == entry)
5477 avail[SSA_NAME_VERSION (valnum)] = NULL_TREE;
5478 else
5479 avail[SSA_NAME_VERSION (valnum)] = entry;
5483 /* Remove queued stmts and perform delayed cleanups. */
5485 unsigned
5486 eliminate_dom_walker::eliminate_cleanup (bool region_p)
5488 statistics_counter_event (cfun, "Eliminated", eliminations);
5489 statistics_counter_event (cfun, "Insertions", insertions);
5491 /* We cannot remove stmts during BB walk, especially not release SSA
5492 names there as this confuses the VN machinery. The stmts ending
5493 up in to_remove are either stores or simple copies.
5494 Remove stmts in reverse order to make debug stmt creation possible. */
5495 while (!to_remove.is_empty ())
5497 bool do_release_defs = true;
5498 gimple *stmt = to_remove.pop ();
5500 /* When we are value-numbering a region we do not require exit PHIs to
5501 be present so we have to make sure to deal with uses outside of the
5502 region of stmts that we thought are eliminated.
5503 ??? Note we may be confused by uses in dead regions we didn't run
5504 elimination on. Rather than checking individual uses we accept
5505 dead copies to be generated here (gcc.c-torture/execute/20060905-1.c
5506 contains such example). */
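/* E.g. when only a loop body was value numbered, a PHI result that is
   still used after the loop cannot simply be released; instead we keep
   the value live by emitting a copy from its leader (illustrative
   scenario).  */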
5507 if (region_p)
5509 if (gphi *phi = dyn_cast <gphi *> (stmt))
5511 tree lhs = gimple_phi_result (phi);
5512 if (!has_zero_uses (lhs))
5514 if (dump_file && (dump_flags & TDF_DETAILS))
5515 fprintf (dump_file, "Keeping eliminated stmt live "
5516 "as copy because of out-of-region uses\n");
5517 tree sprime = eliminate_avail (gimple_bb (stmt), lhs);
5518 gimple *copy = gimple_build_assign (lhs, sprime);
5519 gimple_stmt_iterator gsi
5520 = gsi_after_labels (gimple_bb (stmt));
5521 gsi_insert_before (&gsi, copy, GSI_SAME_STMT);
5522 do_release_defs = false;
5525 else if (tree lhs = gimple_get_lhs (stmt))
5526 if (TREE_CODE (lhs) == SSA_NAME
5527 && !has_zero_uses (lhs))
5529 if (dump_file && (dump_flags & TDF_DETAILS))
5530 fprintf (dump_file, "Keeping eliminated stmt live "
5531 "as copy because of out-of-region uses\n");
5532 tree sprime = eliminate_avail (gimple_bb (stmt), lhs);
5533 gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
5534 if (is_gimple_assign (stmt))
5536 gimple_assign_set_rhs_from_tree (&gsi, sprime);
5537 stmt = gsi_stmt (gsi);
5538 update_stmt (stmt);
5539 if (maybe_clean_or_replace_eh_stmt (stmt, stmt))
5540 bitmap_set_bit (need_eh_cleanup, gimple_bb (stmt)->index);
5541 continue;
5543 else
5545 gimple *copy = gimple_build_assign (lhs, sprime);
5546 gsi_insert_before (&gsi, copy, GSI_SAME_STMT);
5547 do_release_defs = false;
5552 if (dump_file && (dump_flags & TDF_DETAILS))
5554 fprintf (dump_file, "Removing dead stmt ");
5555 print_gimple_stmt (dump_file, stmt, 0, TDF_NONE);
5558 gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
5559 if (gimple_code (stmt) == GIMPLE_PHI)
5560 remove_phi_node (&gsi, do_release_defs);
5561 else
5563 basic_block bb = gimple_bb (stmt);
5564 unlink_stmt_vdef (stmt);
5565 if (gsi_remove (&gsi, true))
5566 bitmap_set_bit (need_eh_cleanup, bb->index);
5567 if (is_gimple_call (stmt) && stmt_can_make_abnormal_goto (stmt))
5568 bitmap_set_bit (need_ab_cleanup, bb->index);
5569 if (do_release_defs)
5570 release_defs (stmt);
5573 /* Removing a stmt may expose a forwarder block. */
5574 el_todo |= TODO_cleanup_cfg;
5577 /* Fixup stmts that became noreturn calls. This may require splitting
5578 blocks and thus isn't possible during the dominator walk. Do this
5579 in reverse order so we don't inadvertently remove a stmt we want to
5580 fixup by visiting a dominating now noreturn call first. */
5581 while (!to_fixup.is_empty ())
5583 gimple *stmt = to_fixup.pop ();
5585 if (dump_file && (dump_flags & TDF_DETAILS))
5587 fprintf (dump_file, "Fixing up noreturn call ");
5588 print_gimple_stmt (dump_file, stmt, 0);
5591 if (fixup_noreturn_call (stmt))
5592 el_todo |= TODO_cleanup_cfg;
5595 bool do_eh_cleanup = !bitmap_empty_p (need_eh_cleanup);
5596 bool do_ab_cleanup = !bitmap_empty_p (need_ab_cleanup);
5598 if (do_eh_cleanup)
5599 gimple_purge_all_dead_eh_edges (need_eh_cleanup);
5601 if (do_ab_cleanup)
5602 gimple_purge_all_dead_abnormal_call_edges (need_ab_cleanup);
5604 if (do_eh_cleanup || do_ab_cleanup)
5605 el_todo |= TODO_cleanup_cfg;
5607 return el_todo;
5610 /* Eliminate fully redundant computations. */
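/* This is a thin driver: walk the function with eliminate_dom_walker
   starting at the CFG entry block, then run the delayed
   eliminate_cleanup above. */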
5612 unsigned
5613 eliminate_with_rpo_vn (bitmap inserted_exprs)
5615 eliminate_dom_walker walker (CDI_DOMINATORS, inserted_exprs);
5617 walker.walk (cfun->cfg->x_entry_block_ptr);
5618 return walker.eliminate_cleanup ();
5621 static unsigned
5622 do_rpo_vn (function *fn, edge entry, bitmap exit_bbs,
5623 bool iterate, bool eliminate);
5625 void
5626 run_rpo_vn (vn_lookup_kind kind)
5628 default_vn_walk_kind = kind;
5629 do_rpo_vn (cfun, NULL, NULL, true, false);
5631 /* ??? Prune requirement of these. */
5632 constant_to_value_id = new hash_table<vn_constant_hasher> (23);
5633 constant_value_ids = BITMAP_ALLOC (NULL);
5635 /* Initialize the value ids and prune out remaining VN_TOPs
5636 from dead code. */
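/* That is: names never visited or still valued VN_TOP get themselves
   as value; each value representative then gets a fresh value id,
   constants get a shared constant value id, and the propagation loop
   below copies value ids from representatives to the names valueizing
   to them. */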
5637 tree name;
5638 unsigned i;
5639 FOR_EACH_SSA_NAME (i, name, cfun)
5641 vn_ssa_aux_t info = VN_INFO (name);
5642 if (!info->visited
5643 || info->valnum == VN_TOP)
5644 info->valnum = name;
5645 if (info->valnum == name)
5646 info->value_id = get_next_value_id ();
5647 else if (is_gimple_min_invariant (info->valnum))
5648 info->value_id = get_or_alloc_constant_value_id (info->valnum);
5651 /* Propagate. */
5652 FOR_EACH_SSA_NAME (i, name, cfun)
5654 vn_ssa_aux_t info = VN_INFO (name);
5655 if (TREE_CODE (info->valnum) == SSA_NAME
5656 && info->valnum != name
5657 && info->value_id != VN_INFO (info->valnum)->value_id)
5658 info->value_id = VN_INFO (info->valnum)->value_id;
5661 set_hashtable_value_ids ();
5663 if (dump_file && (dump_flags & TDF_DETAILS))
5665 fprintf (dump_file, "Value numbers:\n");
5666 FOR_EACH_SSA_NAME (i, name, cfun)
5668 if (VN_INFO (name)->visited
5669 && SSA_VAL (name) != name)
5671 print_generic_expr (dump_file, name);
5672 fprintf (dump_file, " = ");
5673 print_generic_expr (dump_file, SSA_VAL (name));
5674 fprintf (dump_file, " (%04d)\n", VN_INFO (name)->value_id);
5680 /* Free VN associated data structures. */
5682 void
5683 free_rpo_vn (void)
5685 free_vn_table (valid_info);
5686 XDELETE (valid_info);
5687 obstack_free (&vn_tables_obstack, NULL);
5688 obstack_free (&vn_tables_insert_obstack, NULL);
5690 vn_ssa_aux_iterator_type it;
5691 vn_ssa_aux_t info;
5692 FOR_EACH_HASH_TABLE_ELEMENT (*vn_ssa_aux_hash, info, vn_ssa_aux_t, it)
5693 if (info->needs_insertion)
5694 release_ssa_name (info->name);
5695 obstack_free (&vn_ssa_aux_obstack, NULL);
5696 delete vn_ssa_aux_hash;
5698 delete constant_to_value_id;
5699 constant_to_value_id = NULL;
5700 BITMAP_FREE (constant_value_ids);
5703 /* Hook for maybe_push_res_to_seq, lookup the expression in the VN tables. */
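/* Illustrative use: when the match-and-simplify machinery would
   otherwise have to materialize an intermediate expression, this hook
   lets it reuse an SSA name the VN tables already record for that
   expression, filtered through eliminate_avail so only an available
   leader is handed back. */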
5705 static tree
5706 vn_lookup_simplify_result (gimple_match_op *res_op)
5708 if (!res_op->code.is_tree_code ())
5709 return NULL_TREE;
5710 tree *ops = res_op->ops;
5711 unsigned int length = res_op->num_ops;
5712 if (res_op->code == CONSTRUCTOR
5713 /* ??? We're arriving here with SCCVN's view, a decomposed CONSTRUCTOR,
5714 while GIMPLE and match-and-simplify see the CONSTRUCTOR as a GENERIC tree. */
5715 && TREE_CODE (res_op->ops[0]) == CONSTRUCTOR)
5717 length = CONSTRUCTOR_NELTS (res_op->ops[0]);
5718 ops = XALLOCAVEC (tree, length);
5719 for (unsigned i = 0; i < length; ++i)
5720 ops[i] = CONSTRUCTOR_ELT (res_op->ops[0], i)->value;
5722 vn_nary_op_t vnresult = NULL;
5723 tree res = vn_nary_op_lookup_pieces (length, (tree_code) res_op->code,
5724 res_op->type, ops, &vnresult);
5725 /* If this is used from expression simplification make sure to
5726 return an available expression. */
5727 if (res && TREE_CODE (res) == SSA_NAME && mprts_hook && rpo_avail)
5728 res = rpo_avail->eliminate_avail (vn_context_bb, res);
5729 return res;
5732 rpo_elim::~rpo_elim ()
5734 /* Release the avail vectors. */
5735 for (rpo_avail_t::iterator i = m_rpo_avail.begin ();
5736 i != m_rpo_avail.end (); ++i)
5737 (*i).second.release ();
5740 /* Return a leader for OPs value that is valid at BB. */
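/* Note (describing the lookup below): m_rpo_avail maps a value (an
   SSA name) to a vector of (block index, SSA name version) pairs
   pushed in RPO order by eliminate_push_avail; we scan that vector
   from the back and return the first entry whose block dominates BB,
   using dominated_by_p_w_unex to take non-executable paths into
   account. */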
5742 tree
5743 rpo_elim::eliminate_avail (basic_block bb, tree op)
5745 bool visited;
5746 tree valnum = SSA_VAL (op, &visited);
5747 /* If we didn't visit OP then it must be defined outside of the
5748 region we process and also dominate it. So it is available. */
5749 if (!visited)
5750 return op;
5751 if (TREE_CODE (valnum) == SSA_NAME)
5753 if (SSA_NAME_IS_DEFAULT_DEF (valnum))
5754 return valnum;
5755 vec<std::pair<int, int> > *av = m_rpo_avail.get (valnum);
5756 if (!av || av->is_empty ())
5757 return NULL_TREE;
5758 int i = av->length () - 1;
5759 if ((*av)[i].first == bb->index)
5760 /* On tramp3d 90% of the cases are here. */
5761 return ssa_name ((*av)[i].second);
5764 basic_block abb = BASIC_BLOCK_FOR_FN (cfun, (*av)[i].first);
5765 /* ??? During elimination we have to use availability at the
5766 definition site of a use we try to replace. This
5767 is required to not run into inconsistencies because
5768 of dominated_by_p_w_unex behavior and removing a definition
5769 while not replacing all uses.
5770 ??? We could try to consistently walk dominators
5771 ignoring non-executable regions. The nearest common
5772 dominator of bb and abb is where we can stop walking. We
5773 may also be able to "pre-compute" (bits of) the next immediate
5774 (non-)dominator during the RPO walk when marking edges as
5775 executable. */
5776 if (dominated_by_p_w_unex (bb, abb))
5778 tree leader = ssa_name ((*av)[i].second);
5779 /* Prevent eliminations that break loop-closed SSA. */
5780 if (loops_state_satisfies_p (LOOP_CLOSED_SSA)
5781 && ! SSA_NAME_IS_DEFAULT_DEF (leader)
5782 && ! flow_bb_inside_loop_p (gimple_bb (SSA_NAME_DEF_STMT
5783 (leader))->loop_father,
5784 bb))
5785 return NULL_TREE;
5786 if (dump_file && (dump_flags & TDF_DETAILS))
5788 print_generic_expr (dump_file, leader);
5789 fprintf (dump_file, " is available for ");
5790 print_generic_expr (dump_file, valnum);
5791 fprintf (dump_file, "\n");
5793 /* On tramp3d 99% of the _remaining_ cases succeed at
5794 the first entry. */
5795 return leader;
5797 /* ??? Can we somehow skip to the immediate dominator
5798 RPO index (bb_to_rpo)? Again, maybe not worth it; on
5799 tramp3d the worst number of elements in the vector is 9. */
5801 while (--i >= 0);
5803 else if (valnum != VN_TOP)
5804 /* valnum is is_gimple_min_invariant. */
5805 return valnum;
5806 return NULL_TREE;
5809 /* Make LEADER a leader for its value at BB. */
5811 void
5812 rpo_elim::eliminate_push_avail (basic_block bb, tree leader)
5814 tree valnum = VN_INFO (leader)->valnum;
5815 if (valnum == VN_TOP)
5816 return;
5817 if (dump_file && (dump_flags & TDF_DETAILS))
5819 fprintf (dump_file, "Making available beyond BB%d ", bb->index);
5820 print_generic_expr (dump_file, leader);
5821 fprintf (dump_file, " for value ");
5822 print_generic_expr (dump_file, valnum);
5823 fprintf (dump_file, "\n");
5825 bool existed;
5826 vec<std::pair<int, int> > &av = m_rpo_avail.get_or_insert (valnum, &existed);
5827 if (!existed)
5829 new (&av) vec<std::pair<int, int> >;
5830 av = vNULL;
5831 av.reserve_exact (2);
5833 av.safe_push (std::make_pair (bb->index, SSA_NAME_VERSION (leader)));
5836 /* Valueization hook for RPO VN plus required state. */
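/* For example (with purely illustrative SSA names): if x_2 valueizes
   to a_1 and a_1 has an available leader in vn_context_bb, that leader
   is returned; a constant value is returned directly; otherwise NAME
   is returned unchanged. */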
5838 tree
5839 rpo_vn_valueize (tree name)
5841 if (TREE_CODE (name) == SSA_NAME)
5843 vn_ssa_aux_t val = VN_INFO (name);
5844 if (val)
5846 tree tem = val->valnum;
5847 if (tem != VN_TOP && tem != name)
5849 if (TREE_CODE (tem) != SSA_NAME)
5850 return tem;
5851 /* For all values we only valueize to an available leader
5852 which means we can use SSA name info without restriction. */
5853 tem = rpo_avail->eliminate_avail (vn_context_bb, tem);
5854 if (tem)
5855 return tem;
5859 return name;
5862 /* Insert on PRED_E predicates derived from CODE OPS being true besides the
5863 inverted condition. */
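/* For example (SSA names purely illustrative): for a_1 < b_2 known
   true on PRED_E this records a_1 != b_2 and a_1 <= b_2 as true and
   a_1 > b_2 and a_1 == b_2 as false, so conditions dominated by PRED_E
   that use any of these forms can fold from the predicated hashtable
   entries. */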
5865 static void
5866 insert_related_predicates_on_edge (enum tree_code code, tree *ops, edge pred_e)
5868 switch (code)
5870 case LT_EXPR:
5871 /* a < b -> a {!,<}= b */
5872 vn_nary_op_insert_pieces_predicated (2, NE_EXPR, boolean_type_node,
5873 ops, boolean_true_node, 0, pred_e);
5874 vn_nary_op_insert_pieces_predicated (2, LE_EXPR, boolean_type_node,
5875 ops, boolean_true_node, 0, pred_e);
5876 /* a < b -> ! a {>,=} b */
5877 vn_nary_op_insert_pieces_predicated (2, GT_EXPR, boolean_type_node,
5878 ops, boolean_false_node, 0, pred_e);
5879 vn_nary_op_insert_pieces_predicated (2, EQ_EXPR, boolean_type_node,
5880 ops, boolean_false_node, 0, pred_e);
5881 break;
5882 case GT_EXPR:
5883 /* a > b -> a {!,>}= b */
5884 vn_nary_op_insert_pieces_predicated (2, NE_EXPR, boolean_type_node,
5885 ops, boolean_true_node, 0, pred_e);
5886 vn_nary_op_insert_pieces_predicated (2, GE_EXPR, boolean_type_node,
5887 ops, boolean_true_node, 0, pred_e);
5888 /* a > b -> ! a {<,=} b */
5889 vn_nary_op_insert_pieces_predicated (2, LT_EXPR, boolean_type_node,
5890 ops, boolean_false_node, 0, pred_e);
5891 vn_nary_op_insert_pieces_predicated (2, EQ_EXPR, boolean_type_node,
5892 ops, boolean_false_node, 0, pred_e);
5893 break;
5894 case EQ_EXPR:
5895 /* a == b -> ! a {<,>} b */
5896 vn_nary_op_insert_pieces_predicated (2, LT_EXPR, boolean_type_node,
5897 ops, boolean_false_node, 0, pred_e);
5898 vn_nary_op_insert_pieces_predicated (2, GT_EXPR, boolean_type_node,
5899 ops, boolean_false_node, 0, pred_e);
5900 break;
5901 case LE_EXPR:
5902 case GE_EXPR:
5903 case NE_EXPR:
5904 /* Nothing besides inverted condition. */
5905 break;
5906 default:;
5910 /* Main stmt worker for RPO VN, process BB. */
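/* In outline: value-number the PHI nodes (eliminating redundant ones
   when ELIMINATE and not iterating), value-number each stmt, compute
   the taken outgoing edge of a final GIMPLE_COND, GIMPLE_SWITCH or
   GIMPLE_GOTO (recording predicated expressions when a condition does
   not fold), mark outgoing edges and destination blocks executable
   accordingly, and substitute into destination PHI arguments when
   eliminating. */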
5912 static unsigned
5913 process_bb (rpo_elim &avail, basic_block bb,
5914 bool bb_visited, bool iterate_phis, bool iterate, bool eliminate,
5915 bool do_region, bitmap exit_bbs)
5917 unsigned todo = 0;
5918 edge_iterator ei;
5919 edge e;
5921 vn_context_bb = bb;
5923 /* If we are in loop-closed SSA preserve this state. This is
5924 relevant when called on regions from outside of FRE/PRE. */
5925 bool lc_phi_nodes = false;
5926 if (loops_state_satisfies_p (LOOP_CLOSED_SSA))
5927 FOR_EACH_EDGE (e, ei, bb->preds)
5928 if (e->src->loop_father != e->dest->loop_father
5929 && flow_loop_nested_p (e->dest->loop_father,
5930 e->src->loop_father))
5932 lc_phi_nodes = true;
5933 break;
5936 /* When we visit a loop header substitute into loop info. */
5937 if (!iterate && eliminate && bb->loop_father->header == bb)
5939 /* Keep fields in sync with substitute_in_loop_info. */
5940 if (bb->loop_father->nb_iterations)
5941 bb->loop_father->nb_iterations
5942 = simplify_replace_tree (bb->loop_father->nb_iterations,
5943 NULL_TREE, NULL_TREE, vn_valueize);
5946 /* Value-number all defs in the basic-block. */
5947 for (gphi_iterator gsi = gsi_start_phis (bb); !gsi_end_p (gsi);
5948 gsi_next (&gsi))
5950 gphi *phi = gsi.phi ();
5951 tree res = PHI_RESULT (phi);
5952 vn_ssa_aux_t res_info = VN_INFO (res);
5953 if (!bb_visited)
5955 gcc_assert (!res_info->visited);
5956 res_info->valnum = VN_TOP;
5957 res_info->visited = true;
5960 /* When not iterating force backedge values to varying. */
5961 visit_stmt (phi, !iterate_phis);
5962 if (virtual_operand_p (res))
5963 continue;
5965 /* Eliminate */
5966 /* The interesting case is gcc.dg/tree-ssa/pr22230.c for correctness
5967 how we handle backedges and availability.
5968 And gcc.dg/tree-ssa/ssa-sccvn-2.c for optimization. */
5969 tree val = res_info->valnum;
5970 if (res != val && !iterate && eliminate)
5972 if (tree leader = avail.eliminate_avail (bb, res))
5974 if (leader != res
5975 /* Preserve loop-closed SSA form. */
5976 && (! lc_phi_nodes
5977 || is_gimple_min_invariant (leader)))
5979 if (dump_file && (dump_flags & TDF_DETAILS))
5981 fprintf (dump_file, "Replaced redundant PHI node "
5982 "defining ");
5983 print_generic_expr (dump_file, res);
5984 fprintf (dump_file, " with ");
5985 print_generic_expr (dump_file, leader);
5986 fprintf (dump_file, "\n");
5988 avail.eliminations++;
5990 if (may_propagate_copy (res, leader))
5992 /* Schedule for removal. */
5993 avail.to_remove.safe_push (phi);
5994 continue;
5996 /* ??? Else generate a copy stmt. */
6000 /* Only make defs available that are not already available. But make
6001 sure loop-closed SSA PHI node defs are picked up for
6002 downstream uses. */
6003 if (lc_phi_nodes
6004 || res == val
6005 || ! avail.eliminate_avail (bb, res))
6006 avail.eliminate_push_avail (bb, res);
6009 /* For empty BBs mark outgoing edges executable. For non-empty BBs
6010 we do this when processing the last stmt as we have to do this
6011 before elimination which otherwise forces GIMPLE_CONDs to
6012 if (1 != 0) style when seeing non-executable edges. */
6013 if (gsi_end_p (gsi_start_bb (bb)))
6015 FOR_EACH_EDGE (e, ei, bb->succs)
6017 if (!(e->flags & EDGE_EXECUTABLE))
6019 if (dump_file && (dump_flags & TDF_DETAILS))
6020 fprintf (dump_file,
6021 "marking outgoing edge %d -> %d executable\n",
6022 e->src->index, e->dest->index);
6023 e->flags |= EDGE_EXECUTABLE;
6024 e->dest->flags |= BB_EXECUTABLE;
6026 else if (!(e->dest->flags & BB_EXECUTABLE))
6028 if (dump_file && (dump_flags & TDF_DETAILS))
6029 fprintf (dump_file,
6030 "marking destination block %d reachable\n",
6031 e->dest->index);
6032 e->dest->flags |= BB_EXECUTABLE;
6036 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
6037 !gsi_end_p (gsi); gsi_next (&gsi))
6039 ssa_op_iter i;
6040 tree op;
6041 if (!bb_visited)
6043 FOR_EACH_SSA_TREE_OPERAND (op, gsi_stmt (gsi), i, SSA_OP_ALL_DEFS)
6045 vn_ssa_aux_t op_info = VN_INFO (op);
6046 gcc_assert (!op_info->visited);
6047 op_info->valnum = VN_TOP;
6048 op_info->visited = true;
6051 /* We somehow have to deal with uses that are not defined
6052 in the processed region. Forcing unvisited uses to
6053 varying here doesn't play well with def-use following during
6054 expression simplification, so we deal with this by checking
6055 the visited flag in SSA_VAL. */
6058 visit_stmt (gsi_stmt (gsi));
6060 gimple *last = gsi_stmt (gsi);
6061 e = NULL;
6062 switch (gimple_code (last))
6064 case GIMPLE_SWITCH:
6065 e = find_taken_edge (bb, vn_valueize (gimple_switch_index
6066 (as_a <gswitch *> (last))));
6067 break;
6068 case GIMPLE_COND:
6070 tree lhs = vn_valueize (gimple_cond_lhs (last));
6071 tree rhs = vn_valueize (gimple_cond_rhs (last));
6072 tree val = gimple_simplify (gimple_cond_code (last),
6073 boolean_type_node, lhs, rhs,
6074 NULL, vn_valueize);
6075 /* If the condition didn't simplify, see if we have recorded
6076 an expression from the edges taken so far. */
6077 if (! val || TREE_CODE (val) != INTEGER_CST)
6079 vn_nary_op_t vnresult;
6080 tree ops[2];
6081 ops[0] = lhs;
6082 ops[1] = rhs;
6083 val = vn_nary_op_lookup_pieces (2, gimple_cond_code (last),
6084 boolean_type_node, ops,
6085 &vnresult);
6086 /* Did we get a predicated value? */
6087 if (! val && vnresult && vnresult->predicated_values)
6089 val = vn_nary_op_get_predicated_value (vnresult, bb);
6090 if (val && dump_file && (dump_flags & TDF_DETAILS))
6092 fprintf (dump_file, "Got predicated value ");
6093 print_generic_expr (dump_file, val, TDF_NONE);
6094 fprintf (dump_file, " for ");
6095 print_gimple_stmt (dump_file, last, TDF_SLIM);
6099 if (val)
6100 e = find_taken_edge (bb, val);
6101 if (! e)
6103 /* If we didn't manage to compute the taken edge then
6104 push predicated expressions for the condition itself
6105 and related conditions to the hashtables. This allows
6106 simplification of redundant conditions which is
6107 important as early cleanup. */
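/* E.g. (illustrative): for if (a_1 > b_2) that does not fold here,
   a_1 > b_2 is recorded as true on the true edge and as false on the
   false edge (plus the related forms via
   insert_related_predicates_on_edge), so an identical or related
   condition dominated by one of those edges folds via the predicated
   lookup above. */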
6108 edge true_e, false_e;
6109 extract_true_false_edges_from_block (bb, &true_e, &false_e);
6110 enum tree_code code = gimple_cond_code (last);
6111 enum tree_code icode
6112 = invert_tree_comparison (code, HONOR_NANS (lhs));
6113 tree ops[2];
6114 ops[0] = lhs;
6115 ops[1] = rhs;
6116 if (do_region
6117 && bitmap_bit_p (exit_bbs, true_e->dest->index))
6118 true_e = NULL;
6119 if (do_region
6120 && bitmap_bit_p (exit_bbs, false_e->dest->index))
6121 false_e = NULL;
6122 if (true_e)
6123 vn_nary_op_insert_pieces_predicated
6124 (2, code, boolean_type_node, ops,
6125 boolean_true_node, 0, true_e);
6126 if (false_e)
6127 vn_nary_op_insert_pieces_predicated
6128 (2, code, boolean_type_node, ops,
6129 boolean_false_node, 0, false_e);
6130 if (icode != ERROR_MARK)
6132 if (true_e)
6133 vn_nary_op_insert_pieces_predicated
6134 (2, icode, boolean_type_node, ops,
6135 boolean_false_node, 0, true_e);
6136 if (false_e)
6137 vn_nary_op_insert_pieces_predicated
6138 (2, icode, boolean_type_node, ops,
6139 boolean_true_node, 0, false_e);
6141 /* Relax for non-integers, inverted condition handled
6142 above. */
6143 if (INTEGRAL_TYPE_P (TREE_TYPE (lhs)))
6145 if (true_e)
6146 insert_related_predicates_on_edge (code, ops, true_e);
6147 if (false_e)
6148 insert_related_predicates_on_edge (icode, ops, false_e);
6151 break;
6153 case GIMPLE_GOTO:
6154 e = find_taken_edge (bb, vn_valueize (gimple_goto_dest (last)));
6155 break;
6156 default:
6157 e = NULL;
6159 if (e)
6161 todo = TODO_cleanup_cfg;
6162 if (!(e->flags & EDGE_EXECUTABLE))
6164 if (dump_file && (dump_flags & TDF_DETAILS))
6165 fprintf (dump_file,
6166 "marking known outgoing %sedge %d -> %d executable\n",
6167 e->flags & EDGE_DFS_BACK ? "back-" : "",
6168 e->src->index, e->dest->index);
6169 e->flags |= EDGE_EXECUTABLE;
6170 e->dest->flags |= BB_EXECUTABLE;
6172 else if (!(e->dest->flags & BB_EXECUTABLE))
6174 if (dump_file && (dump_flags & TDF_DETAILS))
6175 fprintf (dump_file,
6176 "marking destination block %d reachable\n",
6177 e->dest->index);
6178 e->dest->flags |= BB_EXECUTABLE;
6181 else if (gsi_one_before_end_p (gsi))
6183 FOR_EACH_EDGE (e, ei, bb->succs)
6185 if (!(e->flags & EDGE_EXECUTABLE))
6187 if (dump_file && (dump_flags & TDF_DETAILS))
6188 fprintf (dump_file,
6189 "marking outgoing edge %d -> %d executable\n",
6190 e->src->index, e->dest->index);
6191 e->flags |= EDGE_EXECUTABLE;
6192 e->dest->flags |= BB_EXECUTABLE;
6194 else if (!(e->dest->flags & BB_EXECUTABLE))
6196 if (dump_file && (dump_flags & TDF_DETAILS))
6197 fprintf (dump_file,
6198 "marking destination block %d reachable\n",
6199 e->dest->index);
6200 e->dest->flags |= BB_EXECUTABLE;
6205 /* Eliminate. That also pushes to avail. */
6206 if (eliminate && ! iterate)
6207 avail.eliminate_stmt (bb, &gsi);
6208 else
6209 /* If not eliminating, make available all defs that are not
6210 already available. */
6211 FOR_EACH_SSA_TREE_OPERAND (op, gsi_stmt (gsi), i, SSA_OP_DEF)
6212 if (! avail.eliminate_avail (bb, op))
6213 avail.eliminate_push_avail (bb, op);
6216 /* Eliminate in destination PHI arguments. Always substitute in dest
6217 PHIs, even for non-executable edges. This handles region
6218 exits PHIs. */
6219 if (!iterate && eliminate)
6220 FOR_EACH_EDGE (e, ei, bb->succs)
6221 for (gphi_iterator gsi = gsi_start_phis (e->dest);
6222 !gsi_end_p (gsi); gsi_next (&gsi))
6224 gphi *phi = gsi.phi ();
6225 use_operand_p use_p = PHI_ARG_DEF_PTR_FROM_EDGE (phi, e);
6226 tree arg = USE_FROM_PTR (use_p);
6227 if (TREE_CODE (arg) != SSA_NAME
6228 || virtual_operand_p (arg))
6229 continue;
6230 tree sprime;
6231 if (SSA_NAME_IS_DEFAULT_DEF (arg))
6233 sprime = SSA_VAL (arg);
6234 gcc_assert (TREE_CODE (sprime) != SSA_NAME
6235 || SSA_NAME_IS_DEFAULT_DEF (sprime));
6237 else
6238 /* Look for sth available at the definition block of the argument.
6239 This avoids inconsistencies between availability there which
6240 decides if the stmt can be removed and availability at the
6241 use site. The SSA property ensures that things available
6242 at the definition are also available at uses. */
6243 sprime = avail.eliminate_avail (gimple_bb (SSA_NAME_DEF_STMT (arg)),
6244 arg);
6245 if (sprime
6246 && sprime != arg
6247 && may_propagate_copy (arg, sprime))
6248 propagate_value (use_p, sprime);
6251 vn_context_bb = NULL;
6252 return todo;
6255 /* Unwind state per basic-block. */
6257 struct unwind_state
6259 /* Times this block has been visited. */
6260 unsigned visited;
6261 /* Whether to handle this as iteration point or whether to treat
6262 incoming backedge PHI values as varying. */
6263 bool iterate;
6264 /* Maximum RPO index this block is reachable from. */
6265 int max_rpo;
6266 /* Unwind state. */
6267 void *ob_top;
6268 vn_reference_t ref_top;
6269 vn_phi_t phi_top;
6270 vn_nary_op_t nary_top;
6273 /* Unwind the RPO VN state for iteration. */
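/* Roughly: pop all nary, PHI and reference hashtable entries inserted
   since the unwind point in TO was recorded (restoring nary entries
   shadowed by predication), free the corresponding vn_tables_obstack
   memory, and prune availability entries of blocks at RPO index
   RPO_IDX or later from AVAIL. */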
6275 static void
6276 do_unwind (unwind_state *to, int rpo_idx, rpo_elim &avail, int *bb_to_rpo)
6278 gcc_assert (to->iterate);
6279 for (; last_inserted_nary != to->nary_top;
6280 last_inserted_nary = last_inserted_nary->next)
6282 vn_nary_op_t *slot;
6283 slot = valid_info->nary->find_slot_with_hash
6284 (last_inserted_nary, last_inserted_nary->hashcode, NO_INSERT);
6285 /* Predication causes the need to restore previous state. */
6286 if ((*slot)->unwind_to)
6287 *slot = (*slot)->unwind_to;
6288 else
6289 valid_info->nary->clear_slot (slot);
6291 for (; last_inserted_phi != to->phi_top;
6292 last_inserted_phi = last_inserted_phi->next)
6294 vn_phi_t *slot;
6295 slot = valid_info->phis->find_slot_with_hash
6296 (last_inserted_phi, last_inserted_phi->hashcode, NO_INSERT);
6297 valid_info->phis->clear_slot (slot);
6299 for (; last_inserted_ref != to->ref_top;
6300 last_inserted_ref = last_inserted_ref->next)
6302 vn_reference_t *slot;
6303 slot = valid_info->references->find_slot_with_hash
6304 (last_inserted_ref, last_inserted_ref->hashcode, NO_INSERT);
6305 (*slot)->operands.release ();
6306 valid_info->references->clear_slot (slot);
6308 obstack_free (&vn_tables_obstack, to->ob_top);
6310 /* Prune [rpo_idx, ] from avail. */
6311 /* ??? This is O(number-of-values-in-region) which is
6312 O(region-size) rather than O(iteration-piece). */
6313 for (rpo_elim::rpo_avail_t::iterator i
6314 = avail.m_rpo_avail.begin ();
6315 i != avail.m_rpo_avail.end (); ++i)
6317 while (! (*i).second.is_empty ())
6319 if (bb_to_rpo[(*i).second.last ().first] < rpo_idx)
6320 break;
6321 (*i).second.pop ();
6326 /* Do VN on a SEME region specified by ENTRY and EXIT_BBS in FN.
6327 If ITERATE is true then treat backedges optimistically as not
6328 executed and iterate. If ELIMINATE is true then perform
6329 elimination, otherwise leave that to the caller. */
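/* As wired up by the callers in this file: run_rpo_vn uses
   (iterate=true, eliminate=false) on the whole function, the
   region-based entry point below uses (iterate=false, eliminate=true)
   with elimination done during the RPO walk, and the FRE pass enables
   iteration only when optimize > 1. */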
6331 static unsigned
6332 do_rpo_vn (function *fn, edge entry, bitmap exit_bbs,
6333 bool iterate, bool eliminate)
6335 unsigned todo = 0;
6337 /* We currently do not support region-based iteration when
6338 elimination is requested. */
6339 gcc_assert (!entry || !iterate || !eliminate);
6340 /* When iterating we need loop info up-to-date. */
6341 gcc_assert (!iterate || !loops_state_satisfies_p (LOOPS_NEED_FIXUP));
6343 bool do_region = entry != NULL;
6344 if (!do_region)
6346 entry = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (fn));
6347 exit_bbs = BITMAP_ALLOC (NULL);
6348 bitmap_set_bit (exit_bbs, EXIT_BLOCK);
6351 int *rpo = XNEWVEC (int, n_basic_blocks_for_fn (fn) - NUM_FIXED_BLOCKS);
6352 int n = rev_post_order_and_mark_dfs_back_seme
6353 (fn, entry, exit_bbs, !loops_state_satisfies_p (LOOPS_NEED_FIXUP), rpo);
6354 /* rev_post_order_and_mark_dfs_back_seme fills RPO in reverse order. */
6355 for (int i = 0; i < n / 2; ++i)
6356 std::swap (rpo[i], rpo[n-i-1]);
6358 if (!do_region)
6359 BITMAP_FREE (exit_bbs);
6361 int *bb_to_rpo = XNEWVEC (int, last_basic_block_for_fn (fn));
6362 for (int i = 0; i < n; ++i)
6363 bb_to_rpo[rpo[i]] = i;
6365 unwind_state *rpo_state = XNEWVEC (unwind_state, n);
6367 rpo_elim avail (entry->dest);
6368 rpo_avail = &avail;
6370 /* Verify we have no extra entries into the region. */
6371 if (flag_checking && do_region)
6373 auto_bb_flag bb_in_region (fn);
6374 for (int i = 0; i < n; ++i)
6376 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[i]);
6377 bb->flags |= bb_in_region;
6379 /* We can't merge the first two loops because we cannot rely
6380 on EDGE_DFS_BACK for edges not within the region. But if
6381 we decide to always have the bb_in_region flag we can
6382 do the checking during the RPO walk itself (but then it's
6383 also easy to handle MEME conservatively). */
6384 for (int i = 0; i < n; ++i)
6386 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[i]);
6387 edge e;
6388 edge_iterator ei;
6389 FOR_EACH_EDGE (e, ei, bb->preds)
6390 gcc_assert (e == entry || (e->src->flags & bb_in_region));
6392 for (int i = 0; i < n; ++i)
6394 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[i]);
6395 bb->flags &= ~bb_in_region;
6399 /* Create the VN state. For the initial size of the various hashtables
6400 use a heuristic based on region size and number of SSA names. */
6401 unsigned region_size = (((unsigned HOST_WIDE_INT)n * num_ssa_names)
6402 / (n_basic_blocks_for_fn (fn) - NUM_FIXED_BLOCKS));
6403 VN_TOP = create_tmp_var_raw (void_type_node, "vn_top");
6405 vn_ssa_aux_hash = new hash_table <vn_ssa_aux_hasher> (region_size * 2);
6406 gcc_obstack_init (&vn_ssa_aux_obstack);
6408 gcc_obstack_init (&vn_tables_obstack);
6409 gcc_obstack_init (&vn_tables_insert_obstack);
6410 valid_info = XCNEW (struct vn_tables_s);
6411 allocate_vn_table (valid_info, region_size);
6412 last_inserted_ref = NULL;
6413 last_inserted_phi = NULL;
6414 last_inserted_nary = NULL;
6416 vn_valueize = rpo_vn_valueize;
6418 /* Initialize the unwind state and edge/BB executable state. */
6419 bool need_max_rpo_iterate = false;
6420 for (int i = 0; i < n; ++i)
6422 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[i]);
6423 rpo_state[i].visited = 0;
6424 rpo_state[i].max_rpo = i;
6425 bb->flags &= ~BB_EXECUTABLE;
6426 bool has_backedges = false;
6427 edge e;
6428 edge_iterator ei;
6429 FOR_EACH_EDGE (e, ei, bb->preds)
6431 if (e->flags & EDGE_DFS_BACK)
6432 has_backedges = true;
6433 e->flags &= ~EDGE_EXECUTABLE;
6434 if (iterate || e == entry)
6435 continue;
6436 if (bb_to_rpo[e->src->index] > i)
6438 rpo_state[i].max_rpo = MAX (rpo_state[i].max_rpo,
6439 bb_to_rpo[e->src->index]);
6440 need_max_rpo_iterate = true;
6442 else
6443 rpo_state[i].max_rpo
6444 = MAX (rpo_state[i].max_rpo,
6445 rpo_state[bb_to_rpo[e->src->index]].max_rpo);
6447 rpo_state[i].iterate = iterate && has_backedges;
6449 entry->flags |= EDGE_EXECUTABLE;
6450 entry->dest->flags |= BB_EXECUTABLE;
6452 /* When there are irreducible regions the simplistic max_rpo computation
6453 above for the case of backedges doesn't work and we need to iterate
6454 until there are no more changes. */
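/* I.e. the max_rpo of a block with a predecessor later in RPO order
   was seeded from that predecessor's index, not from its (not yet
   final) max_rpo, so the propagation below is repeated until nothing
   changes. */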
6455 unsigned nit = 0;
6456 while (need_max_rpo_iterate)
6458 nit++;
6459 need_max_rpo_iterate = false;
6460 for (int i = 0; i < n; ++i)
6462 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[i]);
6463 edge e;
6464 edge_iterator ei;
6465 FOR_EACH_EDGE (e, ei, bb->preds)
6467 if (e == entry)
6468 continue;
6469 int max_rpo = MAX (rpo_state[i].max_rpo,
6470 rpo_state[bb_to_rpo[e->src->index]].max_rpo);
6471 if (rpo_state[i].max_rpo != max_rpo)
6473 rpo_state[i].max_rpo = max_rpo;
6474 need_max_rpo_iterate = true;
6479 statistics_histogram_event (cfun, "RPO max_rpo iterations", nit);
6481 /* As a heuristic to improve compile-time we handle only the N innermost
6482 loops and the outermost one optimistically. */
6483 if (iterate)
6485 loop_p loop;
6486 unsigned max_depth = PARAM_VALUE (PARAM_RPO_VN_MAX_LOOP_DEPTH);
6487 FOR_EACH_LOOP (loop, LI_ONLY_INNERMOST)
6488 if (loop_depth (loop) > max_depth)
6489 for (unsigned i = 2;
6490 i < loop_depth (loop) - max_depth; ++i)
6492 basic_block header = superloop_at_depth (loop, i)->header;
6493 bool non_latch_backedge = false;
6494 edge e;
6495 edge_iterator ei;
6496 FOR_EACH_EDGE (e, ei, header->preds)
6497 if (e->flags & EDGE_DFS_BACK)
6499 /* There can be a non-latch backedge into the header
6500 which is part of an outer irreducible region. We
6501 cannot avoid iterating this block then. */
6502 if (!dominated_by_p (CDI_DOMINATORS,
6503 e->src, e->dest))
6505 if (dump_file && (dump_flags & TDF_DETAILS))
6506 fprintf (dump_file, "non-latch backedge %d -> %d "
6507 "forces iteration of loop %d\n",
6508 e->src->index, e->dest->index, loop->num);
6509 non_latch_backedge = true;
6511 else
6512 e->flags |= EDGE_EXECUTABLE;
6514 rpo_state[bb_to_rpo[header->index]].iterate = non_latch_backedge;
6518 uint64_t nblk = 0;
6519 int idx = 0;
6520 if (iterate)
6521 /* Go and process all blocks, iterating as necessary. */
6524 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[idx]);
6526 /* If the block has incoming backedges remember unwind state. This
6527 is required even for non-executable blocks since in irreducible
6528 regions we might reach them via the backedge and re-start iterating
6529 from there.
6530 Note we can individually mark blocks with incoming backedges to
6531 not iterate where we then handle PHIs conservatively. We do that
6532 heuristically to reduce compile-time for degenerate cases. */
6533 if (rpo_state[idx].iterate)
6535 rpo_state[idx].ob_top = obstack_alloc (&vn_tables_obstack, 0);
6536 rpo_state[idx].ref_top = last_inserted_ref;
6537 rpo_state[idx].phi_top = last_inserted_phi;
6538 rpo_state[idx].nary_top = last_inserted_nary;
6541 if (!(bb->flags & BB_EXECUTABLE))
6543 if (dump_file && (dump_flags & TDF_DETAILS))
6544 fprintf (dump_file, "Block %d: BB%d found not executable\n",
6545 idx, bb->index);
6546 idx++;
6547 continue;
6550 if (dump_file && (dump_flags & TDF_DETAILS))
6551 fprintf (dump_file, "Processing block %d: BB%d\n", idx, bb->index);
6552 nblk++;
6553 todo |= process_bb (avail, bb,
6554 rpo_state[idx].visited != 0,
6555 rpo_state[idx].iterate,
6556 iterate, eliminate, do_region, exit_bbs);
6557 rpo_state[idx].visited++;
6559 /* Verify if changed values flow over executable outgoing backedges
6560 and those change destination PHI values (that's the thing we
6561 can easily verify). Reduce over all such edges to the farthest
6562 away PHI. */
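/* E.g. (illustrative) for a loop PHI i_1 = PHI <0(preheader),
   i_3(latch)>: if the value of i_3 flowing over the executable latch
   backedge changed, we have to re-iterate from the backedge
   destination; among all such edges we restart from the smallest RPO
   index. */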
6563 int iterate_to = -1;
6564 edge_iterator ei;
6565 edge e;
6566 FOR_EACH_EDGE (e, ei, bb->succs)
6567 if ((e->flags & (EDGE_DFS_BACK|EDGE_EXECUTABLE))
6568 == (EDGE_DFS_BACK|EDGE_EXECUTABLE)
6569 && rpo_state[bb_to_rpo[e->dest->index]].iterate)
6571 int destidx = bb_to_rpo[e->dest->index];
6572 if (!rpo_state[destidx].visited)
6574 if (dump_file && (dump_flags & TDF_DETAILS))
6575 fprintf (dump_file, "Unvisited destination %d\n",
6576 e->dest->index);
6577 if (iterate_to == -1 || destidx < iterate_to)
6578 iterate_to = destidx;
6579 continue;
6581 if (dump_file && (dump_flags & TDF_DETAILS))
6582 fprintf (dump_file, "Looking for changed values of backedge"
6583 " %d->%d destination PHIs\n",
6584 e->src->index, e->dest->index);
6585 vn_context_bb = e->dest;
6586 gphi_iterator gsi;
6587 for (gsi = gsi_start_phis (e->dest);
6588 !gsi_end_p (gsi); gsi_next (&gsi))
6590 bool inserted = false;
6591 /* While we'd ideally just iterate on value changes
6592 we CSE PHIs and do that even across basic-block
6593 boundaries. So even hashtable state changes can
6594 be important (which is roughly equivalent to
6595 PHI argument value changes). To avoid excessive
6596 iteration because of that we use GF_PLF_1 to track
6597 whether a PHI was CSEd to. */
6598 bool phival_changed;
6599 if ((phival_changed = visit_phi (gsi.phi (),
6600 &inserted, false))
6601 || (inserted && gimple_plf (gsi.phi (), GF_PLF_1)))
6603 if (!phival_changed
6604 && dump_file && (dump_flags & TDF_DETAILS))
6605 fprintf (dump_file, "PHI was CSEd and hashtable "
6606 "state (changed)\n");
6607 if (iterate_to == -1 || destidx < iterate_to)
6608 iterate_to = destidx;
6609 break;
6612 vn_context_bb = NULL;
6614 if (iterate_to != -1)
6616 do_unwind (&rpo_state[iterate_to], iterate_to, avail, bb_to_rpo);
6617 idx = iterate_to;
6618 if (dump_file && (dump_flags & TDF_DETAILS))
6619 fprintf (dump_file, "Iterating to %d BB%d\n",
6620 iterate_to, rpo[iterate_to]);
6621 continue;
6624 idx++;
6626 while (idx < n);
6628 else /* !iterate */
6630 /* Process all blocks greedily with a worklist that enforces RPO
6631 processing of reachable blocks. */
6632 auto_bitmap worklist;
6633 bitmap_set_bit (worklist, 0);
6634 while (!bitmap_empty_p (worklist))
6636 int idx = bitmap_first_set_bit (worklist);
6637 bitmap_clear_bit (worklist, idx);
6638 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[idx]);
6639 gcc_assert ((bb->flags & BB_EXECUTABLE)
6640 && !rpo_state[idx].visited);
6642 if (dump_file && (dump_flags & TDF_DETAILS))
6643 fprintf (dump_file, "Processing block %d: BB%d\n", idx, bb->index);
6645 /* When we run into predecessor edges whose executable state we
6646 cannot trust, mark them executable so PHI processing will
6647 be conservative.
6648 ??? Do we need to force arguments flowing over that edge
6649 to be varying or will they even always be? */
6650 edge_iterator ei;
6651 edge e;
6652 FOR_EACH_EDGE (e, ei, bb->preds)
6653 if (!(e->flags & EDGE_EXECUTABLE)
6654 && !rpo_state[bb_to_rpo[e->src->index]].visited
6655 && rpo_state[bb_to_rpo[e->src->index]].max_rpo >= (int)idx)
6657 if (dump_file && (dump_flags & TDF_DETAILS))
6658 fprintf (dump_file, "Cannot trust state of predecessor "
6659 "edge %d -> %d, marking executable\n",
6660 e->src->index, e->dest->index);
6661 e->flags |= EDGE_EXECUTABLE;
6664 nblk++;
6665 todo |= process_bb (avail, bb, false, false, false, eliminate,
6666 do_region, exit_bbs);
6667 rpo_state[idx].visited++;
6669 FOR_EACH_EDGE (e, ei, bb->succs)
6670 if ((e->flags & EDGE_EXECUTABLE)
6671 && e->dest->index != EXIT_BLOCK
6672 && (!do_region || !bitmap_bit_p (exit_bbs, e->dest->index))
6673 && !rpo_state[bb_to_rpo[e->dest->index]].visited)
6674 bitmap_set_bit (worklist, bb_to_rpo[e->dest->index]);
6678 /* Gather statistics, reported when statistics counters or a dump file are active. */
6679 int nex = 0;
6680 unsigned max_visited = 1;
6681 for (int i = 0; i < n; ++i)
6683 basic_block bb = BASIC_BLOCK_FOR_FN (fn, rpo[i]);
6684 if (bb->flags & BB_EXECUTABLE)
6685 nex++;
6686 statistics_histogram_event (cfun, "RPO block visited times",
6687 rpo_state[i].visited);
6688 if (rpo_state[i].visited > max_visited)
6689 max_visited = rpo_state[i].visited;
6691 unsigned nvalues = 0, navail = 0;
6692 for (rpo_elim::rpo_avail_t::iterator i = avail.m_rpo_avail.begin ();
6693 i != avail.m_rpo_avail.end (); ++i)
6695 nvalues++;
6696 navail += (*i).second.length ();
6698 statistics_counter_event (cfun, "RPO blocks", n);
6699 statistics_counter_event (cfun, "RPO blocks visited", nblk);
6700 statistics_counter_event (cfun, "RPO blocks executable", nex);
6701 statistics_histogram_event (cfun, "RPO iterations", 10*nblk / nex);
6702 statistics_histogram_event (cfun, "RPO num values", nvalues);
6703 statistics_histogram_event (cfun, "RPO num avail", navail);
6704 statistics_histogram_event (cfun, "RPO num lattice",
6705 vn_ssa_aux_hash->elements ());
6706 if (dump_file && (dump_flags & (TDF_DETAILS|TDF_STATS)))
6708 fprintf (dump_file, "RPO iteration over %d blocks visited %" PRIu64
6709 " blocks in total discovering %d executable blocks iterating "
6710 "%d.%d times, a block was visited max. %u times\n",
6711 n, nblk, nex,
6712 (int)((10*nblk / nex)/10), (int)((10*nblk / nex)%10),
6713 max_visited);
6714 fprintf (dump_file, "RPO tracked %d values available at %d locations "
6715 "and %" PRIu64 " lattice elements\n",
6716 nvalues, navail, (uint64_t) vn_ssa_aux_hash->elements ());
6719 if (eliminate)
6721 /* When !iterate we already performed elimination during the RPO
6722 walk. */
6723 if (iterate)
6725 /* Elimination for region-based VN needs to be done within the
6726 RPO walk. */
6727 gcc_assert (! do_region);
6728 /* Note we can't use avail.walk here because that gets confused
6729 by the existing availability and it will be less efficient
6730 as well. */
6731 todo |= eliminate_with_rpo_vn (NULL);
6733 else
6734 todo |= avail.eliminate_cleanup (do_region);
6737 vn_valueize = NULL;
6738 rpo_avail = NULL;
6740 XDELETEVEC (bb_to_rpo);
6741 XDELETEVEC (rpo);
6742 XDELETEVEC (rpo_state);
6744 return todo;
6747 /* Region-based entry for RPO VN. Performs value-numbering and elimination
6748 on the SEME region specified by ENTRY and EXIT_BBS. */
6750 unsigned
6751 do_rpo_vn (function *fn, edge entry, bitmap exit_bbs)
6753 default_vn_walk_kind = VN_WALKREWRITE;
6754 unsigned todo = do_rpo_vn (fn, entry, exit_bbs, false, true);
6755 free_rpo_vn ();
6756 return todo;
6760 namespace {
6762 const pass_data pass_data_fre =
6764 GIMPLE_PASS, /* type */
6765 "fre", /* name */
6766 OPTGROUP_NONE, /* optinfo_flags */
6767 TV_TREE_FRE, /* tv_id */
6768 ( PROP_cfg | PROP_ssa ), /* properties_required */
6769 0, /* properties_provided */
6770 0, /* properties_destroyed */
6771 0, /* todo_flags_start */
6772 0, /* todo_flags_finish */
6775 class pass_fre : public gimple_opt_pass
6777 public:
6778 pass_fre (gcc::context *ctxt)
6779 : gimple_opt_pass (pass_data_fre, ctxt)
6782 /* opt_pass methods: */
6783 opt_pass * clone () { return new pass_fre (m_ctxt); }
6784 virtual bool gate (function *) { return flag_tree_fre != 0; }
6785 virtual unsigned int execute (function *);
6787 }; // class pass_fre
6789 unsigned int
6790 pass_fre::execute (function *fun)
6792 unsigned todo = 0;
6794 /* At -O[1g] use the cheap non-iterating mode. */
6795 calculate_dominance_info (CDI_DOMINATORS);
6796 if (optimize > 1)
6797 loop_optimizer_init (AVOID_CFG_MODIFICATIONS);
6799 default_vn_walk_kind = VN_WALKREWRITE;
6800 todo = do_rpo_vn (fun, NULL, NULL, optimize > 1, true);
6801 free_rpo_vn ();
6803 if (optimize > 1)
6804 loop_optimizer_finalize ();
6806 return todo;
6809 } // anon namespace
6811 gimple_opt_pass *
6812 make_pass_fre (gcc::context *ctxt)
6814 return new pass_fre (ctxt);
6817 #undef BB_EXECUTABLE