/* gcc/tree-ssa-forwprop.c (from official-gcc.git).  */
1 /* Forward propagation of expressions for single use variables.
2 Copyright (C) 2004-2014 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
24 #include "tree.h"
25 #include "stor-layout.h"
26 #include "tm_p.h"
27 #include "predict.h"
28 #include "vec.h"
29 #include "hashtab.h"
30 #include "hash-set.h"
31 #include "machmode.h"
32 #include "hard-reg-set.h"
33 #include "input.h"
34 #include "function.h"
35 #include "dominance.h"
36 #include "cfg.h"
37 #include "basic-block.h"
38 #include "gimple-pretty-print.h"
39 #include "tree-ssa-alias.h"
40 #include "internal-fn.h"
41 #include "gimple-fold.h"
42 #include "tree-eh.h"
43 #include "gimple-expr.h"
44 #include "is-a.h"
45 #include "gimple.h"
46 #include "gimplify.h"
47 #include "gimple-iterator.h"
48 #include "gimplify-me.h"
49 #include "gimple-ssa.h"
50 #include "tree-cfg.h"
51 #include "tree-phinodes.h"
52 #include "ssa-iterators.h"
53 #include "stringpool.h"
54 #include "tree-ssanames.h"
55 #include "expr.h"
56 #include "tree-dfa.h"
57 #include "tree-pass.h"
58 #include "langhooks.h"
59 #include "flags.h"
60 #include "diagnostic.h"
62 #include "cfgloop.h"
63 #include "insn-codes.h"
64 #include "optabs.h"
65 #include "tree-ssa-propagate.h"
66 #include "tree-ssa-dom.h"
67 #include "builtins.h"
68 #include "tree-cfgcleanup.h"
69 #include "tree-into-ssa.h"
70 #include "cfganal.h"
72 /* This pass propagates the RHS of assignment statements into use
73 sites of the LHS of the assignment. It's basically a specialized
74 form of tree combination. It is hoped all of this can disappear
75 when we have a generalized tree combiner.
77 One class of common cases we handle is forward propagating a single use
78 variable into a COND_EXPR.
80 bb0:
81 x = a COND b;
82 if (x) goto ... else goto ...
84 Will be transformed into:
86 bb0:
87 if (a COND b) goto ... else goto ...
89 Similarly for the tests (x == 0), (x != 0), (x == 1) and (x != 1).
91 Or (assuming c1 and c2 are constants):
93 bb0:
94 x = a + c1;
95 if (x EQ/NEQ c2) goto ... else goto ...
97 Will be transformed into:
99 bb0:
100 if (a EQ/NEQ (c2 - c1)) goto ... else goto ...
102 Similarly for x = a - c1.
106 bb0:
107 x = !a
108 if (x) goto ... else goto ...
110 Will be transformed into:
112 bb0:
113 if (a == 0) goto ... else goto ...
115 Similarly for the tests (x == 0), (x != 0), (x == 1) and (x != 1).
116 For these cases, we propagate A into all COND_EXPRs that use X
117 (possibly more than one).
121 bb0:
122 x = (typecast) a
123 if (x) goto ... else goto ...
125 Will be transformed into:
127 bb0:
128 if (a != 0) goto ... else goto ...
130 (Assuming a is an integral type and x is a boolean or x is an
131 integral and a is a boolean.)
133 Similarly for the tests (x == 0), (x != 0), (x == 1) and (x != 1).
134 For these cases, we propagate A into all COND_EXPRs that use X
135 (possibly more than one).
137 In addition to eliminating the variable and the statement which assigns
138 a value to the variable, we may be able to later thread the jump without
139 adding insane complexity in the dominator optimizer.
141 Also note these transformations can cascade. We handle this by having
142 a worklist of COND_EXPR statements to examine. As we make a change to
143 a statement, we put it back on the worklist to examine on the next
144 iteration of the main loop.
146 A second class of propagation opportunities arises for ADDR_EXPR
147 nodes.
149 ptr = &x->y->z;
150 res = *ptr;
152 Will get turned into
154 res = x->y->z;
157 ptr = (type1*)&type2var;
158 res = *ptr
160 Will get turned into (if type1 and type2 are the same size
161 and neither has volatile on it):
162 res = VIEW_CONVERT_EXPR<type1>(type2var)
166 ptr = &x[0];
167 ptr2 = ptr + <constant>;
169 Will get turned into
171 ptr2 = &x[constant/elementsize];
175 ptr = &x[0];
176 offset = index * element_size;
177 offset_p = (pointer) offset;
178 ptr2 = ptr + offset_p
180 Will get turned into:
182 ptr2 = &x[index];
185 ssa = (int) decl
186 res = ssa & 1
188 Provided that decl has known alignment >= 2, this will get turned into
190 res = 0
192 We also propagate casts into SWITCH_EXPR and COND_EXPR conditions to
193 allow us to remove the cast, and we propagate a {NOT_EXPR,NEG_EXPR} into
194 a subsequent {NOT_EXPR,NEG_EXPR}.
196 This will (of course) be extended as other needs arise. */
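/* A concrete instance of the array-indexing recovery above (an
   illustrative sketch, with hypothetical names): given

     int x[8];
     ptr = &x[0];
     ptr2 = ptr + 8;

   a target with 4-byte int sees the addition rewritten to

     ptr2 = &x[2];

   turning the pointer arithmetic back into array indexing.  */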
198 static bool forward_propagate_addr_expr (tree, tree, bool);
200 /* Set to true if we delete dead edges during the optimization. */
201 static bool cfg_changed;
203 static tree rhs_to_tree (tree type, gimple stmt);
205 static bitmap to_purge;
207 /* Const-and-copy lattice. */
208 static vec<tree> lattice;
210 /* Set the lattice entry for NAME to VAL. */
211 static void
212 fwprop_set_lattice_val (tree name, tree val)
214 if (TREE_CODE (name) == SSA_NAME)
216 if (SSA_NAME_VERSION (name) >= lattice.length ())
218 lattice.reserve (num_ssa_names - lattice.length ());
219 lattice.quick_grow_cleared (num_ssa_names);
221 lattice[SSA_NAME_VERSION (name)] = val;
225 /* Invalidate the lattice entry for NAME, done when releasing SSA names. */
226 static void
227 fwprop_invalidate_lattice (tree name)
229 if (name
230 && TREE_CODE (name) == SSA_NAME
231 && SSA_NAME_VERSION (name) < lattice.length ())
232 lattice[SSA_NAME_VERSION (name)] = NULL_TREE;
236 /* Get the statement we can propagate from into NAME skipping
237 trivial copies. Returns the statement which defines the
238 propagation source, or NULL if there is no such statement.
239 If SINGLE_USE_ONLY is set considers only sources which have
240 a single use chain up to NAME. If SINGLE_USE_P is non-null,
241 it is set to whether the chain to NAME is a single use chain
242 or not. SINGLE_USE_P is not written to if SINGLE_USE_ONLY is set. */
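/* For illustration (hypothetical SSA names): with

     tmp_1 = a_2 < b_3;
     x_4 = tmp_1;

   a query for x_4 skips the trivial copy and returns the statement
   defining tmp_1.  With SINGLE_USE_ONLY set it only succeeds when the
   whole chain up to x_4 consists of single-use names.  */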
244 static gimple
245 get_prop_source_stmt (tree name, bool single_use_only, bool *single_use_p)
247 bool single_use = true;
249 do {
250 gimple def_stmt = SSA_NAME_DEF_STMT (name);
252 if (!has_single_use (name))
254 single_use = false;
255 if (single_use_only)
256 return NULL;
259 /* If name is defined by a PHI node or is the default def, bail out. */
260 if (!is_gimple_assign (def_stmt))
261 return NULL;
263 /* If def_stmt is a simple copy, continue looking. */
264 if (gimple_assign_rhs_code (def_stmt) == SSA_NAME)
265 name = gimple_assign_rhs1 (def_stmt);
266 else
268 if (!single_use_only && single_use_p)
269 *single_use_p = single_use;
271 return def_stmt;
273 } while (1);
276 /* Checks if the destination ssa name in DEF_STMT can be used as
277 propagation source. Returns true if so, otherwise false. */
279 static bool
280 can_propagate_from (gimple def_stmt)
282 gcc_assert (is_gimple_assign (def_stmt));
284 /* If the rhs has side-effects we cannot propagate from it. */
285 if (gimple_has_volatile_ops (def_stmt))
286 return false;
288 /* If the rhs is a load we cannot propagate from it. */
289 if (TREE_CODE_CLASS (gimple_assign_rhs_code (def_stmt)) == tcc_reference
290 || TREE_CODE_CLASS (gimple_assign_rhs_code (def_stmt)) == tcc_declaration)
291 return false;
293 /* Constants can always be propagated. */
294 if (gimple_assign_single_p (def_stmt)
295 && is_gimple_min_invariant (gimple_assign_rhs1 (def_stmt)))
296 return true;
298 /* We cannot propagate ssa names that occur in abnormal phi nodes. */
299 if (stmt_references_abnormal_ssa_name (def_stmt))
300 return false;
302 /* If the definition is a conversion of a pointer to a function type,
303 then we cannot apply optimizations, as some targets require
304 function pointers to be canonicalized and in this case this
305 optimization could eliminate a necessary canonicalization. */
306 if (CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (def_stmt)))
308 tree rhs = gimple_assign_rhs1 (def_stmt);
309 if (POINTER_TYPE_P (TREE_TYPE (rhs))
310 && TREE_CODE (TREE_TYPE (TREE_TYPE (rhs))) == FUNCTION_TYPE)
311 return false;
314 return true;
317 /* Remove a chain of dead statements starting at the definition of
318 NAME. The chain is linked via the first operand of the defining statements.
319 If NAME was replaced in its only use then this function can be used
320 to clean up dead stmts. The function handles already released SSA
321 names gracefully.
322 Returns true if cleanup-cfg has to run. */
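/* For illustration (hypothetical SSA names): if t_3 in

     t_2 = a_1 + 1;
     t_3 = t_2 + 1;

   was just replaced in its only use, calling this function on t_3
   removes both now-dead statements, following the chain through the
   first operand of each definition.  */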
324 static bool
325 remove_prop_source_from_use (tree name)
327 gimple_stmt_iterator gsi;
328 gimple stmt;
329 bool cfg_changed = false;
331 do {
332 basic_block bb;
334 if (SSA_NAME_IN_FREE_LIST (name)
335 || SSA_NAME_IS_DEFAULT_DEF (name)
336 || !has_zero_uses (name))
337 return cfg_changed;
339 stmt = SSA_NAME_DEF_STMT (name);
340 if (gimple_code (stmt) == GIMPLE_PHI
341 || gimple_has_side_effects (stmt))
342 return cfg_changed;
344 bb = gimple_bb (stmt);
345 gsi = gsi_for_stmt (stmt);
346 unlink_stmt_vdef (stmt);
347 if (gsi_remove (&gsi, true))
348 bitmap_set_bit (to_purge, bb->index);
349 fwprop_invalidate_lattice (gimple_get_lhs (stmt));
350 release_defs (stmt);
352 name = is_gimple_assign (stmt) ? gimple_assign_rhs1 (stmt) : NULL_TREE;
353 } while (name && TREE_CODE (name) == SSA_NAME);
355 return cfg_changed;
358 /* Return the rhs of a gassign *STMT in the form of a single tree,
359 converted to type TYPE.
361 This should disappear, but is needed so we can combine expressions and use
362 the fold() interfaces. Long term, we need to develop folding and combine
363 routines that deal with GIMPLE exclusively. */
365 static tree
366 rhs_to_tree (tree type, gimple stmt)
368 location_t loc = gimple_location (stmt);
369 enum tree_code code = gimple_assign_rhs_code (stmt);
370 if (get_gimple_rhs_class (code) == GIMPLE_TERNARY_RHS)
371 return fold_build3_loc (loc, code, type, gimple_assign_rhs1 (stmt),
372 gimple_assign_rhs2 (stmt),
373 gimple_assign_rhs3 (stmt));
374 else if (get_gimple_rhs_class (code) == GIMPLE_BINARY_RHS)
375 return fold_build2_loc (loc, code, type, gimple_assign_rhs1 (stmt),
376 gimple_assign_rhs2 (stmt));
377 else if (get_gimple_rhs_class (code) == GIMPLE_UNARY_RHS)
378 return build1 (code, type, gimple_assign_rhs1 (stmt));
379 else if (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS)
380 return gimple_assign_rhs1 (stmt);
381 else
382 gcc_unreachable ();
385 /* Combine OP0 CODE OP1 in the context of a COND_EXPR. Returns
386 the folded result in a form suitable for COND_EXPR_COND or
387 NULL_TREE if there is no suitable simplified form. If
388 INVARIANT_ONLY is true only gimple_min_invariant results are
389 considered simplified. */
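/* For illustration (hypothetical names): with CODE being EQ_EXPR, OP0
   the rematerialized tree a_1 + 1 and OP1 the constant 3, fold yields
   a_1 == 2, a valid COND_EXPR condition.  With INVARIANT_ONLY set the
   same call returns NULL_TREE, since a_1 == 2 is not a
   gimple_min_invariant.  */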
391 static tree
392 combine_cond_expr_cond (gimple stmt, enum tree_code code, tree type,
393 tree op0, tree op1, bool invariant_only)
395 tree t;
397 gcc_assert (TREE_CODE_CLASS (code) == tcc_comparison);
399 fold_defer_overflow_warnings ();
400 t = fold_binary_loc (gimple_location (stmt), code, type, op0, op1);
401 if (!t)
403 fold_undefer_overflow_warnings (false, NULL, 0);
404 return NULL_TREE;
407 /* Require that we got a boolean type out if we put one in. */
408 gcc_assert (TREE_CODE (TREE_TYPE (t)) == TREE_CODE (type));
410 /* Canonicalize the combined condition for use in a COND_EXPR. */
411 t = canonicalize_cond_expr_cond (t);
413 /* Bail out if we required an invariant but didn't get one. */
414 if (!t || (invariant_only && !is_gimple_min_invariant (t)))
416 fold_undefer_overflow_warnings (false, NULL, 0);
417 return NULL_TREE;
420 fold_undefer_overflow_warnings (!gimple_no_warning_p (stmt), stmt, 0);
422 return t;
425 /* Combine the comparison OP0 CODE OP1 of STMT with the defining statements
426 of its operands. Return a new comparison tree or NULL_TREE if there
427 were no simplifying combines. */
429 static tree
430 forward_propagate_into_comparison_1 (gimple stmt,
431 enum tree_code code, tree type,
432 tree op0, tree op1)
434 tree tmp = NULL_TREE;
435 tree rhs0 = NULL_TREE, rhs1 = NULL_TREE;
436 bool single_use0_p = false, single_use1_p = false;
438 /* For comparisons, try the first operand first, as that is likely to
439 simplify comparisons against constants. */
440 if (TREE_CODE (op0) == SSA_NAME)
442 gimple def_stmt = get_prop_source_stmt (op0, false, &single_use0_p);
443 if (def_stmt && can_propagate_from (def_stmt))
445 rhs0 = rhs_to_tree (TREE_TYPE (op1), def_stmt);
446 tmp = combine_cond_expr_cond (stmt, code, type,
447 rhs0, op1, !single_use0_p);
448 if (tmp)
449 return tmp;
453 /* If that wasn't successful, try the second operand. */
454 if (TREE_CODE (op1) == SSA_NAME)
456 gimple def_stmt = get_prop_source_stmt (op1, false, &single_use1_p);
457 if (def_stmt && can_propagate_from (def_stmt))
459 rhs1 = rhs_to_tree (TREE_TYPE (op0), def_stmt);
460 tmp = combine_cond_expr_cond (stmt, code, type,
461 op0, rhs1, !single_use1_p);
462 if (tmp)
463 return tmp;
467 /* If that wasn't successful either, try both operands. */
468 if (rhs0 != NULL_TREE
469 && rhs1 != NULL_TREE)
470 tmp = combine_cond_expr_cond (stmt, code, type,
471 rhs0, rhs1,
472 !(single_use0_p && single_use1_p));
474 return tmp;
477 /* Propagate from the ssa name definition statements of the operands
478 of the comparison assignment at *GSI into it, if that simplifies it.
479 Returns 1 if the stmt was modified and 2 if the CFG needs cleanup,
480 otherwise returns 0. */
482 static int
483 forward_propagate_into_comparison (gimple_stmt_iterator *gsi)
485 gimple stmt = gsi_stmt (*gsi);
486 tree tmp;
487 bool cfg_changed = false;
488 tree type = TREE_TYPE (gimple_assign_lhs (stmt));
489 tree rhs1 = gimple_assign_rhs1 (stmt);
490 tree rhs2 = gimple_assign_rhs2 (stmt);
492 /* Combine the comparison with defining statements. */
493 tmp = forward_propagate_into_comparison_1 (stmt,
494 gimple_assign_rhs_code (stmt),
495 type, rhs1, rhs2);
496 if (tmp && useless_type_conversion_p (type, TREE_TYPE (tmp)))
498 gimple_assign_set_rhs_from_tree (gsi, tmp);
499 fold_stmt (gsi);
500 update_stmt (gsi_stmt (*gsi));
502 if (TREE_CODE (rhs1) == SSA_NAME)
503 cfg_changed |= remove_prop_source_from_use (rhs1);
504 if (TREE_CODE (rhs2) == SSA_NAME)
505 cfg_changed |= remove_prop_source_from_use (rhs2);
506 return cfg_changed ? 2 : 1;
509 return 0;
512 /* Propagate from the ssa name definition statements of the condition
513 in GIMPLE_COND statement STMT into the conditional if that simplifies it.
514 Returns zero if no statement was changed, one if there were
515 changes and two if cfg_cleanup needs to run.
517 This must be kept in sync with forward_propagate_into_cond. */
519 static int
520 forward_propagate_into_gimple_cond (gcond *stmt)
522 tree tmp;
523 enum tree_code code = gimple_cond_code (stmt);
524 bool cfg_changed = false;
525 tree rhs1 = gimple_cond_lhs (stmt);
526 tree rhs2 = gimple_cond_rhs (stmt);
528 /* We can do tree combining on SSA_NAME and comparison expressions. */
529 if (TREE_CODE_CLASS (gimple_cond_code (stmt)) != tcc_comparison)
530 return 0;
532 tmp = forward_propagate_into_comparison_1 (stmt, code,
533 boolean_type_node,
534 rhs1, rhs2);
535 if (tmp)
537 if (dump_file)
539 fprintf (dump_file, " Replaced '");
540 print_gimple_expr (dump_file, stmt, 0, 0);
541 fprintf (dump_file, "' with '");
542 print_generic_expr (dump_file, tmp, 0);
543 fprintf (dump_file, "'\n");
546 gimple_cond_set_condition_from_tree (stmt, unshare_expr (tmp));
547 update_stmt (stmt);
549 if (TREE_CODE (rhs1) == SSA_NAME)
550 cfg_changed |= remove_prop_source_from_use (rhs1);
551 if (TREE_CODE (rhs2) == SSA_NAME)
552 cfg_changed |= remove_prop_source_from_use (rhs2);
553 return (cfg_changed || is_gimple_min_invariant (tmp)) ? 2 : 1;
556 /* Canonicalize _Bool == 0 and _Bool != 1 to _Bool != 0 by swapping edges. */
557 if ((TREE_CODE (TREE_TYPE (rhs1)) == BOOLEAN_TYPE
558 || (INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
559 && TYPE_PRECISION (TREE_TYPE (rhs1)) == 1))
560 && ((code == EQ_EXPR
561 && integer_zerop (rhs2))
562 || (code == NE_EXPR
563 && integer_onep (rhs2))))
565 basic_block bb = gimple_bb (stmt);
566 gimple_cond_set_code (stmt, NE_EXPR);
567 gimple_cond_set_rhs (stmt, build_zero_cst (TREE_TYPE (rhs1)));
568 EDGE_SUCC (bb, 0)->flags ^= (EDGE_TRUE_VALUE|EDGE_FALSE_VALUE);
569 EDGE_SUCC (bb, 1)->flags ^= (EDGE_TRUE_VALUE|EDGE_FALSE_VALUE);
570 return 1;
573 return 0;
577 /* Propagate from the ssa name definition statements of COND_EXPR
578 in the rhs of statement STMT into the conditional if that simplifies it.
579 Returns true if the stmt was changed. */
581 static bool
582 forward_propagate_into_cond (gimple_stmt_iterator *gsi_p)
584 gimple stmt = gsi_stmt (*gsi_p);
585 tree tmp = NULL_TREE;
586 tree cond = gimple_assign_rhs1 (stmt);
587 enum tree_code code = gimple_assign_rhs_code (stmt);
589 /* We can do tree combining on SSA_NAME and comparison expressions. */
590 if (COMPARISON_CLASS_P (cond))
591 tmp = forward_propagate_into_comparison_1 (stmt, TREE_CODE (cond),
592 TREE_TYPE (cond),
593 TREE_OPERAND (cond, 0),
594 TREE_OPERAND (cond, 1));
595 else if (TREE_CODE (cond) == SSA_NAME)
597 enum tree_code def_code;
598 tree name = cond;
599 gimple def_stmt = get_prop_source_stmt (name, true, NULL);
600 if (!def_stmt || !can_propagate_from (def_stmt))
601 return false;
603 def_code = gimple_assign_rhs_code (def_stmt);
604 if (TREE_CODE_CLASS (def_code) == tcc_comparison)
605 tmp = fold_build2_loc (gimple_location (def_stmt),
606 def_code,
607 TREE_TYPE (cond),
608 gimple_assign_rhs1 (def_stmt),
609 gimple_assign_rhs2 (def_stmt));
612 if (tmp
613 && is_gimple_condexpr (tmp))
615 if (dump_file)
617 fprintf (dump_file, " Replaced '");
618 print_generic_expr (dump_file, cond, 0);
619 fprintf (dump_file, "' with '");
620 print_generic_expr (dump_file, tmp, 0);
621 fprintf (dump_file, "'\n");
624 if ((code == VEC_COND_EXPR) ? integer_all_onesp (tmp)
625 : integer_onep (tmp))
626 gimple_assign_set_rhs_from_tree (gsi_p, gimple_assign_rhs2 (stmt));
627 else if (integer_zerop (tmp))
628 gimple_assign_set_rhs_from_tree (gsi_p, gimple_assign_rhs3 (stmt));
629 else
630 gimple_assign_set_rhs1 (stmt, unshare_expr (tmp));
631 stmt = gsi_stmt (*gsi_p);
632 update_stmt (stmt);
634 return true;
637 return false;
640 /* We've just substituted an ADDR_EXPR into stmt. Update all the
641 relevant data structures to match. */
643 static void
644 tidy_after_forward_propagate_addr (gimple stmt)
646 /* We may have turned a trapping insn into a non-trapping insn. */
647 if (maybe_clean_or_replace_eh_stmt (stmt, stmt))
648 bitmap_set_bit (to_purge, gimple_bb (stmt)->index);
650 if (TREE_CODE (gimple_assign_rhs1 (stmt)) == ADDR_EXPR)
651 recompute_tree_invariant_for_addr_expr (gimple_assign_rhs1 (stmt));
654 /* NAME is a SSA_NAME representing DEF_RHS which is of the form
655 ADDR_EXPR <whatever>.
657 Try to forward propagate the ADDR_EXPR into the use USE_STMT.
658 Often this will allow for removal of an ADDR_EXPR and INDIRECT_REF
659 node or for recovery of array indexing from pointer arithmetic.
661 Return true if the propagation was successful (the propagation may
662 not be totally successful, yet things may still have changed). */
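/* For illustration (hypothetical names): with DEF_RHS being &a_2->f
   and the use

     x_3 = *ptr_1;

   the dereference is folded away and the use becomes

     x_3 = a_2->f;  */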
664 static bool
665 forward_propagate_addr_expr_1 (tree name, tree def_rhs,
666 gimple_stmt_iterator *use_stmt_gsi,
667 bool single_use_p)
669 tree lhs, rhs, rhs2, array_ref;
670 gimple use_stmt = gsi_stmt (*use_stmt_gsi);
671 enum tree_code rhs_code;
672 bool res = true;
674 gcc_assert (TREE_CODE (def_rhs) == ADDR_EXPR);
676 lhs = gimple_assign_lhs (use_stmt);
677 rhs_code = gimple_assign_rhs_code (use_stmt);
678 rhs = gimple_assign_rhs1 (use_stmt);
680 /* Do not perform copy-propagation but recurse through copy chains. */
681 if (TREE_CODE (lhs) == SSA_NAME
682 && rhs_code == SSA_NAME)
683 return forward_propagate_addr_expr (lhs, def_rhs, single_use_p);
685 /* The use statement could be a conversion. Recurse to the uses of the
686 lhs as copyprop does not copy through pointer-to-integer-to-pointer
687 conversions and FRE does not catch all cases either.
688 Treat the case of a single-use name and
689 a conversion to def_rhs type separately, though.
690 if (TREE_CODE (lhs) == SSA_NAME
691 && CONVERT_EXPR_CODE_P (rhs_code))
693 /* If there is a point in a conversion chain where the types match,
694 so we can remove a conversion, re-materialize the address here
695 and stop. */
696 if (single_use_p
697 && useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (def_rhs)))
699 gimple_assign_set_rhs1 (use_stmt, unshare_expr (def_rhs));
700 gimple_assign_set_rhs_code (use_stmt, TREE_CODE (def_rhs));
701 return true;
704 /* Else recurse if the conversion preserves the address value. */
705 if ((INTEGRAL_TYPE_P (TREE_TYPE (lhs))
706 || POINTER_TYPE_P (TREE_TYPE (lhs)))
707 && (TYPE_PRECISION (TREE_TYPE (lhs))
708 >= TYPE_PRECISION (TREE_TYPE (def_rhs))))
709 return forward_propagate_addr_expr (lhs, def_rhs, single_use_p);
711 return false;
714 /* From this point on this isn't a conversion chain, so we can only
715 propagate into compatible pointer contexts. */
716 if (!types_compatible_p (TREE_TYPE (name), TREE_TYPE (def_rhs)))
717 return false;
719 /* Propagate through constant pointer adjustments. */
720 if (TREE_CODE (lhs) == SSA_NAME
721 && rhs_code == POINTER_PLUS_EXPR
722 && rhs == name
723 && TREE_CODE (gimple_assign_rhs2 (use_stmt)) == INTEGER_CST)
725 tree new_def_rhs;
726 /* As we come here with non-invariant addresses in def_rhs we need
727 to make sure we can build a valid constant offsetted address
728 for further propagation. Simply rely on fold building that
729 and check after the fact. */
730 new_def_rhs = fold_build2 (MEM_REF, TREE_TYPE (TREE_TYPE (rhs)),
731 def_rhs,
732 fold_convert (ptr_type_node,
733 gimple_assign_rhs2 (use_stmt)));
734 if (TREE_CODE (new_def_rhs) == MEM_REF
735 && !is_gimple_mem_ref_addr (TREE_OPERAND (new_def_rhs, 0)))
736 return false;
737 new_def_rhs = build_fold_addr_expr_with_type (new_def_rhs,
738 TREE_TYPE (rhs));
740 /* Recurse. If we could propagate into all uses of lhs do not
741 bother to replace into the current use but just pretend we did. */
742 if (TREE_CODE (new_def_rhs) == ADDR_EXPR
743 && forward_propagate_addr_expr (lhs, new_def_rhs, single_use_p))
744 return true;
746 if (useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (new_def_rhs)))
747 gimple_assign_set_rhs_with_ops (use_stmt_gsi, TREE_CODE (new_def_rhs),
748 new_def_rhs, NULL_TREE);
749 else if (is_gimple_min_invariant (new_def_rhs))
750 gimple_assign_set_rhs_with_ops (use_stmt_gsi, NOP_EXPR,
751 new_def_rhs, NULL_TREE);
752 else
753 return false;
754 gcc_assert (gsi_stmt (*use_stmt_gsi) == use_stmt);
755 update_stmt (use_stmt);
756 return true;
759 /* Now strip away any outer COMPONENT_REF/ARRAY_REF nodes from the LHS.
760 ADDR_EXPR will not appear on the LHS. */
761 tree *lhsp = gimple_assign_lhs_ptr (use_stmt);
762 while (handled_component_p (*lhsp))
763 lhsp = &TREE_OPERAND (*lhsp, 0);
764 lhs = *lhsp;
766 /* Now see if the LHS node is a MEM_REF using NAME. If so,
767 propagate the ADDR_EXPR into the use of NAME and fold the result. */
768 if (TREE_CODE (lhs) == MEM_REF
769 && TREE_OPERAND (lhs, 0) == name)
771 tree def_rhs_base;
772 HOST_WIDE_INT def_rhs_offset;
773 /* If the address is invariant we can always fold it. */
774 if ((def_rhs_base = get_addr_base_and_unit_offset (TREE_OPERAND (def_rhs, 0),
775 &def_rhs_offset)))
777 offset_int off = mem_ref_offset (lhs);
778 tree new_ptr;
779 off += def_rhs_offset;
780 if (TREE_CODE (def_rhs_base) == MEM_REF)
782 off += mem_ref_offset (def_rhs_base);
783 new_ptr = TREE_OPERAND (def_rhs_base, 0);
785 else
786 new_ptr = build_fold_addr_expr (def_rhs_base);
787 TREE_OPERAND (lhs, 0) = new_ptr;
788 TREE_OPERAND (lhs, 1)
789 = wide_int_to_tree (TREE_TYPE (TREE_OPERAND (lhs, 1)), off);
790 tidy_after_forward_propagate_addr (use_stmt);
791 /* Continue propagating into the RHS if this was not the only use. */
792 if (single_use_p)
793 return true;
795 /* If the LHS is a plain dereference and the value type is the same as
796 that of the pointed-to type of the address we can put the
797 dereferenced address on the LHS preserving the original alias-type. */
798 else if (integer_zerop (TREE_OPERAND (lhs, 1))
799 && ((gimple_assign_lhs (use_stmt) == lhs
800 && useless_type_conversion_p
801 (TREE_TYPE (TREE_OPERAND (def_rhs, 0)),
802 TREE_TYPE (gimple_assign_rhs1 (use_stmt))))
803 || types_compatible_p (TREE_TYPE (lhs),
804 TREE_TYPE (TREE_OPERAND (def_rhs, 0))))
805 /* Don't forward anything into clobber stmts if it would result
806 in the lhs no longer being a MEM_REF. */
807 && (!gimple_clobber_p (use_stmt)
808 || TREE_CODE (TREE_OPERAND (def_rhs, 0)) == MEM_REF))
810 tree *def_rhs_basep = &TREE_OPERAND (def_rhs, 0);
811 tree new_offset, new_base, saved, new_lhs;
812 while (handled_component_p (*def_rhs_basep))
813 def_rhs_basep = &TREE_OPERAND (*def_rhs_basep, 0);
814 saved = *def_rhs_basep;
815 if (TREE_CODE (*def_rhs_basep) == MEM_REF)
817 new_base = TREE_OPERAND (*def_rhs_basep, 0);
818 new_offset = fold_convert (TREE_TYPE (TREE_OPERAND (lhs, 1)),
819 TREE_OPERAND (*def_rhs_basep, 1));
821 else
823 new_base = build_fold_addr_expr (*def_rhs_basep);
824 new_offset = TREE_OPERAND (lhs, 1);
826 *def_rhs_basep = build2 (MEM_REF, TREE_TYPE (*def_rhs_basep),
827 new_base, new_offset);
828 TREE_THIS_VOLATILE (*def_rhs_basep) = TREE_THIS_VOLATILE (lhs);
829 TREE_SIDE_EFFECTS (*def_rhs_basep) = TREE_SIDE_EFFECTS (lhs);
830 TREE_THIS_NOTRAP (*def_rhs_basep) = TREE_THIS_NOTRAP (lhs);
831 new_lhs = unshare_expr (TREE_OPERAND (def_rhs, 0));
832 *lhsp = new_lhs;
833 TREE_THIS_VOLATILE (new_lhs) = TREE_THIS_VOLATILE (lhs);
834 TREE_SIDE_EFFECTS (new_lhs) = TREE_SIDE_EFFECTS (lhs);
835 *def_rhs_basep = saved;
836 tidy_after_forward_propagate_addr (use_stmt);
837 /* Continue propagating into the RHS if this was not the
838 only use. */
839 if (single_use_p)
840 return true;
842 else
843 /* We can have a struct assignment dereferencing our name twice.
844 Note that we didn't propagate into the lhs to not falsely
845 claim we did when propagating into the rhs. */
846 res = false;
849 /* Strip away any outer COMPONENT_REF, ARRAY_REF or ADDR_EXPR
850 nodes from the RHS. */
851 tree *rhsp = gimple_assign_rhs1_ptr (use_stmt);
852 if (TREE_CODE (*rhsp) == ADDR_EXPR)
853 rhsp = &TREE_OPERAND (*rhsp, 0);
854 while (handled_component_p (*rhsp))
855 rhsp = &TREE_OPERAND (*rhsp, 0);
856 rhs = *rhsp;
858 /* Now see if the RHS node is a MEM_REF using NAME. If so,
859 propagate the ADDR_EXPR into the use of NAME and fold the result. */
860 if (TREE_CODE (rhs) == MEM_REF
861 && TREE_OPERAND (rhs, 0) == name)
863 tree def_rhs_base;
864 HOST_WIDE_INT def_rhs_offset;
865 if ((def_rhs_base = get_addr_base_and_unit_offset (TREE_OPERAND (def_rhs, 0),
866 &def_rhs_offset)))
868 offset_int off = mem_ref_offset (rhs);
869 tree new_ptr;
870 off += def_rhs_offset;
871 if (TREE_CODE (def_rhs_base) == MEM_REF)
873 off += mem_ref_offset (def_rhs_base);
874 new_ptr = TREE_OPERAND (def_rhs_base, 0);
876 else
877 new_ptr = build_fold_addr_expr (def_rhs_base);
878 TREE_OPERAND (rhs, 0) = new_ptr;
879 TREE_OPERAND (rhs, 1)
880 = wide_int_to_tree (TREE_TYPE (TREE_OPERAND (rhs, 1)), off);
881 fold_stmt_inplace (use_stmt_gsi);
882 tidy_after_forward_propagate_addr (use_stmt);
883 return res;
885 /* If the RHS is a plain dereference and the value type is the same as
886 that of the pointed-to type of the address we can put the
887 dereferenced address on the RHS preserving the original alias-type. */
888 else if (integer_zerop (TREE_OPERAND (rhs, 1))
889 && ((gimple_assign_rhs1 (use_stmt) == rhs
890 && useless_type_conversion_p
891 (TREE_TYPE (gimple_assign_lhs (use_stmt)),
892 TREE_TYPE (TREE_OPERAND (def_rhs, 0))))
893 || types_compatible_p (TREE_TYPE (rhs),
894 TREE_TYPE (TREE_OPERAND (def_rhs, 0)))))
896 tree *def_rhs_basep = &TREE_OPERAND (def_rhs, 0);
897 tree new_offset, new_base, saved, new_rhs;
898 while (handled_component_p (*def_rhs_basep))
899 def_rhs_basep = &TREE_OPERAND (*def_rhs_basep, 0);
900 saved = *def_rhs_basep;
901 if (TREE_CODE (*def_rhs_basep) == MEM_REF)
903 new_base = TREE_OPERAND (*def_rhs_basep, 0);
904 new_offset = fold_convert (TREE_TYPE (TREE_OPERAND (rhs, 1)),
905 TREE_OPERAND (*def_rhs_basep, 1));
907 else
909 new_base = build_fold_addr_expr (*def_rhs_basep);
910 new_offset = TREE_OPERAND (rhs, 1);
912 *def_rhs_basep = build2 (MEM_REF, TREE_TYPE (*def_rhs_basep),
913 new_base, new_offset);
914 TREE_THIS_VOLATILE (*def_rhs_basep) = TREE_THIS_VOLATILE (rhs);
915 TREE_SIDE_EFFECTS (*def_rhs_basep) = TREE_SIDE_EFFECTS (rhs);
916 TREE_THIS_NOTRAP (*def_rhs_basep) = TREE_THIS_NOTRAP (rhs);
917 new_rhs = unshare_expr (TREE_OPERAND (def_rhs, 0));
918 *rhsp = new_rhs;
919 TREE_THIS_VOLATILE (new_rhs) = TREE_THIS_VOLATILE (rhs);
920 TREE_SIDE_EFFECTS (new_rhs) = TREE_SIDE_EFFECTS (rhs);
921 *def_rhs_basep = saved;
922 fold_stmt_inplace (use_stmt_gsi);
923 tidy_after_forward_propagate_addr (use_stmt);
924 return res;
928 /* If the use of the ADDR_EXPR is not a POINTER_PLUS_EXPR, there
929 is nothing to do. */
930 if (gimple_assign_rhs_code (use_stmt) != POINTER_PLUS_EXPR
931 || gimple_assign_rhs1 (use_stmt) != name)
932 return false;
934 /* The remaining cases are all for turning pointer arithmetic into
935 array indexing. They only apply when we have the address of
936 element zero in an array. If that is not the case then there
937 is nothing to do. */
938 array_ref = TREE_OPERAND (def_rhs, 0);
939 if ((TREE_CODE (array_ref) != ARRAY_REF
940 || TREE_CODE (TREE_TYPE (TREE_OPERAND (array_ref, 0))) != ARRAY_TYPE
941 || TREE_CODE (TREE_OPERAND (array_ref, 1)) != INTEGER_CST)
942 && TREE_CODE (TREE_TYPE (array_ref)) != ARRAY_TYPE)
943 return false;
945 rhs2 = gimple_assign_rhs2 (use_stmt);
946 /* Optimize &x[C1] p+ C2 to &x p+ C3 with C3 = C1 * element_size + C2. */
947 if (TREE_CODE (rhs2) == INTEGER_CST)
949 tree new_rhs = build1_loc (gimple_location (use_stmt),
950 ADDR_EXPR, TREE_TYPE (def_rhs),
951 fold_build2 (MEM_REF,
952 TREE_TYPE (TREE_TYPE (def_rhs)),
953 unshare_expr (def_rhs),
954 fold_convert (ptr_type_node,
955 rhs2)));
956 gimple_assign_set_rhs_from_tree (use_stmt_gsi, new_rhs);
957 use_stmt = gsi_stmt (*use_stmt_gsi);
958 update_stmt (use_stmt);
959 tidy_after_forward_propagate_addr (use_stmt);
960 return true;
963 return false;
966 /* STMT is a statement of the form SSA_NAME = ADDR_EXPR <whatever>.
968 Try to forward propagate the ADDR_EXPR into all uses of the SSA_NAME.
969 Often this will allow for removal of an ADDR_EXPR and INDIRECT_REF
970 node or for recovery of array indexing from pointer arithmetic.
972 PARENT_SINGLE_USE_P tells whether, in a recursive invocation, NAME was
973 the single use in the previous invocation. Pass true when calling
974 this at top level.
976 Returns true, if all uses have been propagated into. */
978 static bool
979 forward_propagate_addr_expr (tree name, tree rhs, bool parent_single_use_p)
981 imm_use_iterator iter;
982 gimple use_stmt;
983 bool all = true;
984 bool single_use_p = parent_single_use_p && has_single_use (name);
986 FOR_EACH_IMM_USE_STMT (use_stmt, iter, name)
988 bool result;
989 tree use_rhs;
991 /* If the use is not in a simple assignment statement, then
992 there is nothing we can do. */
993 if (!is_gimple_assign (use_stmt))
995 if (!is_gimple_debug (use_stmt))
996 all = false;
997 continue;
1000 gimple_stmt_iterator gsi = gsi_for_stmt (use_stmt);
1001 result = forward_propagate_addr_expr_1 (name, rhs, &gsi,
1002 single_use_p);
1003 /* If the use has moved to a different statement adjust
1004 the update machinery for the old statement too. */
1005 if (use_stmt != gsi_stmt (gsi))
1007 update_stmt (use_stmt);
1008 use_stmt = gsi_stmt (gsi);
1010 update_stmt (use_stmt);
1011 all &= result;
1013 /* Remove intermediate now unused copy and conversion chains. */
1014 use_rhs = gimple_assign_rhs1 (use_stmt);
1015 if (result
1016 && TREE_CODE (gimple_assign_lhs (use_stmt)) == SSA_NAME
1017 && TREE_CODE (use_rhs) == SSA_NAME
1018 && has_zero_uses (gimple_assign_lhs (use_stmt)))
1020 gimple_stmt_iterator gsi = gsi_for_stmt (use_stmt);
1021 fwprop_invalidate_lattice (gimple_get_lhs (use_stmt));
1022 release_defs (use_stmt);
1023 gsi_remove (&gsi, true);
1027 return all && has_zero_uses (name);
1031 /* Helper function for simplify_gimple_switch. Remove case labels that
1032 have values outside the range of the new type. */
1034 static void
1035 simplify_gimple_switch_label_vec (gswitch *stmt, tree index_type)
1037 unsigned int branch_num = gimple_switch_num_labels (stmt);
1038 auto_vec<tree> labels (branch_num);
1039 unsigned int i, len;
1041 /* Collect the existing case labels in a VEC, and preprocess it as if
1042 we were gimplifying a GENERIC SWITCH_EXPR. */
1043 for (i = 1; i < branch_num; i++)
1044 labels.quick_push (gimple_switch_label (stmt, i));
1045 preprocess_case_label_vec_for_gimple (labels, index_type, NULL);
1047 /* If any labels were removed, replace the existing case labels
1048 in the GIMPLE_SWITCH statement with the correct ones.
1049 Note that the type updates were done in-place on the case labels,
1050 so we only have to replace the case labels in the GIMPLE_SWITCH
1051 if the number of labels changed. */
1052 len = labels.length ();
1053 if (len < branch_num - 1)
1055 bitmap target_blocks;
1056 edge_iterator ei;
1057 edge e;
1059 /* Corner case: *all* case labels have been removed as being
1060 out-of-range for INDEX_TYPE. Push one label and let the
1061 CFG cleanups deal with this further. */
1062 if (len == 0)
1064 tree label, elt;
1066 label = CASE_LABEL (gimple_switch_default_label (stmt));
1067 elt = build_case_label (build_int_cst (index_type, 0), NULL, label);
1068 labels.quick_push (elt);
1069 len = 1;
1072 for (i = 0; i < labels.length (); i++)
1073 gimple_switch_set_label (stmt, i + 1, labels[i]);
1074 for (i++ ; i < branch_num; i++)
1075 gimple_switch_set_label (stmt, i, NULL_TREE);
1076 gimple_switch_set_num_labels (stmt, len + 1);
1078 /* Cleanup any edges that are now dead. */
1079 target_blocks = BITMAP_ALLOC (NULL);
1080 for (i = 0; i < gimple_switch_num_labels (stmt); i++)
1082 tree elt = gimple_switch_label (stmt, i);
1083 basic_block target = label_to_block (CASE_LABEL (elt));
1084 bitmap_set_bit (target_blocks, target->index);
1086 for (ei = ei_start (gimple_bb (stmt)->succs); (e = ei_safe_edge (ei)); )
1088 if (! bitmap_bit_p (target_blocks, e->dest->index))
1090 remove_edge (e);
1091 cfg_changed = true;
1092 free_dominance_info (CDI_DOMINATORS);
1094 else
1095 ei_next (&ei);
1097 BITMAP_FREE (target_blocks);
1101 /* STMT is a SWITCH_EXPR for which we attempt to find equivalent forms of
1102 the condition which we may be able to optimize better. */
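/* For illustration (a hypothetical source fragment): for

     char c = ...;
     switch ((int) c) { case 1: ...; case 2: ...; }

   the cast is removed and the switch operates on c directly, after
   case labels that cannot fit the narrower type have been dropped.  */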
1104 static bool
1105 simplify_gimple_switch (gswitch *stmt)
1107 /* The optimization that we really care about is removing unnecessary
1108 casts. That will let us do much better in propagating the inferred
1109 constant at the switch target. */
1110 tree cond = gimple_switch_index (stmt);
1111 if (TREE_CODE (cond) == SSA_NAME)
1113 gimple def_stmt = SSA_NAME_DEF_STMT (cond);
1114 if (gimple_assign_cast_p (def_stmt))
1116 tree def = gimple_assign_rhs1 (def_stmt);
1117 if (TREE_CODE (def) != SSA_NAME)
1118 return false;
1120 /* If we have an extension or sign-change that preserves the
1121 values we check against then we can copy the source value into
1122 the switch. */
1123 tree ti = TREE_TYPE (def);
1124 if (INTEGRAL_TYPE_P (ti)
1125 && TYPE_PRECISION (ti) <= TYPE_PRECISION (TREE_TYPE (cond)))
1127 size_t n = gimple_switch_num_labels (stmt);
1128 tree min = NULL_TREE, max = NULL_TREE;
1129 if (n > 1)
1131 min = CASE_LOW (gimple_switch_label (stmt, 1));
1132 if (CASE_HIGH (gimple_switch_label (stmt, n - 1)))
1133 max = CASE_HIGH (gimple_switch_label (stmt, n - 1));
1134 else
1135 max = CASE_LOW (gimple_switch_label (stmt, n - 1));
1137 if ((!min || int_fits_type_p (min, ti))
1138 && (!max || int_fits_type_p (max, ti)))
1140 gimple_switch_set_index (stmt, def);
1141 simplify_gimple_switch_label_vec (stmt, ti);
1142 update_stmt (stmt);
1143 return true;
1149 return false;
1152 /* For pointers p2 and p1 return p2 - p1 if the
1153 difference is known and constant, otherwise return NULL. */
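/* For illustration (hypothetical names): with

     char buf[16];
     p1_2 = &buf[4];
     p2_3 = p1_2 + 6;

   constant_pointer_difference (p1_2, p2_3) walks both definition
   chains and returns the sizetype constant 6; it returns NULL_TREE
   when the bases differ or an offset is not constant.  */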
1155 static tree
1156 constant_pointer_difference (tree p1, tree p2)
1158 int i, j;
1159 #define CPD_ITERATIONS 5
1160 tree exps[2][CPD_ITERATIONS];
1161 tree offs[2][CPD_ITERATIONS];
1162 int cnt[2];
1164 for (i = 0; i < 2; i++)
1166 tree p = i ? p1 : p2;
1167 tree off = size_zero_node;
1168 gimple stmt;
1169 enum tree_code code;
1171 /* For each of p1 and p2 we need to iterate at least
1172 twice, to handle ADDR_EXPR directly in p1/p2,
1173 SSA_NAME with ADDR_EXPR or POINTER_PLUS_EXPR etc.
1174 on the defining statement's RHS. Iterate a few extra times. */
1175 j = 0;
1178 if (!POINTER_TYPE_P (TREE_TYPE (p)))
1179 break;
1180 if (TREE_CODE (p) == ADDR_EXPR)
1182 tree q = TREE_OPERAND (p, 0);
1183 HOST_WIDE_INT offset;
1184 tree base = get_addr_base_and_unit_offset (q, &offset);
1185 if (base)
1187 q = base;
1188 if (offset)
1189 off = size_binop (PLUS_EXPR, off, size_int (offset));
1191 if (TREE_CODE (q) == MEM_REF
1192 && TREE_CODE (TREE_OPERAND (q, 0)) == SSA_NAME)
1194 p = TREE_OPERAND (q, 0);
1195 off = size_binop (PLUS_EXPR, off,
1196 wide_int_to_tree (sizetype,
1197 mem_ref_offset (q)));
1199 else
1201 exps[i][j] = q;
1202 offs[i][j++] = off;
1203 break;
1206 if (TREE_CODE (p) != SSA_NAME)
1207 break;
1208 exps[i][j] = p;
1209 offs[i][j++] = off;
1210 if (j == CPD_ITERATIONS)
1211 break;
1212 stmt = SSA_NAME_DEF_STMT (p);
1213 if (!is_gimple_assign (stmt) || gimple_assign_lhs (stmt) != p)
1214 break;
1215 code = gimple_assign_rhs_code (stmt);
1216 if (code == POINTER_PLUS_EXPR)
1218 if (TREE_CODE (gimple_assign_rhs2 (stmt)) != INTEGER_CST)
1219 break;
1220 off = size_binop (PLUS_EXPR, off, gimple_assign_rhs2 (stmt));
1221 p = gimple_assign_rhs1 (stmt);
1223 else if (code == ADDR_EXPR || CONVERT_EXPR_CODE_P (code))
1224 p = gimple_assign_rhs1 (stmt);
1225 else
1226 break;
1228 while (1);
1229 cnt[i] = j;
1232 for (i = 0; i < cnt[0]; i++)
1233 for (j = 0; j < cnt[1]; j++)
1234 if (exps[0][i] == exps[1][j])
1235 return size_binop (MINUS_EXPR, offs[0][i], offs[1][j]);
1237 return NULL_TREE;
1240 /* *GSI_P is a GIMPLE_CALL to a builtin function.
1241 Optimize
1242 memcpy (p, "abcd", 4);
1243 memset (p + 4, ' ', 3);
1244 into
1245 memcpy (p, "abcd   ", 7);
1246 call if the latter can be stored by pieces during expansion. */
1248 static bool
1249 simplify_builtin_call (gimple_stmt_iterator *gsi_p, tree callee2)
1251 gimple stmt1, stmt2 = gsi_stmt (*gsi_p);
1252 tree vuse = gimple_vuse (stmt2);
1253 if (vuse == NULL)
1254 return false;
1255 stmt1 = SSA_NAME_DEF_STMT (vuse);
1257 switch (DECL_FUNCTION_CODE (callee2))
1259 case BUILT_IN_MEMSET:
1260 if (gimple_call_num_args (stmt2) != 3
1261 || gimple_call_lhs (stmt2)
1262 || CHAR_BIT != 8
1263 || BITS_PER_UNIT != 8)
1264 break;
1265 else
1267 tree callee1;
1268 tree ptr1, src1, str1, off1, len1, lhs1;
1269 tree ptr2 = gimple_call_arg (stmt2, 0);
1270 tree val2 = gimple_call_arg (stmt2, 1);
1271 tree len2 = gimple_call_arg (stmt2, 2);
1272 tree diff, vdef, new_str_cst;
1273 gimple use_stmt;
1274 unsigned int ptr1_align;
1275 unsigned HOST_WIDE_INT src_len;
1276 char *src_buf;
1277 use_operand_p use_p;
1279 if (!tree_fits_shwi_p (val2)
1280 || !tree_fits_uhwi_p (len2))
1281 break;
1282 if (is_gimple_call (stmt1))
1284 /* If first stmt is a call, it needs to be memcpy
1285 or mempcpy, with string literal as second argument and
1286 constant length. */
1287 callee1 = gimple_call_fndecl (stmt1);
1288 if (callee1 == NULL_TREE
1289 || DECL_BUILT_IN_CLASS (callee1) != BUILT_IN_NORMAL
1290 || gimple_call_num_args (stmt1) != 3)
1291 break;
1292 if (DECL_FUNCTION_CODE (callee1) != BUILT_IN_MEMCPY
1293 && DECL_FUNCTION_CODE (callee1) != BUILT_IN_MEMPCPY)
1294 break;
1295 ptr1 = gimple_call_arg (stmt1, 0);
1296 src1 = gimple_call_arg (stmt1, 1);
1297 len1 = gimple_call_arg (stmt1, 2);
1298 lhs1 = gimple_call_lhs (stmt1);
1299 if (!tree_fits_uhwi_p (len1))
1300 break;
1301 str1 = string_constant (src1, &off1);
1302 if (str1 == NULL_TREE)
1303 break;
1304 if (!tree_fits_uhwi_p (off1)
1305 || compare_tree_int (off1, TREE_STRING_LENGTH (str1) - 1) > 0
1306 || compare_tree_int (len1, TREE_STRING_LENGTH (str1)
1307 - tree_to_uhwi (off1)) > 0
1308 || TREE_CODE (TREE_TYPE (str1)) != ARRAY_TYPE
1309 || TYPE_MODE (TREE_TYPE (TREE_TYPE (str1)))
1310 != TYPE_MODE (char_type_node))
1311 break;
1313 else if (gimple_assign_single_p (stmt1))
1315 /* Otherwise look for length 1 memcpy optimized into
1316 assignment. */
1317 ptr1 = gimple_assign_lhs (stmt1);
1318 src1 = gimple_assign_rhs1 (stmt1);
1319 if (TREE_CODE (ptr1) != MEM_REF
1320 || TYPE_MODE (TREE_TYPE (ptr1)) != TYPE_MODE (char_type_node)
1321 || !tree_fits_shwi_p (src1))
1322 break;
1323 ptr1 = build_fold_addr_expr (ptr1);
1324 callee1 = NULL_TREE;
1325 len1 = size_one_node;
1326 lhs1 = NULL_TREE;
1327 off1 = size_zero_node;
1328 str1 = NULL_TREE;
1330 else
1331 break;
1333 diff = constant_pointer_difference (ptr1, ptr2);
1334 if (diff == NULL && lhs1 != NULL)
1336 diff = constant_pointer_difference (lhs1, ptr2);
1337 if (DECL_FUNCTION_CODE (callee1) == BUILT_IN_MEMPCPY
1338 && diff != NULL)
1339 diff = size_binop (PLUS_EXPR, diff,
1340 fold_convert (sizetype, len1));
1342 /* If the difference between the second and first destination pointer
1343 is not constant, or is bigger than memcpy length, bail out. */
1344 if (diff == NULL
1345 || !tree_fits_uhwi_p (diff)
1346 || tree_int_cst_lt (len1, diff))
1347 break;
1349 /* Use maximum of difference plus memset length and memcpy length
1350 as the new memcpy length; if it is too big, bail out. */
1351 src_len = tree_to_uhwi (diff);
1352 src_len += tree_to_uhwi (len2);
1353 if (src_len < tree_to_uhwi (len1))
1354 src_len = tree_to_uhwi (len1);
1355 if (src_len > 1024)
1356 break;
1358 /* If the mempcpy value is used elsewhere, bail out, as mempcpy
1359 with a bigger length would return a different result. */
1360 if (lhs1 != NULL_TREE
1361 && DECL_FUNCTION_CODE (callee1) == BUILT_IN_MEMPCPY
1362 && (TREE_CODE (lhs1) != SSA_NAME
1363 || !single_imm_use (lhs1, &use_p, &use_stmt)
1364 || use_stmt != stmt2))
1365 break;
1367 /* If anything reads memory in between the memcpy and memset
1368 calls, the modified memcpy call might change it. */
1369 vdef = gimple_vdef (stmt1);
1370 if (vdef != NULL
1371 && (!single_imm_use (vdef, &use_p, &use_stmt)
1372 || use_stmt != stmt2))
1373 break;
1375 ptr1_align = get_pointer_alignment (ptr1);
1376 /* Construct the new source string literal. */
1377 src_buf = XALLOCAVEC (char, src_len + 1);
1378 if (callee1)
1379 memcpy (src_buf,
1380 TREE_STRING_POINTER (str1) + tree_to_uhwi (off1),
1381 tree_to_uhwi (len1));
1382 else
1383 src_buf[0] = tree_to_shwi (src1);
1384 memset (src_buf + tree_to_uhwi (diff),
1385 tree_to_shwi (val2), tree_to_uhwi (len2));
1386 src_buf[src_len] = '\0';
1387 /* Neither builtin_strncpy_read_str nor builtin_memcpy_read_str
1388 handles embedded '\0's. */
1389 if (strlen (src_buf) != src_len)
1390 break;
1391 rtl_profile_for_bb (gimple_bb (stmt2));
1392 /* If the new memcpy wouldn't be emitted by storing the literal
1393 by pieces, this optimization might enlarge .rodata too much,
1394 as commonly used string literals couldn't be shared any
1395 longer. */
1396 if (!can_store_by_pieces (src_len,
1397 builtin_strncpy_read_str,
1398 src_buf, ptr1_align, false))
1399 break;
1401 new_str_cst = build_string_literal (src_len, src_buf);
1402 if (callee1)
1404 /* If STMT1 is a mem{,p}cpy call, adjust it and remove
1405 memset call. */
1406 if (lhs1 && DECL_FUNCTION_CODE (callee1) == BUILT_IN_MEMPCPY)
1407 gimple_call_set_lhs (stmt1, NULL_TREE);
1408 gimple_call_set_arg (stmt1, 1, new_str_cst);
1409 gimple_call_set_arg (stmt1, 2,
1410 build_int_cst (TREE_TYPE (len1), src_len));
1411 update_stmt (stmt1);
1412 unlink_stmt_vdef (stmt2);
1413 gsi_remove (gsi_p, true);
1414 fwprop_invalidate_lattice (gimple_get_lhs (stmt2));
1415 release_defs (stmt2);
1416 if (lhs1 && DECL_FUNCTION_CODE (callee1) == BUILT_IN_MEMPCPY)
1418 fwprop_invalidate_lattice (lhs1);
1419 release_ssa_name (lhs1);
1421 return true;
1423 else
1425 /* Otherwise, if STMT1 is length 1 memcpy optimized into
1426 assignment, remove STMT1 and change memset call into
1427 memcpy call. */
1428 gimple_stmt_iterator gsi = gsi_for_stmt (stmt1);
1430 if (!is_gimple_val (ptr1))
1431 ptr1 = force_gimple_operand_gsi (gsi_p, ptr1, true, NULL_TREE,
1432 true, GSI_SAME_STMT);
1433 gimple_call_set_fndecl (stmt2,
1434 builtin_decl_explicit (BUILT_IN_MEMCPY));
1435 gimple_call_set_arg (stmt2, 0, ptr1);
1436 gimple_call_set_arg (stmt2, 1, new_str_cst);
1437 gimple_call_set_arg (stmt2, 2,
1438 build_int_cst (TREE_TYPE (len2), src_len));
1439 unlink_stmt_vdef (stmt1);
1440 gsi_remove (&gsi, true);
1441 fwprop_invalidate_lattice (gimple_get_lhs (stmt1));
1442 release_defs (stmt1);
1443 update_stmt (stmt2);
1444 return false;
1447 break;
1448 default:
1449 break;
1451 return false;
1454 /* Given an SSA name in NAME, see if it was defined by an assignment; if
1455 so, set CODE to the rhs code, ARG1 to the first operand on the rhs and
1456 ARG2 to the second operand on the rhs. */
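/* For illustration (hypothetical SSA names): if NAME is t_1 defined by
   t_1 = a_2 << b_3, this sets *CODE to LSHIFT_EXPR, *ARG1 to a_2 and
   *ARG2 to b_3.  For a name we cannot propagate from, *CODE is simply
   SSA_NAME and *ARG1 is NAME itself.  */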
1458 static inline void
1459 defcodefor_name (tree name, enum tree_code *code, tree *arg1, tree *arg2)
1461 gimple def;
1462 enum tree_code code1;
1463 tree arg11;
1464 tree arg21;
1465 tree arg31;
1466 enum gimple_rhs_class grhs_class;
1468 code1 = TREE_CODE (name);
1469 arg11 = name;
1470 arg21 = NULL_TREE;
1471 grhs_class = get_gimple_rhs_class (code1);
1473 if (code1 == SSA_NAME)
1475 def = SSA_NAME_DEF_STMT (name);
1477 if (def && is_gimple_assign (def)
1478 && can_propagate_from (def))
1480 code1 = gimple_assign_rhs_code (def);
1481 arg11 = gimple_assign_rhs1 (def);
1482 arg21 = gimple_assign_rhs2 (def);
1483 arg31 = gimple_assign_rhs3 (def);
1486 else if (grhs_class == GIMPLE_TERNARY_RHS
1487 || grhs_class == GIMPLE_BINARY_RHS
1488 || grhs_class == GIMPLE_UNARY_RHS
1489 || grhs_class == GIMPLE_SINGLE_RHS)
1490 extract_ops_from_tree_1 (name, &code1, &arg11, &arg21, &arg31);
1492 *code = code1;
1493 *arg1 = arg11;
1494 if (arg2)
1495 *arg2 = arg21;
1496 /* Ignore arg3 currently. */
1500 /* Recognize rotation patterns. Return true if a transformation
1501 was applied, otherwise return false.
1503 We are looking for X with unsigned type T with bitsize B, OP being
1504 +, | or ^, some type T2 wider than T and
1505 (X << CNT1) OP (X >> CNT2) iff CNT1 + CNT2 == B
1506 ((T) ((T2) X << CNT1)) OP ((T) ((T2) X >> CNT2)) iff CNT1 + CNT2 == B
1507 (X << Y) OP (X >> (B - Y))
1508 (X << (int) Y) OP (X >> (int) (B - Y))
1509 ((T) ((T2) X << Y)) OP ((T) ((T2) X >> (B - Y)))
1510 ((T) ((T2) X << (int) Y)) OP ((T) ((T2) X >> (int) (B - Y)))
1511 (X << Y) | (X >> ((-Y) & (B - 1)))
1512 (X << (int) Y) | (X >> (int) ((-Y) & (B - 1)))
1513 ((T) ((T2) X << Y)) | ((T) ((T2) X >> ((-Y) & (B - 1))))
1514 ((T) ((T2) X << (int) Y)) | ((T) ((T2) X >> (int) ((-Y) & (B - 1))))
1516 and transform these into:
1517 X r<< CNT1
1518 X r<< Y
1520 Note, in the patterns with T2 type, the type of OP operands
1521 might even be a signed type, but should have precision B. */
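/* For illustration, one source-level pattern this recognizes, written
   as standalone C (a sketch assuming a 32-bit unsigned int):

     unsigned int
     rotl (unsigned int x, unsigned int y)
     {
       return (x << y) | (x >> ((-y) & 31));
     }

   The function body becomes x r<< y, which can expand to a single
   rotate instruction.  The (-y) & 31 form is the variant that stays
   well defined even for y == 0.  */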
1523 static bool
1524 simplify_rotate (gimple_stmt_iterator *gsi)
1526 gimple stmt = gsi_stmt (*gsi);
1527 tree arg[2], rtype, rotcnt = NULL_TREE;
1528 tree def_arg1[2], def_arg2[2];
1529 enum tree_code def_code[2];
1530 tree lhs;
1531 int i;
1532 bool swapped_p = false;
1533 gimple g;
1535 arg[0] = gimple_assign_rhs1 (stmt);
1536 arg[1] = gimple_assign_rhs2 (stmt);
1537 rtype = TREE_TYPE (arg[0]);
1539 /* Only create rotates in complete modes. Other cases are not
1540 expanded properly. */
1541 if (!INTEGRAL_TYPE_P (rtype)
1542 || TYPE_PRECISION (rtype) != GET_MODE_PRECISION (TYPE_MODE (rtype)))
1543 return false;
1545 for (i = 0; i < 2; i++)
1546 defcodefor_name (arg[i], &def_code[i], &def_arg1[i], &def_arg2[i]);
1548 /* Look through narrowing conversions. */
1549 if (CONVERT_EXPR_CODE_P (def_code[0])
1550 && CONVERT_EXPR_CODE_P (def_code[1])
1551 && INTEGRAL_TYPE_P (TREE_TYPE (def_arg1[0]))
1552 && INTEGRAL_TYPE_P (TREE_TYPE (def_arg1[1]))
1553 && TYPE_PRECISION (TREE_TYPE (def_arg1[0]))
1554 == TYPE_PRECISION (TREE_TYPE (def_arg1[1]))
1555 && TYPE_PRECISION (TREE_TYPE (def_arg1[0])) > TYPE_PRECISION (rtype)
1556 && has_single_use (arg[0])
1557 && has_single_use (arg[1]))
1559 for (i = 0; i < 2; i++)
1561 arg[i] = def_arg1[i];
1562 defcodefor_name (arg[i], &def_code[i], &def_arg1[i], &def_arg2[i]);
1566 /* One operand has to be LSHIFT_EXPR and one RSHIFT_EXPR. */
1567 for (i = 0; i < 2; i++)
1568 if (def_code[i] != LSHIFT_EXPR && def_code[i] != RSHIFT_EXPR)
1569 return false;
1570 else if (!has_single_use (arg[i]))
1571 return false;
1572 if (def_code[0] == def_code[1])
1573 return false;
1575 /* If we've looked through narrowing conversions before, look through
1576 widening conversions from unsigned type with the same precision
1577 as rtype here. */
1578 if (TYPE_PRECISION (TREE_TYPE (def_arg1[0])) != TYPE_PRECISION (rtype))
1579 for (i = 0; i < 2; i++)
1581 tree tem;
1582 enum tree_code code;
1583 defcodefor_name (def_arg1[i], &code, &tem, NULL);
1584 if (!CONVERT_EXPR_CODE_P (code)
1585 || !INTEGRAL_TYPE_P (TREE_TYPE (tem))
1586 || TYPE_PRECISION (TREE_TYPE (tem)) != TYPE_PRECISION (rtype))
1587 return false;
1588 def_arg1[i] = tem;
1590 /* Both shifts have to use the same first operand. */
1591 if (TREE_CODE (def_arg1[0]) != SSA_NAME || def_arg1[0] != def_arg1[1])
1592 return false;
1593 if (!TYPE_UNSIGNED (TREE_TYPE (def_arg1[0])))
1594 return false;
1596 /* CNT1 + CNT2 == B case above. */
1597 if (tree_fits_uhwi_p (def_arg2[0])
1598 && tree_fits_uhwi_p (def_arg2[1])
1599 && tree_to_uhwi (def_arg2[0])
1600 + tree_to_uhwi (def_arg2[1]) == TYPE_PRECISION (rtype))
1601 rotcnt = def_arg2[0];
1602 else if (TREE_CODE (def_arg2[0]) != SSA_NAME
1603 || TREE_CODE (def_arg2[1]) != SSA_NAME)
1604 return false;
1605 else
1607 tree cdef_arg1[2], cdef_arg2[2], def_arg2_alt[2];
1608 enum tree_code cdef_code[2];
1609 /* Look through conversions of the shift count argument.
1610 The C/C++ FE casts any shift count argument to integer_type_node.
1611 The only problem might be if the shift count type's maximum value
1612 is equal to or smaller than the number of bits in rtype. */
1613 for (i = 0; i < 2; i++)
1615 def_arg2_alt[i] = def_arg2[i];
1616 defcodefor_name (def_arg2[i], &cdef_code[i],
1617 &cdef_arg1[i], &cdef_arg2[i]);
1618 if (CONVERT_EXPR_CODE_P (cdef_code[i])
1619 && INTEGRAL_TYPE_P (TREE_TYPE (cdef_arg1[i]))
1620 && TYPE_PRECISION (TREE_TYPE (cdef_arg1[i]))
1621 > floor_log2 (TYPE_PRECISION (rtype))
1622 && TYPE_PRECISION (TREE_TYPE (cdef_arg1[i]))
1623 == GET_MODE_PRECISION (TYPE_MODE (TREE_TYPE (cdef_arg1[i]))))
1625 def_arg2_alt[i] = cdef_arg1[i];
1626 defcodefor_name (def_arg2_alt[i], &cdef_code[i],
1627 &cdef_arg1[i], &cdef_arg2[i]);
1630 for (i = 0; i < 2; i++)
1631 /* Check for one shift count being Y and the other B - Y,
1632 with optional casts. */
1633 if (cdef_code[i] == MINUS_EXPR
1634 && tree_fits_shwi_p (cdef_arg1[i])
1635 && tree_to_shwi (cdef_arg1[i]) == TYPE_PRECISION (rtype)
1636 && TREE_CODE (cdef_arg2[i]) == SSA_NAME)
1638 tree tem;
1639 enum tree_code code;
1641 if (cdef_arg2[i] == def_arg2[1 - i]
1642 || cdef_arg2[i] == def_arg2_alt[1 - i])
1644 rotcnt = cdef_arg2[i];
1645 break;
1647 defcodefor_name (cdef_arg2[i], &code, &tem, NULL);
1648 if (CONVERT_EXPR_CODE_P (code)
1649 && INTEGRAL_TYPE_P (TREE_TYPE (tem))
1650 && TYPE_PRECISION (TREE_TYPE (tem))
1651 > floor_log2 (TYPE_PRECISION (rtype))
1652 && TYPE_PRECISION (TREE_TYPE (tem))
1653 == GET_MODE_PRECISION (TYPE_MODE (TREE_TYPE (tem)))
1654 && (tem == def_arg2[1 - i]
1655 || tem == def_arg2_alt[1 - i]))
1657 rotcnt = tem;
1658 break;
1661 /* The above sequence isn't safe for Y being 0,
1662 because then one of the shifts triggers undefined behavior.
1663 This alternative is safe even for rotation count of 0.
1664 One shift count is Y and the other (-Y) & (B - 1). */
1665 else if (cdef_code[i] == BIT_AND_EXPR
1666 && tree_fits_shwi_p (cdef_arg2[i])
1667 && tree_to_shwi (cdef_arg2[i])
1668 == TYPE_PRECISION (rtype) - 1
1669 && TREE_CODE (cdef_arg1[i]) == SSA_NAME
1670 && gimple_assign_rhs_code (stmt) == BIT_IOR_EXPR)
1672 tree tem;
1673 enum tree_code code;
1675 defcodefor_name (cdef_arg1[i], &code, &tem, NULL);
1676 if (CONVERT_EXPR_CODE_P (code)
1677 && INTEGRAL_TYPE_P (TREE_TYPE (tem))
1678 && TYPE_PRECISION (TREE_TYPE (tem))
1679 > floor_log2 (TYPE_PRECISION (rtype))
1680 && TYPE_PRECISION (TREE_TYPE (tem))
1681 == GET_MODE_PRECISION (TYPE_MODE (TREE_TYPE (tem))))
1682 defcodefor_name (tem, &code, &tem, NULL);
1684 if (code == NEGATE_EXPR)
1686 if (tem == def_arg2[1 - i] || tem == def_arg2_alt[1 - i])
1688 rotcnt = tem;
1689 break;
1691 defcodefor_name (tem, &code, &tem, NULL);
1692 if (CONVERT_EXPR_CODE_P (code)
1693 && INTEGRAL_TYPE_P (TREE_TYPE (tem))
1694 && TYPE_PRECISION (TREE_TYPE (tem))
1695 > floor_log2 (TYPE_PRECISION (rtype))
1696 && TYPE_PRECISION (TREE_TYPE (tem))
1697 == GET_MODE_PRECISION (TYPE_MODE (TREE_TYPE (tem)))
1698 && (tem == def_arg2[1 - i]
1699 || tem == def_arg2_alt[1 - i]))
1701 rotcnt = tem;
1702 break;
1706 if (rotcnt == NULL_TREE)
1707 return false;
1708 swapped_p = i != 1;
1711 if (!useless_type_conversion_p (TREE_TYPE (def_arg2[0]),
1712 TREE_TYPE (rotcnt)))
1714 g = gimple_build_assign_with_ops (NOP_EXPR,
1715 make_ssa_name (TREE_TYPE (def_arg2[0]),
1716 NULL),
1717 rotcnt, NULL_TREE);
1718 gsi_insert_before (gsi, g, GSI_SAME_STMT);
1719 rotcnt = gimple_assign_lhs (g);
1721 lhs = gimple_assign_lhs (stmt);
1722 if (!useless_type_conversion_p (rtype, TREE_TYPE (def_arg1[0])))
1723 lhs = make_ssa_name (TREE_TYPE (def_arg1[0]), NULL);
1724 g = gimple_build_assign_with_ops (((def_code[0] == LSHIFT_EXPR) ^ swapped_p)
1725 ? LROTATE_EXPR : RROTATE_EXPR,
1726 lhs, def_arg1[0], rotcnt);
1727 if (!useless_type_conversion_p (rtype, TREE_TYPE (def_arg1[0])))
1729 gsi_insert_before (gsi, g, GSI_SAME_STMT);
1730 g = gimple_build_assign_with_ops (NOP_EXPR, gimple_assign_lhs (stmt),
1731 lhs, NULL_TREE);
1733 gsi_replace (gsi, g, false);
1734 return true;
1737 /* Combine an element access with a shuffle. Returns true if any
1738 changes were made, else it returns false. */
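/* For illustration (hypothetical names): for a BIT_FIELD_REF selecting
   element 0 of

     v_1 = VEC_PERM_EXPR <a_2, b_3, {2, 3, 6, 7}>;

   mask element 2 points into the first input, so the access is
   rewritten to select element 2 of a_2 directly, bypassing the
   shuffle.  */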
1740 static bool
1741 simplify_bitfield_ref (gimple_stmt_iterator *gsi)
1743 gimple stmt = gsi_stmt (*gsi);
1744 gimple def_stmt;
1745 tree op, op0, op1, op2;
1746 tree elem_type;
1747 unsigned idx, n, size;
1748 enum tree_code code;
1750 op = gimple_assign_rhs1 (stmt);
1751 gcc_checking_assert (TREE_CODE (op) == BIT_FIELD_REF);
1753 op0 = TREE_OPERAND (op, 0);
1754 if (TREE_CODE (op0) != SSA_NAME
1755 || TREE_CODE (TREE_TYPE (op0)) != VECTOR_TYPE)
1756 return false;
1758 def_stmt = get_prop_source_stmt (op0, false, NULL);
1759 if (!def_stmt || !can_propagate_from (def_stmt))
1760 return false;
1762 op1 = TREE_OPERAND (op, 1);
1763 op2 = TREE_OPERAND (op, 2);
1764 code = gimple_assign_rhs_code (def_stmt);
1766 if (code == CONSTRUCTOR)
1768 tree tem = fold_ternary (BIT_FIELD_REF, TREE_TYPE (op),
1769 gimple_assign_rhs1 (def_stmt), op1, op2);
1770 if (!tem || !valid_gimple_rhs_p (tem))
1771 return false;
1772 gimple_assign_set_rhs_from_tree (gsi, tem);
1773 update_stmt (gsi_stmt (*gsi));
1774 return true;
1777 elem_type = TREE_TYPE (TREE_TYPE (op0));
1778 if (TREE_TYPE (op) != elem_type)
1779 return false;
1781 size = TREE_INT_CST_LOW (TYPE_SIZE (elem_type));
1782 n = TREE_INT_CST_LOW (op1) / size;
1783 if (n != 1)
1784 return false;
1785 idx = TREE_INT_CST_LOW (op2) / size;
1787 if (code == VEC_PERM_EXPR)
1789 tree p, m, index, tem;
1790 unsigned nelts;
1791 m = gimple_assign_rhs3 (def_stmt);
1792 if (TREE_CODE (m) != VECTOR_CST)
1793 return false;
1794 nelts = VECTOR_CST_NELTS (m);
1795 idx = TREE_INT_CST_LOW (VECTOR_CST_ELT (m, idx));
1796 idx %= 2 * nelts;
1797 if (idx < nelts)
1799 p = gimple_assign_rhs1 (def_stmt);
1801 else
1803 p = gimple_assign_rhs2 (def_stmt);
1804 idx -= nelts;
1806 index = build_int_cst (TREE_TYPE (TREE_TYPE (m)), idx * size);
1807 tem = build3 (BIT_FIELD_REF, TREE_TYPE (op),
1808 unshare_expr (p), op1, index);
1809 gimple_assign_set_rhs1 (stmt, tem);
1810 fold_stmt (gsi);
1811 update_stmt (gsi_stmt (*gsi));
1812 return true;
1815 return false;
1818 /* Determine whether applying the two permutations (mask1 then mask2)
1819 gives back one of the inputs. */
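/* For illustration: with four-element masks, mask1 = {1, 0, 3, 2}
   followed by mask2 = {1, 0, 3, 2} composes to {0, 1, 2, 3}, the
   identity on the first input, so this returns 1.  */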
static int
is_combined_permutation_identity (tree mask1, tree mask2)
{
  tree mask;
  unsigned int nelts, i, j;
  bool maybe_identity1 = true;
  bool maybe_identity2 = true;

  gcc_checking_assert (TREE_CODE (mask1) == VECTOR_CST
                       && TREE_CODE (mask2) == VECTOR_CST);
  mask = fold_ternary (VEC_PERM_EXPR, TREE_TYPE (mask1), mask1, mask1, mask2);
  gcc_assert (TREE_CODE (mask) == VECTOR_CST);

  nelts = VECTOR_CST_NELTS (mask);
  for (i = 0; i < nelts; i++)
    {
      tree val = VECTOR_CST_ELT (mask, i);
      gcc_assert (TREE_CODE (val) == INTEGER_CST);
      j = TREE_INT_CST_LOW (val) & (2 * nelts - 1);
      if (j == i)
        maybe_identity2 = false;
      else if (j == i + nelts)
        maybe_identity1 = false;
      else
        return 0;
    }
  return maybe_identity1 ? 1 : maybe_identity2 ? 2 : 0;
}
/* Combine a shuffle with its arguments.  Returns 1 if any changes were
   made, 2 if cfg-cleanup needs to run, and 0 otherwise.  */
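/* A sketch of the two-consecutive-shuffles case below, on four-element
   vectors, where the second mask undoes the first:

     v2_2 = VEC_PERM_EXPR <v1_1, v1_1, { 2, 3, 0, 1 }>;
     v3_3 = VEC_PERM_EXPR <v2_2, v2_2, { 2, 3, 0, 1 }>;

   The combined mask is the identity on the first input, so v3_3 is
   turned into a plain copy of v1_1, and the then-unused middle shuffle
   can be removed, in which case 2 is returned.  */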
static int
simplify_permutation (gimple_stmt_iterator *gsi)
{
  gimple stmt = gsi_stmt (*gsi);
  gimple def_stmt;
  tree op0, op1, op2, op3, arg0, arg1;
  enum tree_code code;
  bool single_use_op0 = false;

  gcc_checking_assert (gimple_assign_rhs_code (stmt) == VEC_PERM_EXPR);

  op0 = gimple_assign_rhs1 (stmt);
  op1 = gimple_assign_rhs2 (stmt);
  op2 = gimple_assign_rhs3 (stmt);

  if (TREE_CODE (op2) != VECTOR_CST)
    return 0;

  if (TREE_CODE (op0) == VECTOR_CST)
    {
      code = VECTOR_CST;
      arg0 = op0;
    }
  else if (TREE_CODE (op0) == SSA_NAME)
    {
      def_stmt = get_prop_source_stmt (op0, false, &single_use_op0);
      if (!def_stmt || !can_propagate_from (def_stmt))
        return 0;

      code = gimple_assign_rhs_code (def_stmt);
      arg0 = gimple_assign_rhs1 (def_stmt);
    }
  else
    return 0;

  /* Two consecutive shuffles.  */
  if (code == VEC_PERM_EXPR)
    {
      tree orig;
      int ident;

      if (op0 != op1)
        return 0;
      op3 = gimple_assign_rhs3 (def_stmt);
      if (TREE_CODE (op3) != VECTOR_CST)
        return 0;
      ident = is_combined_permutation_identity (op3, op2);
      if (!ident)
        return 0;
      orig = (ident == 1) ? gimple_assign_rhs1 (def_stmt)
                          : gimple_assign_rhs2 (def_stmt);
      gimple_assign_set_rhs1 (stmt, unshare_expr (orig));
      gimple_assign_set_rhs_code (stmt, TREE_CODE (orig));
      gimple_set_num_ops (stmt, 2);
      update_stmt (stmt);
      return remove_prop_source_from_use (op0) ? 2 : 1;
    }

  /* Shuffle of a constructor.  */
  else if (code == CONSTRUCTOR || code == VECTOR_CST)
    {
      tree opt;
      bool ret = false;
      if (op0 != op1)
        {
          if (TREE_CODE (op0) == SSA_NAME && !single_use_op0)
            return 0;

          if (TREE_CODE (op1) == VECTOR_CST)
            arg1 = op1;
          else if (TREE_CODE (op1) == SSA_NAME)
            {
              enum tree_code code2;

              gimple def_stmt2 = get_prop_source_stmt (op1, true, NULL);
              if (!def_stmt2 || !can_propagate_from (def_stmt2))
                return 0;

              code2 = gimple_assign_rhs_code (def_stmt2);
              if (code2 != CONSTRUCTOR && code2 != VECTOR_CST)
                return 0;
              arg1 = gimple_assign_rhs1 (def_stmt2);
            }
          else
            return 0;
        }
      else
        {
          /* Already used twice in this statement.  */
          if (TREE_CODE (op0) == SSA_NAME && num_imm_uses (op0) > 2)
            return 0;
          arg1 = arg0;
        }
      opt = fold_ternary (VEC_PERM_EXPR, TREE_TYPE (op0), arg0, arg1, op2);
      if (!opt
          || (TREE_CODE (opt) != CONSTRUCTOR && TREE_CODE (opt) != VECTOR_CST))
        return 0;
      gimple_assign_set_rhs_from_tree (gsi, opt);
      update_stmt (gsi_stmt (*gsi));
      if (TREE_CODE (op0) == SSA_NAME)
        ret = remove_prop_source_from_use (op0);
      if (op0 != op1 && TREE_CODE (op1) == SSA_NAME)
        ret |= remove_prop_source_from_use (op1);
      return ret ? 2 : 1;
    }

  return 0;
}
/* Recognize a CONSTRUCTOR of BIT_FIELD_REFs from a single vector that
   can be expressed as a VEC_PERM_EXPR.  Returns true if any changes
   were made.  */
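/* For example (a sketch on a four-element vector v_5 with 32-bit
   elements; SSA names are illustrative):

     _1 = BIT_FIELD_REF <v_5, 32, 96>;
     _2 = BIT_FIELD_REF <v_5, 32, 64>;
     _3 = BIT_FIELD_REF <v_5, 32, 32>;
     _4 = BIT_FIELD_REF <v_5, 32, 0>;
     x_6 = {_1, _2, _3, _4};

   gathers the elements of v_5 in reverse order, so the constructor can
   be rewritten as

     x_6 = VEC_PERM_EXPR <v_5, v_5, { 3, 2, 1, 0 }>;

   provided the target can permute that way (can_vec_perm_p).  If all
   indices were in order, a plain copy of v_5 would be used instead.  */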
static bool
simplify_vector_constructor (gimple_stmt_iterator *gsi)
{
  gimple stmt = gsi_stmt (*gsi);
  gimple def_stmt;
  tree op, op2, orig, type, elem_type;
  unsigned elem_size, nelts, i;
  enum tree_code code;
  constructor_elt *elt;
  unsigned char *sel;
  bool maybe_ident;

  gcc_checking_assert (gimple_assign_rhs_code (stmt) == CONSTRUCTOR);

  op = gimple_assign_rhs1 (stmt);
  type = TREE_TYPE (op);
  gcc_checking_assert (TREE_CODE (type) == VECTOR_TYPE);

  nelts = TYPE_VECTOR_SUBPARTS (type);
  elem_type = TREE_TYPE (type);
  elem_size = TREE_INT_CST_LOW (TYPE_SIZE (elem_type));

  sel = XALLOCAVEC (unsigned char, nelts);
  orig = NULL;
  maybe_ident = true;
  FOR_EACH_VEC_SAFE_ELT (CONSTRUCTOR_ELTS (op), i, elt)
    {
      tree ref, op1;

      if (i >= nelts)
        return false;

      if (TREE_CODE (elt->value) != SSA_NAME)
        return false;
      def_stmt = get_prop_source_stmt (elt->value, false, NULL);
      if (!def_stmt)
        return false;
      code = gimple_assign_rhs_code (def_stmt);
      if (code != BIT_FIELD_REF)
        return false;
      op1 = gimple_assign_rhs1 (def_stmt);
      ref = TREE_OPERAND (op1, 0);
      if (orig)
        {
          if (ref != orig)
            return false;
        }
      else
        {
          if (TREE_CODE (ref) != SSA_NAME)
            return false;
          if (!useless_type_conversion_p (type, TREE_TYPE (ref)))
            return false;
          orig = ref;
        }
      if (TREE_INT_CST_LOW (TREE_OPERAND (op1, 1)) != elem_size)
        return false;
      sel[i] = TREE_INT_CST_LOW (TREE_OPERAND (op1, 2)) / elem_size;
      if (sel[i] != i)
        maybe_ident = false;
    }
  if (i < nelts)
    return false;

  if (maybe_ident)
    gimple_assign_set_rhs_from_tree (gsi, orig);
  else
    {
      tree mask_type, *mask_elts;

      if (!can_vec_perm_p (TYPE_MODE (type), false, sel))
        return false;
      mask_type
        = build_vector_type (build_nonstandard_integer_type (elem_size, 1),
                             nelts);
      if (GET_MODE_CLASS (TYPE_MODE (mask_type)) != MODE_VECTOR_INT
          || GET_MODE_SIZE (TYPE_MODE (mask_type))
             != GET_MODE_SIZE (TYPE_MODE (type)))
        return false;
      mask_elts = XALLOCAVEC (tree, nelts);
      for (i = 0; i < nelts; i++)
        mask_elts[i] = build_int_cst (TREE_TYPE (mask_type), sel[i]);
      op2 = build_vector (mask_type, mask_elts);
      gimple_assign_set_rhs_with_ops_1 (gsi, VEC_PERM_EXPR, orig, orig, op2);
    }
  update_stmt (gsi_stmt (*gsi));
  return true;
}
/* Primitive "lattice" function for gimple_simplify.  */
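/* For instance, if the lattice recorded that a_2 is a copy of b_1
   (see the "Fill up the lattice" code in the pass below), valueizing
   a_2 here lets gimple_simplify match patterns directly against b_1.  */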
static tree
fwprop_ssa_val (tree name)
{
  /* First valueize NAME.  */
  if (TREE_CODE (name) == SSA_NAME
      && SSA_NAME_VERSION (name) < lattice.length ())
    {
      tree val = lattice[SSA_NAME_VERSION (name)];
      if (val)
        name = val;
    }
  /* We continue matching along SSA use-def edges for SSA names
     that are not single-use.  Currently there are no patterns
     that would cause any issues with that.  */
  return name;
}
/* Main entry point for the forward propagation and statement combine
   optimizer.  */

namespace {

const pass_data pass_data_forwprop =
{
  GIMPLE_PASS, /* type */
  "forwprop", /* name */
  OPTGROUP_NONE, /* optinfo_flags */
  TV_TREE_FORWPROP, /* tv_id */
  ( PROP_cfg | PROP_ssa ), /* properties_required */
  0, /* properties_provided */
  0, /* properties_destroyed */
  0, /* todo_flags_start */
  TODO_update_ssa, /* todo_flags_finish */
};

class pass_forwprop : public gimple_opt_pass
{
public:
  pass_forwprop (gcc::context *ctxt)
    : gimple_opt_pass (pass_data_forwprop, ctxt)
  {}

  /* opt_pass methods: */
  opt_pass * clone () { return new pass_forwprop (m_ctxt); }
  virtual bool gate (function *) { return flag_tree_forwprop; }
  virtual unsigned int execute (function *);

}; // class pass_forwprop
unsigned int
pass_forwprop::execute (function *fun)
{
  unsigned int todoflags = 0;

  cfg_changed = false;

  /* Combine stmts with the stmts defining their operands.  Do that
     in an order that guarantees visiting SSA defs before SSA uses.  */
  lattice.create (num_ssa_names);
  lattice.quick_grow_cleared (num_ssa_names);
  int *postorder = XNEWVEC (int, n_basic_blocks_for_fn (fun));
  int postorder_num = inverted_post_order_compute (postorder);
  to_purge = BITMAP_ALLOC (NULL);
  for (int i = 0; i < postorder_num; ++i)
    {
      gimple_stmt_iterator gsi;
      basic_block bb = BASIC_BLOCK_FOR_FN (fun, postorder[i]);

      /* Apply forward propagation to all stmts in the basic-block.
         Note we update GSI within the loop as necessary.  */
      for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); )
        {
          gimple stmt = gsi_stmt (gsi);
          tree lhs, rhs;
          enum tree_code code;

          if (!is_gimple_assign (stmt))
            {
              gsi_next (&gsi);
              continue;
            }

          lhs = gimple_assign_lhs (stmt);
          rhs = gimple_assign_rhs1 (stmt);
          code = gimple_assign_rhs_code (stmt);
          if (TREE_CODE (lhs) != SSA_NAME
              || has_zero_uses (lhs))
            {
              gsi_next (&gsi);
              continue;
            }

          /* If this statement sets an SSA_NAME to an address,
             try to propagate the address into the uses of the SSA_NAME.  */
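          /* A sketch (with hypothetical SSA names): given

               ptr_1 = &a[0];
               MEM[ptr_1 + 4] = 0;

             the address can be forwarded into the dereference, e.g.
             yielding a[1] = 0 for four-byte elements, after which the
             now dead definition of ptr_1 is removed below.  */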
          if (code == ADDR_EXPR
              /* Handle pointer conversions on invariant addresses
                 as well, as this is valid gimple.  */
              || (CONVERT_EXPR_CODE_P (code)
                  && TREE_CODE (rhs) == ADDR_EXPR
                  && POINTER_TYPE_P (TREE_TYPE (lhs))))
            {
              tree base = get_base_address (TREE_OPERAND (rhs, 0));
              if ((!base
                   || !DECL_P (base)
                   || decl_address_invariant_p (base))
                  && !stmt_references_abnormal_ssa_name (stmt)
                  && forward_propagate_addr_expr (lhs, rhs, true))
                {
                  fwprop_invalidate_lattice (gimple_get_lhs (stmt));
                  release_defs (stmt);
                  gsi_remove (&gsi, true);
                }
              else
                gsi_next (&gsi);
            }
          else if (code == POINTER_PLUS_EXPR)
            {
              tree off = gimple_assign_rhs2 (stmt);
              if (TREE_CODE (off) == INTEGER_CST
                  && can_propagate_from (stmt)
                  && !simple_iv_increment_p (stmt)
                  /* ??? Better adjust the interface to that function
                     instead of building new trees here.  */
                  && forward_propagate_addr_expr
                       (lhs,
                        build1_loc (gimple_location (stmt),
                                    ADDR_EXPR, TREE_TYPE (rhs),
                                    fold_build2 (MEM_REF,
                                                 TREE_TYPE (TREE_TYPE (rhs)),
                                                 rhs,
                                                 fold_convert (ptr_type_node,
                                                               off))), true))
                {
                  fwprop_invalidate_lattice (gimple_get_lhs (stmt));
                  release_defs (stmt);
                  gsi_remove (&gsi, true);
                }
              else if (is_gimple_min_invariant (rhs))
                {
                  /* Make sure to fold &a[0] + off_1 here.  */
                  fold_stmt_inplace (&gsi);
                  update_stmt (stmt);
                  if (gimple_assign_rhs_code (stmt) == POINTER_PLUS_EXPR)
                    gsi_next (&gsi);
                }
              else
                gsi_next (&gsi);
            }
          else
            gsi_next (&gsi);
        }
      /* Combine stmts with the stmts defining their operands.
         Note we update GSI within the loop as necessary.  */
      for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi);)
        {
          gimple stmt = gsi_stmt (gsi);
          gimple orig_stmt = stmt;
          bool changed = false;

          /* Mark stmt as potentially needing revisiting.  */
          gimple_set_plf (stmt, GF_PLF_1, false);

          if (fold_stmt (&gsi, fwprop_ssa_val))
            {
              changed = true;
              stmt = gsi_stmt (gsi);
              if (maybe_clean_or_replace_eh_stmt (orig_stmt, stmt))
                bitmap_set_bit (to_purge, bb->index);
              /* Cleanup the CFG if we simplified a condition to
                 true or false.  */
              if (gcond *cond = dyn_cast <gcond *> (stmt))
                if (gimple_cond_true_p (cond)
                    || gimple_cond_false_p (cond))
                  cfg_changed = true;
              update_stmt (stmt);
            }

          switch (gimple_code (stmt))
            {
            case GIMPLE_ASSIGN:
              {
                tree rhs1 = gimple_assign_rhs1 (stmt);
                enum tree_code code = gimple_assign_rhs_code (stmt);

                if (code == COND_EXPR
                    || code == VEC_COND_EXPR)
                  {
                    /* In this case the entire COND_EXPR is in rhs1.  */
                    if (forward_propagate_into_cond (&gsi))
                      {
                        changed = true;
                        stmt = gsi_stmt (gsi);
                      }
                  }
                else if (TREE_CODE_CLASS (code) == tcc_comparison)
                  {
                    int did_something;
                    did_something = forward_propagate_into_comparison (&gsi);
                    if (did_something == 2)
                      cfg_changed = true;
                    changed = did_something != 0;
                  }
                else if ((code == PLUS_EXPR
                          || code == BIT_IOR_EXPR
                          || code == BIT_XOR_EXPR)
                         && simplify_rotate (&gsi))
                  changed = true;
                else if (code == VEC_PERM_EXPR)
                  {
                    int did_something = simplify_permutation (&gsi);
                    if (did_something == 2)
                      cfg_changed = true;
                    changed = did_something != 0;
                  }
                else if (code == BIT_FIELD_REF)
                  changed = simplify_bitfield_ref (&gsi);
                else if (code == CONSTRUCTOR
                         && TREE_CODE (TREE_TYPE (rhs1)) == VECTOR_TYPE)
                  changed = simplify_vector_constructor (&gsi);
                break;
              }

            case GIMPLE_SWITCH:
              changed = simplify_gimple_switch (as_a <gswitch *> (stmt));
              break;

            case GIMPLE_COND:
              {
                int did_something;
                did_something =
                  forward_propagate_into_gimple_cond (as_a <gcond *> (stmt));
                if (did_something == 2)
                  cfg_changed = true;
                changed = did_something != 0;
                break;
              }

            case GIMPLE_CALL:
              {
                tree callee = gimple_call_fndecl (stmt);
                if (callee != NULL_TREE
                    && DECL_BUILT_IN_CLASS (callee) == BUILT_IN_NORMAL)
                  changed = simplify_builtin_call (&gsi, callee);
                break;
              }

            default:;
            }

          if (changed)
            {
              /* If the stmt changed then re-visit it and the statements
                 inserted before it.  */
              for (; !gsi_end_p (gsi); gsi_prev (&gsi))
                if (gimple_plf (gsi_stmt (gsi), GF_PLF_1))
                  break;
              if (gsi_end_p (gsi))
                gsi = gsi_start_bb (bb);
              else
                gsi_next (&gsi);
            }
          else
            {
              /* Stmt no longer needs to be revisited.  */
              gimple_set_plf (stmt, GF_PLF_1, true);

              /* Fill up the lattice.  */
              if (gimple_assign_single_p (stmt))
                {
                  tree lhs = gimple_assign_lhs (stmt);
                  tree rhs = gimple_assign_rhs1 (stmt);
                  if (TREE_CODE (lhs) == SSA_NAME)
                    {
                      tree val = lhs;
                      if (TREE_CODE (rhs) == SSA_NAME)
                        val = fwprop_ssa_val (rhs);
                      else if (is_gimple_min_invariant (rhs))
                        val = rhs;
                      fwprop_set_lattice_val (lhs, val);
                    }
                }

              gsi_next (&gsi);
            }
        }
    }
  free (postorder);
  lattice.release ();

  cfg_changed |= gimple_purge_all_dead_eh_edges (to_purge);
  BITMAP_FREE (to_purge);

  if (cfg_changed)
    todoflags |= TODO_cleanup_cfg;

  return todoflags;
}

} // anon namespace
gimple_opt_pass *
make_pass_forwprop (gcc::context *ctxt)
{
  return new pass_forwprop (ctxt);
}