2005-04-29 Jim Tison <jtison@us.ibm.com>
[official-gcc.git] / gcc / tree-if-conv.c
blob4eb5a26e6c9b2e1a178d6235fc66c57ca7eddba9
1 /* If-conversion for vectorizer.
2 Copyright (C) 2004, 2005 Free Software Foundation, Inc.
3 Contributed by Devang Patel <dpatel@apple.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
22 /* This pass implements tree level if-conversion transformation of loops.
23 Initial goal is to help vectorizer vectorize loops with conditions.
25 A short description of if-conversion:
27 o Decide if a loop is if-convertible or not.
28 o Walk all loop basic blocks in breadth first order (BFS order).
29 o Remove conditional statements (at the end of basic block)
30 and propagate condition into destination basic blocks'
31 predicate list.
32 o Replace modify expression with conditional modify expression
33 using current basic block's condition.
34 o Merge all basic blocks
35 o Replace phi nodes with conditional modify expr
36 o Merge all basic blocks into header
38 Sample transformation:
40 INPUT
41 -----
43 # i_23 = PHI <0(0), i_18(10)>;
44 <L0>:;
45 j_15 = A[i_23];
46 if (j_15 > 41) goto <L1>; else goto <L17>;
48 <L17>:;
49 goto <bb 3> (<L3>);
51 <L1>:;
53 # iftmp.2_4 = PHI <0(8), 42(2)>;
54 <L3>:;
55 A[i_23] = iftmp.2_4;
56 i_18 = i_23 + 1;
57 if (i_18 <= 15) goto <L19>; else goto <L18>;
59 <L19>:;
60 goto <bb 1> (<L0>);
62 <L18>:;
64 OUTPUT
65 ------
67 # i_23 = PHI <0(0), i_18(10)>;
68 <L0>:;
69 j_15 = A[i_23];
71 <L3>:;
72 iftmp.2_4 = j_15 > 41 ? 42 : 0;
73 A[i_23] = iftmp.2_4;
74 i_18 = i_23 + 1;
75 if (i_18 <= 15) goto <L19>; else goto <L18>;
77 <L19>:;
78 goto <bb 1> (<L0>);
80 <L18>:;
83 #include "config.h"
84 #include "system.h"
85 #include "coretypes.h"
86 #include "tm.h"
87 #include "errors.h"
88 #include "tree.h"
89 #include "c-common.h"
90 #include "flags.h"
91 #include "timevar.h"
92 #include "varray.h"
93 #include "rtl.h"
94 #include "basic-block.h"
95 #include "diagnostic.h"
96 #include "tree-flow.h"
97 #include "tree-dump.h"
98 #include "cfgloop.h"
99 #include "tree-chrec.h"
100 #include "tree-data-ref.h"
101 #include "tree-scalar-evolution.h"
102 #include "tree-pass.h"
103 #include "target.h"
105 /* local function prototypes */
106 static void main_tree_if_conversion (void);
107 static tree tree_if_convert_stmt (struct loop *loop, tree, tree,
108 block_stmt_iterator *);
109 static void tree_if_convert_cond_expr (struct loop *, tree, tree,
110 block_stmt_iterator *);
111 static bool if_convertible_phi_p (struct loop *, basic_block, tree);
112 static bool if_convertible_modify_expr_p (struct loop *, basic_block, tree);
113 static bool if_convertible_stmt_p (struct loop *, basic_block, tree);
114 static bool if_convertible_bb_p (struct loop *, basic_block, bool);
115 static bool if_convertible_loop_p (struct loop *, bool);
116 static void add_to_predicate_list (basic_block, tree);
117 static tree add_to_dst_predicate_list (struct loop * loop, basic_block, tree, tree,
118 block_stmt_iterator *);
119 static void clean_predicate_lists (struct loop *loop);
120 static basic_block find_phi_replacement_condition (struct loop *loop,
121 basic_block, tree *,
122 block_stmt_iterator *);
123 static void replace_phi_with_cond_modify_expr (tree, tree, basic_block,
124 block_stmt_iterator *);
125 static void process_phi_nodes (struct loop *);
126 static void combine_blocks (struct loop *);
127 static tree ifc_temp_var (tree, tree);
128 static bool pred_blocks_visited_p (basic_block, bitmap *);
129 static basic_block * get_loop_body_in_if_conv_order (const struct loop *loop);
130 static bool bb_with_exit_edge_p (struct loop *, basic_block);
132 /* List of basic blocks in if-conversion-suitable order. */
133 static basic_block *ifc_bbs;
135 /* Main entry point.
136 Apply if-conversion to the LOOP. Return true if successful otherwise return
137 false. If false is returned then loop remains unchanged.
138 FOR_VECTORIZER is a boolean flag. It indicates whether if-conversion is used
139 for vectorizer or not. If it is used for vectorizer, additional checks are
140 used. (Vectorization checks are not yet implemented). */
142 static bool
143 tree_if_conversion (struct loop *loop, bool for_vectorizer)
145 basic_block bb;
146 block_stmt_iterator itr;
147 tree cond;
148 unsigned int i;
150 ifc_bbs = NULL;
152 /* if-conversion is not appropriate for all loops. First, check if loop is
153 if-convertible or not. */
154 if (!if_convertible_loop_p (loop, for_vectorizer))
156 if (dump_file && (dump_flags & TDF_DETAILS))
157 fprintf (dump_file,"-------------------------\n");
158 if (ifc_bbs)
160 free (ifc_bbs);
161 ifc_bbs = NULL;
163 free_dominance_info (CDI_POST_DOMINATORS);
164 return false;
167 cond = NULL_TREE;
169 /* Do actual work now. */
170 for (i = 0; i < loop->num_nodes; i++)
172 bb = ifc_bbs [i];
174 /* Update condition using predicate list. */
175 cond = bb->aux;
177 /* Process all statements in this basic block.
178 Remove conditional expression, if any, and annotate
179 destination basic block(s) appropriately. */
180 for (itr = bsi_start (bb); !bsi_end_p (itr); /* empty */)
182 tree t = bsi_stmt (itr);
183 cond = tree_if_convert_stmt (loop, t, cond, &itr);
184 if (!bsi_end_p (itr))
185 bsi_next (&itr);
188 /* If current bb has only one successor, then consider it as an
189 unconditional goto. */
190 if (single_succ_p (bb))
192 basic_block bb_n = single_succ (bb);
193 if (cond != NULL_TREE)
194 add_to_predicate_list (bb_n, cond);
195 cond = NULL_TREE;
199 /* Now, all statements are if-converted and basic blocks are
200 annotated appropriately. Combine all basic block into one huge
201 basic block. */
202 combine_blocks (loop);
204 /* clean up */
205 clean_predicate_lists (loop);
206 free (ifc_bbs);
207 ifc_bbs = NULL;
209 return true;
212 /* if-convert stmt T which is part of LOOP.
213 If T is a MODIFY_EXPR than it is converted into conditional modify
214 expression using COND. For conditional expressions, add condition in the
215 destination basic block's predicate list and remove conditional
216 expression itself. BSI is the iterator used to traverse statements of
217 loop. It is used here when it is required to delete current statement. */
219 static tree
220 tree_if_convert_stmt (struct loop * loop, tree t, tree cond,
221 block_stmt_iterator *bsi)
223 if (dump_file && (dump_flags & TDF_DETAILS))
225 fprintf (dump_file, "------if-convert stmt\n");
226 print_generic_stmt (dump_file, t, TDF_SLIM);
227 print_generic_stmt (dump_file, cond, TDF_SLIM);
230 switch (TREE_CODE (t))
232 /* Labels are harmless here. */
233 case LABEL_EXPR:
234 break;
236 case MODIFY_EXPR:
237 /* This modify_expr is killing previous value of LHS. Appropriate value will
238 be selected by PHI node based on condition. It is possible that before
239 this transformation, PHI nodes was selecting default value and now it will
240 use this new value. This is OK because it does not change validity the
241 program. */
242 break;
244 case GOTO_EXPR:
245 /* Unconditional goto */
246 add_to_predicate_list (bb_for_stmt (TREE_OPERAND (t, 1)), cond);
247 bsi_remove (bsi);
248 cond = NULL_TREE;
249 break;
251 case COND_EXPR:
252 /* Update destination blocks' predicate list and remove this
253 condition expression. */
254 tree_if_convert_cond_expr (loop, t, cond, bsi);
255 cond = NULL_TREE;
256 break;
258 default:
259 gcc_unreachable ();
261 return cond;
264 /* STMT is COND_EXPR. Update two destination's predicate list.
265 Remove COND_EXPR, if it is not the loop exit condition. Otherwise
266 update loop exit condition appropriately. BSI is the iterator
267 used to traverse statement list. STMT is part of loop LOOP. */
269 static void
270 tree_if_convert_cond_expr (struct loop *loop, tree stmt, tree cond,
271 block_stmt_iterator *bsi)
273 tree c, c2;
274 edge true_edge, false_edge;
276 gcc_assert (TREE_CODE (stmt) == COND_EXPR);
278 c = COND_EXPR_COND (stmt);
280 extract_true_false_edges_from_block (bb_for_stmt (stmt),
281 &true_edge, &false_edge);
283 /* Add new condition into destination's predicate list. */
285 /* If 'c' is true then TRUE_EDGE is taken. */
286 add_to_dst_predicate_list (loop, true_edge->dest, cond,
287 unshare_expr (c), bsi);
289 /* If 'c' is false then FALSE_EDGE is taken. */
290 c2 = invert_truthvalue (unshare_expr (c));
291 add_to_dst_predicate_list (loop, false_edge->dest, cond, c2, bsi);
293 /* Now this conditional statement is redundant. Remove it.
294 But, do not remove exit condition! Update exit condition
295 using new condition. */
296 if (!bb_with_exit_edge_p (loop, bb_for_stmt (stmt)))
298 bsi_remove (bsi);
299 cond = NULL_TREE;
301 return;
304 /* Return true, iff PHI is if-convertible. PHI is part of loop LOOP
305 and it belongs to basic block BB.
306 PHI is not if-convertible
307 - if it has more than 2 arguments.
308 - Virtual PHI is immediately used in another PHI node. */
310 static bool
311 if_convertible_phi_p (struct loop *loop, basic_block bb, tree phi)
313 if (dump_file && (dump_flags & TDF_DETAILS))
315 fprintf (dump_file, "-------------------------\n");
316 print_generic_stmt (dump_file, phi, TDF_SLIM);
319 if (bb != loop->header && PHI_NUM_ARGS (phi) != 2)
321 if (dump_file && (dump_flags & TDF_DETAILS))
322 fprintf (dump_file, "More than two phi node args.\n");
323 return false;
326 if (!is_gimple_reg (SSA_NAME_VAR (PHI_RESULT (phi))))
328 imm_use_iterator imm_iter;
329 use_operand_p use_p;
330 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, PHI_RESULT (phi))
332 if (TREE_CODE (USE_STMT (use_p)) == PHI_NODE)
334 if (dump_file && (dump_flags & TDF_DETAILS))
335 fprintf (dump_file, "Difficult to handle this virtual phi.\n");
336 return false;
341 return true;
344 /* Return true, if M_EXPR is if-convertible.
345 MODIFY_EXPR is not if-convertible if,
346 - It is not movable.
347 - It could trap.
348 - LHS is not var decl.
349 MODIFY_EXPR is part of block BB, which is inside loop LOOP.
352 static bool
353 if_convertible_modify_expr_p (struct loop *loop, basic_block bb, tree m_expr)
355 if (dump_file && (dump_flags & TDF_DETAILS))
357 fprintf (dump_file, "-------------------------\n");
358 print_generic_stmt (dump_file, m_expr, TDF_SLIM);
361 /* Be conservative and do not handle immovable expressions. */
362 if (movement_possibility (m_expr) == MOVE_IMPOSSIBLE)
364 if (dump_file && (dump_flags & TDF_DETAILS))
365 fprintf (dump_file, "stmt is movable. Don't take risk\n");
366 return false;
369 /* See if it needs speculative loading or not. */
370 if (bb != loop->header
371 && tree_could_trap_p (TREE_OPERAND (m_expr, 1)))
373 if (dump_file && (dump_flags & TDF_DETAILS))
374 fprintf (dump_file, "tree could trap...\n");
375 return false;
378 if (TREE_CODE (TREE_OPERAND (m_expr, 1)) == CALL_EXPR)
380 if (dump_file && (dump_flags & TDF_DETAILS))
381 fprintf (dump_file, "CALL_EXPR \n");
382 return false;
385 if (TREE_CODE (TREE_OPERAND (m_expr, 0)) != SSA_NAME
386 && bb != loop->header
387 && !bb_with_exit_edge_p (loop, bb))
389 if (dump_file && (dump_flags & TDF_DETAILS))
391 fprintf (dump_file, "LHS is not var\n");
392 print_generic_stmt (dump_file, m_expr, TDF_SLIM);
394 return false;
398 return true;
401 /* Return true, iff STMT is if-convertible.
402 Statement is if-convertible if,
403 - It is if-convertible MODIFY_EXPR
404 - IT is LABEL_EXPR, GOTO_EXPR or COND_EXPR.
405 STMT is inside block BB, which is inside loop LOOP. */
407 static bool
408 if_convertible_stmt_p (struct loop *loop, basic_block bb, tree stmt)
410 switch (TREE_CODE (stmt))
412 case LABEL_EXPR:
413 break;
415 case MODIFY_EXPR:
417 if (!if_convertible_modify_expr_p (loop, bb, stmt))
418 return false;
419 break;
421 case GOTO_EXPR:
422 case COND_EXPR:
423 break;
425 default:
426 /* Don't know what to do with 'em so don't do anything. */
427 if (dump_file && (dump_flags & TDF_DETAILS))
429 fprintf (dump_file, "don't know what to do\n");
430 print_generic_stmt (dump_file, stmt, TDF_SLIM);
432 return false;
433 break;
436 return true;
439 /* Return true, iff BB is if-convertible.
440 Note: This routine does _not_ check basic block statements and phis.
441 Basic block is not if-convertible if,
442 - Basic block is non-empty and it is after exit block (in BFS order).
443 - Basic block is after exit block but before latch.
444 - Basic block edge(s) is not normal.
445 EXIT_BB_SEEN is true if basic block with exit edge is already seen.
446 BB is inside loop LOOP. */
448 static bool
449 if_convertible_bb_p (struct loop *loop, basic_block bb, bool exit_bb_seen)
451 edge e;
452 edge_iterator ei;
454 if (dump_file && (dump_flags & TDF_DETAILS))
455 fprintf (dump_file, "----------[%d]-------------\n", bb->index);
457 if (exit_bb_seen)
459 if (bb != loop->latch)
461 if (dump_file && (dump_flags & TDF_DETAILS))
462 fprintf (dump_file, "basic block after exit bb but before latch\n");
463 return false;
465 else if (!empty_block_p (bb))
467 if (dump_file && (dump_flags & TDF_DETAILS))
468 fprintf (dump_file, "non empty basic block after exit bb\n");
469 return false;
473 /* Be less adventurous and handle only normal edges. */
474 FOR_EACH_EDGE (e, ei, bb->succs)
475 if (e->flags &
476 (EDGE_ABNORMAL_CALL | EDGE_EH | EDGE_ABNORMAL | EDGE_IRREDUCIBLE_LOOP))
478 if (dump_file && (dump_flags & TDF_DETAILS))
479 fprintf (dump_file,"Difficult to handle edges\n");
480 return false;
483 return true;
486 /* Return true, iff LOOP is if-convertible.
487 LOOP is if-convertible if,
488 - It is innermost.
489 - It has two or more basic blocks.
490 - It has only one exit.
491 - Loop header is not the exit edge.
492 - If its basic blocks and phi nodes are if convertible. See above for
493 more info.
494 FOR_VECTORIZER enables vectorizer specific checks. For example, support
495 for vector conditions, data dependency checks etc.. (Not implemented yet). */
497 static bool
498 if_convertible_loop_p (struct loop *loop, bool for_vectorizer ATTRIBUTE_UNUSED)
500 tree phi;
501 basic_block bb;
502 block_stmt_iterator itr;
503 unsigned int i;
504 edge e;
505 edge_iterator ei;
506 bool exit_bb_seen = false;
508 /* Handle only inner most loop. */
509 if (!loop || loop->inner)
511 if (dump_file && (dump_flags & TDF_DETAILS))
512 fprintf (dump_file, "not inner most loop\n");
513 return false;
516 /* If only one block, no need for if-conversion. */
517 if (loop->num_nodes <= 2)
519 if (dump_file && (dump_flags & TDF_DETAILS))
520 fprintf (dump_file, "less than 2 basic blocks\n");
521 return false;
524 /* More than one loop exit is too much to handle. */
525 if (!loop->single_exit)
527 if (dump_file && (dump_flags & TDF_DETAILS))
528 fprintf (dump_file, "multiple exits\n");
529 return false;
532 /* ??? Check target's vector conditional operation support for vectorizer. */
534 /* If one of the loop header's edge is exit edge then do not apply
535 if-conversion. */
536 FOR_EACH_EDGE (e, ei, loop->header->succs)
538 if (loop_exit_edge_p (loop, e))
539 return false;
542 calculate_dominance_info (CDI_DOMINATORS);
543 calculate_dominance_info (CDI_POST_DOMINATORS);
545 /* Allow statements that can be handled during if-conversion. */
546 ifc_bbs = get_loop_body_in_if_conv_order (loop);
547 if (!ifc_bbs)
549 if (dump_file && (dump_flags & TDF_DETAILS))
550 fprintf (dump_file,"Irreducible loop\n");
551 free_dominance_info (CDI_POST_DOMINATORS);
552 return false;
555 for (i = 0; i < loop->num_nodes; i++)
557 bb = ifc_bbs[i];
559 if (!if_convertible_bb_p (loop, bb, exit_bb_seen))
560 return false;
562 /* Check statements. */
563 for (itr = bsi_start (bb); !bsi_end_p (itr); bsi_next (&itr))
564 if (!if_convertible_stmt_p (loop, bb, bsi_stmt (itr)))
565 return false;
566 /* ??? Check data dependency for vectorizer. */
568 /* What about phi nodes ? */
569 for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
570 if (!if_convertible_phi_p (loop, bb, phi))
571 return false;
573 if (bb_with_exit_edge_p (loop, bb))
574 exit_bb_seen = true;
577 /* OK. Did not find any potential issues so go ahead in if-convert
578 this loop. Now there is no looking back. */
579 if (dump_file)
580 fprintf (dump_file,"Applying if-conversion\n");
582 free_dominance_info (CDI_POST_DOMINATORS);
583 return true;
586 /* Add condition COND into predicate list of basic block BB. */
588 static void
589 add_to_predicate_list (basic_block bb, tree new_cond)
591 tree cond = bb->aux;
593 if (cond)
594 cond = fold (build (TRUTH_OR_EXPR, boolean_type_node,
595 unshare_expr (cond), new_cond));
596 else
597 cond = new_cond;
599 bb->aux = cond;
602 /* Add condition COND into BB's predicate list. PREV_COND is
603 existing condition. */
605 static tree
606 add_to_dst_predicate_list (struct loop * loop, basic_block bb,
607 tree prev_cond, tree cond,
608 block_stmt_iterator *bsi)
610 tree new_cond = NULL_TREE;
612 if (!flow_bb_inside_loop_p (loop, bb))
613 return NULL_TREE;
615 if (prev_cond == boolean_true_node || !prev_cond)
616 new_cond = unshare_expr (cond);
617 else
619 tree tmp;
620 tree tmp_stmt = NULL_TREE;
621 tree tmp_stmts1 = NULL_TREE;
622 tree tmp_stmts2 = NULL_TREE;
623 prev_cond = force_gimple_operand (unshare_expr (prev_cond),
624 &tmp_stmts1, true, NULL);
625 if (tmp_stmts1)
626 bsi_insert_before (bsi, tmp_stmts1, BSI_SAME_STMT);
628 cond = force_gimple_operand (unshare_expr (cond),
629 &tmp_stmts2, true, NULL);
630 if (tmp_stmts2)
631 bsi_insert_before (bsi, tmp_stmts2, BSI_SAME_STMT);
633 /* new_cond == prev_cond AND cond */
634 tmp = build (TRUTH_AND_EXPR, boolean_type_node,
635 unshare_expr (prev_cond), cond);
636 tmp_stmt = ifc_temp_var (boolean_type_node, tmp);
637 bsi_insert_before (bsi, tmp_stmt, BSI_SAME_STMT);
638 new_cond = TREE_OPERAND (tmp_stmt, 0);
640 add_to_predicate_list (bb, new_cond);
641 return new_cond;
644 /* During if-conversion aux field from basic block is used to hold predicate
645 list. Clean each basic block's predicate list for the given LOOP. */
647 static void
648 clean_predicate_lists (struct loop *loop)
650 basic_block *bb;
651 unsigned int i;
652 bb = get_loop_body (loop);
653 for (i = 0; i < loop->num_nodes; i++)
654 bb[i]->aux = NULL;
656 free (bb);
659 /* Basic block BB has two predecessors. Using predecessor's aux field, set
660 appropriate condition COND for the PHI node replacement. Return true block
661 whose phi arguments are selected when cond is true. */
663 static basic_block
664 find_phi_replacement_condition (struct loop *loop,
665 basic_block bb, tree *cond,
666 block_stmt_iterator *bsi)
668 basic_block first_bb = NULL;
669 basic_block second_bb = NULL;
670 tree tmp_cond;
672 gcc_assert (EDGE_COUNT (bb->preds) == 2);
673 first_bb = (EDGE_PRED (bb, 0))->src;
674 second_bb = (EDGE_PRED (bb, 1))->src;
676 /* Use condition based on following criteria:
678 S1: x = !c ? a : b;
680 S2: x = c ? b : a;
682 S2 is preferred over S1. Make 'b' first_bb and use its condition.
684 2) Do not make loop header first_bb.
687 S1: x = !(c == d)? a : b;
689 S21: t1 = c == d;
690 S22: x = t1 ? b : a;
692 S3: x = (c == d) ? b : a;
694 S3 is preferred over S1 and S2*, Make 'b' first_bb and use
695 its condition. */
697 /* Select condition that is not TRUTH_NOT_EXPR. */
698 tmp_cond = first_bb->aux;
699 if (TREE_CODE (tmp_cond) == TRUTH_NOT_EXPR)
701 basic_block tmp_bb;
702 tmp_bb = first_bb;
703 first_bb = second_bb;
704 second_bb = first_bb;
707 /* Check if FIRST_BB is loop header or not. */
708 if (first_bb == loop->header)
710 tmp_cond = second_bb->aux;
711 if (TREE_CODE (tmp_cond) == TRUTH_NOT_EXPR)
713 /* Select non loop header condition but do not switch basic blocks. */
714 *cond = invert_truthvalue (unshare_expr (tmp_cond));
716 else
718 /* Select non loop header condition. */
719 first_bb = second_bb;
720 *cond = first_bb->aux;
723 else
724 /* FIRST_BB is not loop header */
725 *cond = first_bb->aux;
727 /* Create temp. for the condition. Vectorizer prefers to have gimple
728 value as condition. Various targets use different means to communicate
729 condition in vector compare operation. Using gimple value allows compiler
730 to emit vector compare and select RTL without exposing compare's result. */
731 if (!is_gimple_reg (*cond) && !is_gimple_condexpr (*cond))
733 tree new_stmt;
735 new_stmt = ifc_temp_var (TREE_TYPE (*cond), unshare_expr (*cond));
736 bsi_insert_after (bsi, new_stmt, BSI_SAME_STMT);
737 bsi_next (bsi);
738 *cond = TREE_OPERAND (new_stmt, 0);
741 gcc_assert (*cond);
743 return first_bb;
747 /* Replace PHI node with conditional modify expr using COND.
748 This routine does not handle PHI nodes with more than two arguments.
749 For example,
750 S1: A = PHI <x1(1), x2(5)
751 is converted into,
752 S2: A = cond ? x1 : x2;
753 S2 is inserted at the top of basic block's statement list.
754 When COND is true, phi arg from TRUE_BB is selected.
757 static void
758 replace_phi_with_cond_modify_expr (tree phi, tree cond, basic_block true_bb,
759 block_stmt_iterator *bsi)
761 tree new_stmt;
762 basic_block bb;
763 tree rhs;
764 tree arg_0, arg_1;
766 gcc_assert (TREE_CODE (phi) == PHI_NODE);
768 /* If this is not filtered earlier, then now it is too late. */
769 gcc_assert (PHI_NUM_ARGS (phi) == 2);
771 /* Find basic block and initialize iterator. */
772 bb = bb_for_stmt (phi);
774 new_stmt = NULL_TREE;
775 arg_0 = NULL_TREE;
776 arg_1 = NULL_TREE;
778 /* Use condition that is not TRUTH_NOT_EXPR in conditional modify expr. */
779 if (EDGE_PRED (bb, 1)->src == true_bb)
781 arg_0 = PHI_ARG_DEF (phi, 1);
782 arg_1 = PHI_ARG_DEF (phi, 0);
784 else
786 arg_0 = PHI_ARG_DEF (phi, 0);
787 arg_1 = PHI_ARG_DEF (phi, 1);
790 /* Build new RHS using selected condition and arguments. */
791 rhs = build (COND_EXPR, TREE_TYPE (PHI_RESULT (phi)),
792 unshare_expr (cond), unshare_expr (arg_0),
793 unshare_expr (arg_1));
795 /* Create new MODIFY expression using RHS. */
796 new_stmt = build (MODIFY_EXPR, TREE_TYPE (PHI_RESULT (phi)),
797 unshare_expr (PHI_RESULT (phi)), rhs);
799 /* Make new statement definition of the original phi result. */
800 SSA_NAME_DEF_STMT (PHI_RESULT (phi)) = new_stmt;
802 /* Set basic block and insert using iterator. */
803 set_bb_for_stmt (new_stmt, bb);
805 bsi_insert_after (bsi, new_stmt, BSI_SAME_STMT);
806 bsi_next (bsi);
808 update_stmt (new_stmt);
810 if (dump_file && (dump_flags & TDF_DETAILS))
812 fprintf (dump_file, "new phi replacement stmt\n");
813 print_generic_stmt (dump_file, new_stmt, TDF_SLIM);
817 /* Process phi nodes for the given LOOP. Replace phi nodes with cond
818 modify expr. */
820 static void
821 process_phi_nodes (struct loop *loop)
823 basic_block bb;
824 unsigned int orig_loop_num_nodes = loop->num_nodes;
825 unsigned int i;
827 /* Replace phi nodes with cond. modify expr. */
828 for (i = 1; i < orig_loop_num_nodes; i++)
830 tree phi, cond;
831 block_stmt_iterator bsi;
832 basic_block true_bb = NULL;
833 bb = ifc_bbs[i];
835 if (bb == loop->header)
836 continue;
838 phi = phi_nodes (bb);
839 bsi = bsi_after_labels (bb);
841 /* BB has two predecessors. Using predecessor's aux field, set
842 appropriate condition for the PHI node replacement. */
843 if (phi)
844 true_bb = find_phi_replacement_condition (loop, bb, &cond, &bsi);
846 while (phi)
848 tree next = PHI_CHAIN (phi);
849 replace_phi_with_cond_modify_expr (phi, cond, true_bb, &bsi);
850 release_phi_node (phi);
851 phi = next;
853 bb_ann (bb)->phi_nodes = NULL;
855 return;
858 /* Combine all basic block from the given LOOP into one or two super
859 basic block. Replace PHI nodes with conditional modify expression. */
861 static void
862 combine_blocks (struct loop *loop)
864 basic_block bb, exit_bb, merge_target_bb;
865 unsigned int orig_loop_num_nodes = loop->num_nodes;
866 unsigned int i;
867 unsigned int n_exits;
869 get_loop_exit_edges (loop, &n_exits);
870 /* Process phi nodes to prepare blocks for merge. */
871 process_phi_nodes (loop);
873 exit_bb = NULL;
875 /* Merge basic blocks */
876 merge_target_bb = loop->header;
877 for (i = 1; i < orig_loop_num_nodes; i++)
879 edge e;
880 block_stmt_iterator bsi;
881 tree_stmt_iterator last;
883 bb = ifc_bbs[i];
885 if (!exit_bb && bb_with_exit_edge_p (loop, bb))
886 exit_bb = bb;
888 if (bb == exit_bb)
890 edge_iterator ei;
892 /* Connect this node with loop header. */
893 make_edge (ifc_bbs[0], bb, EDGE_FALLTHRU);
894 set_immediate_dominator (CDI_DOMINATORS, bb, ifc_bbs[0]);
896 if (exit_bb != loop->latch)
898 /* Redirect non-exit edge to loop->latch. */
899 FOR_EACH_EDGE (e, ei, bb->succs)
901 if (!loop_exit_edge_p (loop, e))
903 redirect_edge_and_branch (e, loop->latch);
904 set_immediate_dominator (CDI_DOMINATORS, loop->latch, bb);
908 continue;
911 if (bb == loop->latch && empty_block_p (bb))
912 continue;
914 /* It is time to remove this basic block. First remove edges. */
915 while (EDGE_COUNT (bb->preds) > 0)
916 remove_edge (EDGE_PRED (bb, 0));
918 /* This is loop latch and loop does not have exit then do not
919 delete this basic block. Just remove its PREDS and reconnect
920 loop->header and loop->latch blocks. */
921 if (bb == loop->latch && n_exits == 0)
923 make_edge (loop->header, loop->latch, EDGE_FALLTHRU);
924 set_immediate_dominator (CDI_DOMINATORS, loop->latch, loop->header);
925 continue;
928 while (EDGE_COUNT (bb->succs) > 0)
929 remove_edge (EDGE_SUCC (bb, 0));
931 /* Remove labels and make stmts member of loop->header. */
932 for (bsi = bsi_start (bb); !bsi_end_p (bsi); )
934 if (TREE_CODE (bsi_stmt (bsi)) == LABEL_EXPR)
935 bsi_remove (&bsi);
936 else
938 set_bb_for_stmt (bsi_stmt (bsi), merge_target_bb);
939 bsi_next (&bsi);
943 /* Update stmt list. */
944 last = tsi_last (merge_target_bb->stmt_list);
945 tsi_link_after (&last, bb->stmt_list, TSI_NEW_STMT);
946 bb->stmt_list = NULL;
948 /* Update dominator info. */
949 if (dom_computed[CDI_DOMINATORS])
950 delete_from_dominance_info (CDI_DOMINATORS, bb);
951 if (dom_computed[CDI_POST_DOMINATORS])
952 delete_from_dominance_info (CDI_POST_DOMINATORS, bb);
954 /* Remove basic block. */
955 if (bb == loop->latch)
956 loop->latch = merge_target_bb;
957 remove_bb_from_loops (bb);
958 expunge_block (bb);
961 /* Now if possible, merge loop header and block with exit edge.
962 This reduces number of basic blocks to 2. Auto vectorizer addresses
963 loops with two nodes only. FIXME: Use cleanup_tree_cfg(). */
964 if (exit_bb
965 && loop->header != loop->latch
966 && exit_bb != loop->latch
967 && empty_block_p (loop->latch))
969 if (can_merge_blocks_p (loop->header, exit_bb))
971 remove_bb_from_loops (exit_bb);
972 merge_blocks (loop->header, exit_bb);
977 /* Make new temp variable of type TYPE. Add MODIFY_EXPR to assign EXP
978 to the new variable. */
980 static tree
981 ifc_temp_var (tree type, tree exp)
983 const char *name = "_ifc_";
984 tree var, stmt, new_name;
986 if (is_gimple_reg (exp))
987 return exp;
989 /* Create new temporary variable. */
990 var = create_tmp_var (type, name);
991 add_referenced_tmp_var (var);
993 /* Build new statement to assign EXP to new variable. */
994 stmt = build (MODIFY_EXPR, type, var, exp);
996 /* Get SSA name for the new variable and set make new statement
997 its definition statement. */
998 new_name = make_ssa_name (var, stmt);
999 TREE_OPERAND (stmt, 0) = new_name;
1000 SSA_NAME_DEF_STMT (new_name) = stmt;
1002 return stmt;
1006 /* Return TRUE iff, all pred blocks of BB are visited.
1007 Bitmap VISITED keeps history of visited blocks. */
1009 static bool
1010 pred_blocks_visited_p (basic_block bb, bitmap *visited)
1012 edge e;
1013 edge_iterator ei;
1014 FOR_EACH_EDGE (e, ei, bb->preds)
1015 if (!bitmap_bit_p (*visited, e->src->index))
1016 return false;
1018 return true;
1021 /* Get body of a LOOP in suitable order for if-conversion.
1022 It is caller's responsibility to deallocate basic block
1023 list. If-conversion suitable order is, BFS order with one
1024 additional constraint. Select block in BFS block, if all
1025 pred are already selected. */
1027 static basic_block *
1028 get_loop_body_in_if_conv_order (const struct loop *loop)
1030 basic_block *blocks, *blocks_in_bfs_order;
1031 basic_block bb;
1032 bitmap visited;
1033 unsigned int index = 0;
1034 unsigned int visited_count = 0;
1036 gcc_assert (loop->num_nodes);
1037 gcc_assert (loop->latch != EXIT_BLOCK_PTR);
1039 blocks = xcalloc (loop->num_nodes, sizeof (basic_block));
1040 visited = BITMAP_ALLOC (NULL);
1042 blocks_in_bfs_order = get_loop_body_in_bfs_order (loop);
1044 index = 0;
1045 while (index < loop->num_nodes)
1047 bb = blocks_in_bfs_order [index];
1049 if (bb->flags & BB_IRREDUCIBLE_LOOP)
1051 free (blocks_in_bfs_order);
1052 BITMAP_FREE (visited);
1053 free (blocks);
1054 return NULL;
1056 if (!bitmap_bit_p (visited, bb->index))
1058 if (pred_blocks_visited_p (bb, &visited)
1059 || bb == loop->header)
1061 /* This block is now visited. */
1062 bitmap_set_bit (visited, bb->index);
1063 blocks[visited_count++] = bb;
1066 index++;
1067 if (index == loop->num_nodes
1068 && visited_count != loop->num_nodes)
1070 /* Not done yet. */
1071 index = 0;
1074 free (blocks_in_bfs_order);
1075 BITMAP_FREE (visited);
1076 return blocks;
1079 /* Return true if one of the basic block BB edge is exit of LOOP. */
1081 static bool
1082 bb_with_exit_edge_p (struct loop *loop, basic_block bb)
1084 edge e;
1085 edge_iterator ei;
1086 bool exit_edge_found = false;
1088 FOR_EACH_EDGE (e, ei, bb->succs)
1089 if (loop_exit_edge_p (loop, e))
1091 exit_edge_found = true;
1092 break;
1095 return exit_edge_found;
1098 /* Tree if-conversion pass management. */
1100 static void
1101 main_tree_if_conversion (void)
1103 unsigned i, loop_num;
1104 struct loop *loop;
1106 if (!current_loops)
1107 return;
1109 loop_num = current_loops->num;
1110 for (i = 0; i < loop_num; i++)
1112 loop = current_loops->parray[i];
1113 if (!loop)
1114 continue;
1116 tree_if_conversion (loop, true);
1121 static bool
1122 gate_tree_if_conversion (void)
1124 return flag_tree_vectorize != 0;
1127 struct tree_opt_pass pass_if_conversion =
1129 "ifcvt", /* name */
1130 gate_tree_if_conversion, /* gate */
1131 main_tree_if_conversion, /* execute */
1132 NULL, /* sub */
1133 NULL, /* next */
1134 0, /* static_pass_number */
1135 0, /* tv_id */
1136 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
1137 0, /* properties_provided */
1138 0, /* properties_destroyed */
1139 0, /* todo_flags_start */
1140 TODO_dump_func | TODO_verify_loops | TODO_verify_stmts | TODO_verify_flow,
1141 /* todo_flags_finish */
1142 0 /* letter */