Ayee, missed a file.
[official-gcc.git] / gcc / tree-tailcall.c
blob6e1957c597d3c9b1684ac2f6ca969f83bb9be87d
1 /* Tail call optimization on trees.
2 Copyright (C) 2003 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING. If not, write to
18 the Free Software Foundation, 59 Temple Place - Suite 330,
19 Boston, MA 02111-1307, USA. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "tree.h"
26 #include "rtl.h"
27 #include "tm_p.h"
28 #include "hard-reg-set.h"
29 #include "basic-block.h"
30 #include "function.h"
31 #include "tree-flow.h"
32 #include "tree-dump.h"
33 #include "diagnostic.h"
34 #include "except.h"
35 #include "tree-pass.h"
36 #include "flags.h"
37 #include "langhooks.h"
39 /* The file implements the tail recursion elimination. It is also used to
40 analyze the tail calls in general, passing the results to the rtl level
41 where they are used for sibcall optimization.
43 In addition to the standard tail recursion elimination, we handle the most
44 trivial cases of making the call tail recursive by creating accumulators.
45 For example the following function
47 int sum (int n)
49 if (n > 0)
50 return n + sum (n - 1);
51 else
52 return 0;
55 is transformed into
57 int sum (int n)
59 int acc = 0;
61 while (n > 0)
62 acc += n--;
64 return acc;
67 To do this, we maintain two accumulators (a_acc and m_acc) that indicate
68 that, when we reach a "return x" statement, we should return
69 a_acc + x * m_acc instead. They are initialized to 0 and 1, respectively,
70 so the semantics of the function are obviously preserved. If we are
71 guaranteed that the value of an accumulator never changes, we
72 omit that accumulator.
74 There are three ways in which the function may exit. The first one is
75 handled in adjust_return_value, the other two in adjust_accumulator_values
76 (the second case is actually a special case of the third one and we
77 present it separately just for clarity):
79 1) Just return x, where x is not in any of the remaining special shapes.
80 We rewrite this to a gimple equivalent of return m_acc * x + a_acc.
82 2) return f (...), where f is the current function, is rewritten in a
83 classical tail-recursion elimination way, into assignment of arguments
84 and jump to the start of the function. Values of the accumulators
85 are unchanged.
87 3) return a + m * f(...), where a and m do not depend on call to f.
88 To preserve the semantics described before we want this to be rewritten
89 in such a way that we finally return
91 a_acc + (a + m * f(...)) * m_acc = (a_acc + a * m_acc) + (m * m_acc) * f(...).
93 I.e. we increase a_acc by a * m_acc, multiply m_acc by m and
94 eliminate the tail call to f. Special cases when the value is just
95 added or just multiplied are obtained by setting a = 0 or m = 1.
97 TODO -- it is possible to do similar tricks for other operations. */
99 /* A structure that describes the tailcall. */
101 struct tailcall
103 /* The block in that the call occur. */
104 basic_block call_block;
106 /* The iterator pointing to the call statement. */
107 block_stmt_iterator call_bsi;
109 /* True if it is a call to the current function. */
110 bool tail_recursion;
112 /* The return value of the caller is mult * f + add, where f is the return
113 value of the call. */
114 tree mult, add;
116 /* Next tailcall in the chain. */
117 struct tailcall *next;
120 /* The variables holding the value of multiplicative and additive
121 accumulator. */
122 static tree m_acc, a_acc;
124 static bool suitable_for_tail_opt_p (void);
125 static bool optimize_tail_call (struct tailcall *, bool);
126 static void eliminate_tail_call (struct tailcall *);
127 static void find_tail_calls (basic_block, struct tailcall **);
129 /* Returns false when the function is not suitable for tail call optimization
130 from some reason (e.g. if it takes variable number of arguments). */
132 static bool
133 suitable_for_tail_opt_p (void)
135 int i;
137 if (current_function_stdarg)
138 return false;
140 /* No local variable should be call-clobbered. We ignore any kind
141 of memory tag, as these are not real variables. */
142 for (i = 0; i < (int) VARRAY_ACTIVE_SIZE (referenced_vars); i++)
144 tree var = VARRAY_TREE (referenced_vars, i);
146 if (!TREE_STATIC (var)
147 && var_ann (var)->mem_tag_kind == NOT_A_TAG
148 && is_call_clobbered (var))
149 return false;
152 return true;
154 /* Returns false when the function is not suitable for tail call optimization
155 from some reason (e.g. if it takes variable number of arguments).
156 This test must pass in addition to suitable_for_tail_opt_p in order to make
157 tail call discovery happen. */
159 static bool
160 suitable_for_tail_call_opt_p (void)
162 /* alloca (until we have stack slot life analysis) inhibits
163 sibling call optimizations, but not tail recursion. */
164 if (current_function_calls_alloca)
165 return false;
167 /* If we are using sjlj exceptions, we may need to add a call to
168 _Unwind_SjLj_Unregister at exit of the function. Which means
169 that we cannot do any sibcall transformations. */
170 if (USING_SJLJ_EXCEPTIONS && current_function_has_exception_handlers ())
171 return false;
173 /* Any function that calls setjmp might have longjmp called from
174 any called function. ??? We really should represent this
175 properly in the CFG so that this needn't be special cased. */
176 if (current_function_calls_setjmp)
177 return false;
179 return true;
182 /* Checks whether the expression EXPR in stmt AT is independent of the
183 statement pointed to by BSI (in the sense that we already know EXPR's
184 value at BSI). We use the fact that we are only called from a chain of
185 basic blocks that each have only a single successor. Returns the
186 expression containing the value of EXPR at BSI, or NULL_TREE when EXPR
is neither a gimple invariant nor an SSA name, when its definition is
found at or after BSI in the block of BSI, or when it is defined by a
non-PHI statement in another block of the chain. */
188 static tree
189 independent_of_stmt_p (tree expr, tree at, block_stmt_iterator bsi)
191 basic_block bb, call_bb, at_bb;
192 edge e;
/* An invariant is returned unchanged. */
194 if (is_gimple_min_invariant (expr))
195 return expr;
197 if (TREE_CODE (expr) != SSA_NAME)
198 return NULL_TREE;
200 /* Mark the blocks in the chain leading to the end. */
/* The mark is any non-NULL aux value; the address of the aux field
itself is used. The statement after the loop marks AT's block. */
201 at_bb = bb_for_stmt (at);
202 call_bb = bb_for_stmt (bsi_stmt (bsi));
203 for (bb = call_bb; bb != at_bb; bb = bb->succ->dest)
204 bb->aux = &bb->aux;
205 bb->aux = &bb->aux;
/* Follow the definition of EXPR backwards through the marked chain. */
207 while (1)
209 at = SSA_NAME_DEF_STMT (expr);
210 bb = bb_for_stmt (at);
212 /* The default definition or defined before the chain. */
213 if (!bb || !bb->aux)
214 break;
/* In the block of BSI, look for the definition at or after BSI; if it
is found there, the value is not known at BSI. */
216 if (bb == call_bb)
218 for (; !bsi_end_p (bsi); bsi_next (&bsi))
219 if (bsi_stmt (bsi) == at)
220 break;
222 if (!bsi_end_p (bsi))
223 expr = NULL_TREE;
224 break;
/* Only PHI nodes are looked through in the other blocks of the chain. */
227 if (TREE_CODE (at) != PHI_NODE)
229 expr = NULL_TREE;
230 break;
/* Find the incoming edge whose source block is marked. */
233 for (e = bb->pred; e; e = e->pred_next)
234 if (e->src->aux)
235 break;
236 if (!e)
237 abort ();
239 expr = PHI_ARG_DEF_FROM_EDGE (at, e);
240 if (TREE_CODE (expr) != SSA_NAME)
242 /* The value is a constant. */
243 break;
247 /* Unmark the blocks. */
248 for (bb = call_bb; bb != at_bb; bb = bb->succ->dest)
249 bb->aux = NULL;
250 bb->aux = NULL;
252 return expr;
255 /* Simulates the effect of an assignment of ASS in STMT on the return value
256 of the tail recursive CALL passed in ASS_VAR. M and A are the
257 multiplicative and the additive factor for the real return value. */
259 static bool
260 process_assignment (tree ass, tree stmt, block_stmt_iterator call, tree *m,
261 tree *a, tree *ass_var)
263 tree op0, op1, non_ass_var;
264 tree dest = TREE_OPERAND (ass, 0);
265 tree src = TREE_OPERAND (ass, 1);
266 enum tree_code code = TREE_CODE (src);
267 tree src_var = src;
269 /* See if this is a simple copy operation of an SSA name to the function
270 result. In that case we may have a simple tail call. Ignore type
271 conversions that can never produce extra code between the function
272 call and the function return. */
273 STRIP_NOPS (src_var);
274 if (TREE_CODE (src_var) == SSA_NAME)
276 if (src_var != *ass_var)
277 return false;
279 *ass_var = dest;
280 return true;
283 if (TREE_CODE_CLASS (code) != '2')
284 return false;
286 /* We only handle the code like
288 x = call ();
289 y = m * x;
290 z = y + a;
291 return z;
293 TODO -- Extend it for cases where the linear transformation of the output
294 is expressed in a more complicated way. */
296 op0 = TREE_OPERAND (src, 0);
297 op1 = TREE_OPERAND (src, 1);
299 if (op0 == *ass_var
300 && (non_ass_var = independent_of_stmt_p (op1, stmt, call)))
302 else if (op1 == *ass_var
303 && (non_ass_var = independent_of_stmt_p (op0, stmt, call)))
305 else
306 return false;
308 switch (code)
310 case PLUS_EXPR:
311 /* There should be no previous addition. TODO -- it should be fairly
312 straightforward to lift this restriction -- just allow storing
313 more complicated expressions in *A, and gimplify it in
314 adjust_accumulator_values. */
315 if (*a)
316 return false;
317 *a = non_ass_var;
318 *ass_var = dest;
319 return true;
321 case MULT_EXPR:
322 /* Similar remark applies here. Handling multiplication after addition
323 is just slightly more complicated -- we need to multiply both *A and
324 *M. */
325 if (*a || *m)
326 return false;
327 *m = non_ass_var;
328 *ass_var = dest;
329 return true;
331 /* TODO -- Handle other codes (NEGATE_EXPR, MINUS_EXPR). */
333 default:
334 return false;
338 /* Propagate VAR through phis on edge E. */
340 static tree
341 propagate_through_phis (tree var, edge e)
343 basic_block dest = e->dest;
344 tree phi;
346 for (phi = phi_nodes (dest); phi; phi = PHI_CHAIN (phi))
347 if (PHI_ARG_DEF_FROM_EDGE (phi, e) == var)
348 return PHI_RESULT (phi);
350 return var;
353 /* Finds tailcalls falling into basic block BB. The list of found tailcalls is
354 added to the start of RET. BB is scanned backwards for a call; when the
block contains none, the search recurses into the predecessors of BB. The
statements following the call up to the return are then checked, and the
multiplicative and additive factors they apply to the call's value are
recorded in the new tailcall entry. */
356 static void
357 find_tail_calls (basic_block bb, struct tailcall **ret)
359 tree ass_var, ret_var, stmt, func, param, args, call = NULL_TREE;
360 block_stmt_iterator bsi, absi;
361 bool tail_recursion;
362 struct tailcall *nw;
363 edge e;
364 tree m, a;
365 basic_block abb;
366 stmt_ann_t ann;
/* Blocks with more than one successor are not handled. */
368 if (bb->succ->succ_next)
369 return;
/* Walk the statements of BB from the last one towards the first. */
371 for (bsi = bsi_last (bb); !bsi_end_p (bsi); bsi_prev (&bsi))
373 stmt = bsi_stmt (bsi);
375 /* Ignore labels. */
376 if (TREE_CODE (stmt) == LABEL_EXPR)
377 continue;
379 get_stmt_operands (stmt);
381 /* Check for a call. */
/* The call is either the right-hand side of an assignment (possibly
wrapped in a WITH_SIZE_EXPR) or the statement itself. */
382 if (TREE_CODE (stmt) == MODIFY_EXPR)
384 ass_var = TREE_OPERAND (stmt, 0);
385 call = TREE_OPERAND (stmt, 1);
386 if (TREE_CODE (call) == WITH_SIZE_EXPR)
387 call = TREE_OPERAND (call, 0);
389 else
391 ass_var = NULL_TREE;
392 call = stmt;
395 if (TREE_CODE (call) == CALL_EXPR)
396 break;
398 /* If the statement has virtual operands, fail. */
399 ann = stmt_ann (stmt);
400 if (NUM_V_MAY_DEFS (V_MAY_DEF_OPS (ann))
401 || NUM_V_MUST_DEFS (V_MUST_DEF_OPS (ann))
402 || NUM_VUSES (VUSE_OPS (ann)))
403 return;
/* No call was found in this block. */
406 if (bsi_end_p (bsi))
408 /* Recurse to the predecessors. */
409 for (e = bb->pred; e; e = e->pred_next)
410 find_tail_calls (e->src, ret);
412 return;
415 /* We found the call, check whether it is suitable. */
/* A call to the current function counts as tail recursion only when the
argument list and the parameter list end together and every argument is
either the parameter itself or the parameter has a gimple register type
compatible with the type of the argument. */
416 tail_recursion = false;
417 func = get_callee_fndecl (call);
418 if (func == current_function_decl)
420 for (param = DECL_ARGUMENTS (func), args = TREE_OPERAND (call, 1);
421 param && args;
422 param = TREE_CHAIN (param), args = TREE_CHAIN (args))
424 tree arg = TREE_VALUE (args);
425 if (param != arg
426 /* Make sure there are no problems with copying. Note we must
427 have a copyable type and the two arguments must have reasonably
428 equivalent types. The latter requirement could be relaxed if
429 we emitted a suitable type conversion statement. */
430 && (!is_gimple_reg_type (TREE_TYPE (param))
431 || !lang_hooks.types_compatible_p (TREE_TYPE (param),
432 TREE_TYPE (arg))))
433 break;
435 if (!args && !param)
436 tail_recursion = true;
439 /* Now check the statements after the call. None of them has virtual
440 operands, so they may only depend on the call through its return
441 value. The return value should also be dependent on each of them,
442 since we are running after dce. */
443 m = NULL_TREE;
444 a = NULL_TREE;
446 abb = bb;
447 absi = bsi;
448 while (1)
450 bsi_next (&absi);
/* At the end of a block, continue in its successor and translate ASS_VAR
through the phi nodes found there. */
452 while (bsi_end_p (absi))
454 ass_var = propagate_through_phis (ass_var, abb->succ);
455 abb = abb->succ->dest;
456 absi = bsi_start (abb);
459 stmt = bsi_stmt (absi);
461 if (TREE_CODE (stmt) == LABEL_EXPR)
462 continue;
464 if (TREE_CODE (stmt) == RETURN_EXPR)
465 break;
/* Anything but an assignment that process_assignment accepts makes
the call unsuitable. */
467 if (TREE_CODE (stmt) != MODIFY_EXPR)
468 return;
470 if (!process_assignment (stmt, stmt, bsi, &m, &a, &ass_var))
471 return;
474 /* See if this is a tail call we can handle. */
/* STMT is the RETURN_EXPR here; its operand may itself be an
assignment, which is processed like the assignments above. */
475 ret_var = TREE_OPERAND (stmt, 0);
476 if (ret_var
477 && TREE_CODE (ret_var) == MODIFY_EXPR)
479 tree ret_op = TREE_OPERAND (ret_var, 1);
480 STRIP_NOPS (ret_op);
481 if (!tail_recursion
482 && TREE_CODE (ret_op) != SSA_NAME)
483 return;
485 if (!process_assignment (ret_var, stmt, bsi, &m, &a, &ass_var))
486 return;
487 ret_var = TREE_OPERAND (ret_var, 0);
490 /* We may proceed if there either is no return value, or the return value
491 is identical to the call's return. */
492 if (ret_var
493 && (ret_var != ass_var))
494 return;
496 /* If this is not a tail recursive call, we cannot handle addends or
497 multiplicands. */
498 if (!tail_recursion && (m || a))
499 return;
/* Record the call at the head of the list RET. */
501 nw = xmalloc (sizeof (struct tailcall));
503 nw->call_block = bb;
504 nw->call_bsi = bsi;
506 nw->tail_recursion = tail_recursion;
508 nw->mult = m;
509 nw->add = a;
511 nw->next = *ret;
512 *ret = nw;
515 /* Adjust the accumulator values according to A and M after BSI, and update
516 the phi nodes on edge BACK. With a nonnull A the additive accumulator
becomes a_acc + A * m_acc (or a_acc + A when there is no multiplicative
accumulator); with a nonnull M the multiplicative accumulator becomes
m_acc * M. The resulting values are added as the arguments of the
accumulator phi nodes in the destination of BACK. */
518 static void
519 adjust_accumulator_values (block_stmt_iterator bsi, tree m, tree a, edge back)
521 tree stmt, var, phi, tmp;
522 tree ret_type = TREE_TYPE (DECL_RESULT (current_function_decl));
/* The phi arguments default to the unchanged accumulators. */
523 tree a_acc_arg = a_acc, m_acc_arg = m_acc;
525 if (a)
/* Compute in VAR the amount to add to a_acc. */
527 if (m_acc)
/* When A is one, A * m_acc is just m_acc and no multiplication is emitted. */
529 if (integer_onep (a))
530 var = m_acc;
531 else
533 stmt = build (MODIFY_EXPR, ret_type, NULL_TREE,
534 build (MULT_EXPR, ret_type, m_acc, a));
536 tmp = create_tmp_var (ret_type, "acc_tmp");
537 add_referenced_tmp_var (tmp);
539 var = make_ssa_name (tmp, stmt);
540 TREE_OPERAND (stmt, 0) = var;
541 bsi_insert_after (&bsi, stmt, BSI_NEW_STMT);
544 else
545 var = a;
/* Emit the new version of the additive accumulator: a_acc + VAR. */
547 stmt = build (MODIFY_EXPR, ret_type, NULL_TREE,
548 build (PLUS_EXPR, ret_type, a_acc, var));
549 var = make_ssa_name (SSA_NAME_VAR (a_acc), stmt);
550 TREE_OPERAND (stmt, 0) = var;
551 bsi_insert_after (&bsi, stmt, BSI_NEW_STMT);
552 a_acc_arg = var;
555 if (m)
/* Emit the new version of the multiplicative accumulator: m_acc * M. */
557 stmt = build (MODIFY_EXPR, ret_type, NULL_TREE,
558 build (MULT_EXPR, ret_type, m_acc, m));
559 var = make_ssa_name (SSA_NAME_VAR (m_acc), stmt);
560 TREE_OPERAND (stmt, 0) = var;
561 bsi_insert_after (&bsi, stmt, BSI_NEW_STMT);
562 m_acc_arg = var;
/* Find the phi node whose result is a_acc and give it its argument for BACK. */
565 if (a_acc)
567 for (phi = phi_nodes (back->dest); phi; phi = PHI_CHAIN (phi))
568 if (PHI_RESULT (phi) == a_acc)
569 break;
571 add_phi_arg (&phi, a_acc_arg, back);
/* Likewise for the phi node whose result is m_acc. */
574 if (m_acc)
576 for (phi = phi_nodes (back->dest); phi; phi = PHI_CHAIN (phi))
577 if (PHI_RESULT (phi) == m_acc)
578 break;
580 add_phi_arg (&phi, m_acc_arg, back);
584 /* Adjust value of the return at the end of BB according to M and A
585 accumulators. A nonnull M makes the returned value m_acc * x and a
nonnull A then adds a_acc to it, where x is the value originally
returned. A return without a value is left alone. Aborts if BB does
not end with a RETURN_EXPR. */
587 static void
588 adjust_return_value (basic_block bb, tree m, tree a)
590 tree ret_stmt = last_stmt (bb), ret_var, var, stmt, tmp;
591 tree ret_type = TREE_TYPE (DECL_RESULT (current_function_decl));
592 block_stmt_iterator bsi = bsi_last (bb);
594 if (TREE_CODE (ret_stmt) != RETURN_EXPR)
595 abort ();
597 ret_var = TREE_OPERAND (ret_stmt, 0);
598 if (!ret_var)
599 return;
/* When the return contains an assignment, turn the assignment into a
statement of its own (replacing the return) and append a new return of
the assigned variable after it. */
601 if (TREE_CODE (ret_var) == MODIFY_EXPR)
603 ret_var->common.ann = (tree_ann_t) stmt_ann (ret_stmt);
604 bsi_replace (&bsi, ret_var, true);
605 SSA_NAME_DEF_STMT (TREE_OPERAND (ret_var, 0)) = ret_var;
606 ret_var = TREE_OPERAND (ret_var, 0);
607 ret_stmt = build1 (RETURN_EXPR, TREE_TYPE (ret_stmt), ret_var);
608 bsi_insert_after (&bsi, ret_stmt, BSI_NEW_STMT);
611 if (m)
/* var = m_acc * ret_var, inserted before the return. */
613 stmt = build (MODIFY_EXPR, ret_type, NULL_TREE,
614 build (MULT_EXPR, ret_type, m_acc, ret_var));
616 tmp = create_tmp_var (ret_type, "acc_tmp");
617 add_referenced_tmp_var (tmp);
619 var = make_ssa_name (tmp, stmt);
620 TREE_OPERAND (stmt, 0) = var;
621 bsi_insert_before (&bsi, stmt, BSI_NEW_STMT);
623 else
624 var = ret_var;
626 if (a)
/* var = a_acc + var, inserted before the return. */
628 stmt = build (MODIFY_EXPR, ret_type, NULL_TREE,
629 build (PLUS_EXPR, ret_type, a_acc, var));
631 tmp = create_tmp_var (ret_type, "acc_tmp");
632 add_referenced_tmp_var (tmp);
634 var = make_ssa_name (tmp, stmt);
635 TREE_OPERAND (stmt, 0) = var;
636 bsi_insert_before (&bsi, stmt, BSI_NEW_STMT);
/* Return the adjusted value. */
639 TREE_OPERAND (ret_stmt, 0) = var;
640 modify_stmt (ret_stmt);
643 /* Eliminates the tail call described by T. The call is replaced by a
644 jump to the first block of the function; phi arguments for the
parameters, for the variables the call may define and for the
accumulators are added on the new edge, and the call statement is
removed. */
646 static void
647 eliminate_tail_call (struct tailcall *t)
649 tree param, stmt, args, rslt, call;
650 basic_block bb, first;
651 edge e;
652 tree phi;
653 stmt_ann_t ann;
654 v_may_def_optype v_may_defs;
655 unsigned i;
656 block_stmt_iterator bsi;
658 stmt = bsi_stmt (t->call_bsi);
659 get_stmt_operands (stmt);
660 ann = stmt_ann (stmt);
661 bb = t->call_block;
663 if (dump_file && (dump_flags & TDF_DETAILS))
665 fprintf (dump_file, "Eliminated tail recursion in bb %d : ",
666 bb->index);
667 print_generic_stmt (dump_file, stmt, TDF_SLIM);
668 fprintf (dump_file, "\n");
/* From here on STMT is the call expression itself. */
671 if (TREE_CODE (stmt) == MODIFY_EXPR)
672 stmt = TREE_OPERAND (stmt, 1);
674 first = ENTRY_BLOCK_PTR->succ->dest;
676 /* Remove the code after call_bsi that will become unreachable. The
677 possibly unreachable code in other blocks is removed later in
678 cfg cleanup. */
679 bsi = t->call_bsi;
680 bsi_next (&bsi);
681 while (!bsi_end_p (bsi))
683 /* Do not remove the return statement, so that redirect_edge_and_branch
684 sees how the block ends. */
685 if (TREE_CODE (bsi_stmt (bsi)) == RETURN_EXPR)
686 break;
688 bsi_remove (&bsi);
691 /* Replace the call by a jump to the start of function. */
692 e = redirect_edge_and_branch (t->call_block->succ, first);
693 if (!e)
694 abort ();
695 PENDING_STMT (e) = NULL_TREE;
697 /* Add phi node entries for arguments. Not every PHI node corresponds to
698 a function argument (there may be PHI nodes for virtual definitions of the
699 eliminated calls), so we search for a PHI corresponding to each argument
700 rather than searching for which argument a PHI node corresponds to. */
702 for (param = DECL_ARGUMENTS (current_function_decl),
703 args = TREE_OPERAND (stmt, 1);
704 param;
705 param = TREE_CHAIN (param),
706 args = TREE_CHAIN (args))
709 for (phi = phi_nodes (first); phi; phi = PHI_CHAIN (phi))
710 if (param == SSA_NAME_VAR (PHI_RESULT (phi)))
711 break;
713 /* The phi node indeed does not have to be there, in case the operand is
714 invariant in the function. */
715 if (!phi)
716 continue;
718 add_phi_arg (&phi, TREE_VALUE (args), e);
721 /* Add phi nodes for the call clobbered variables. */
722 v_may_defs = V_MAY_DEF_OPS (ann);
723 for (i = 0; i < NUM_V_MAY_DEFS (v_may_defs); i++)
725 param = SSA_NAME_VAR (V_MAY_DEF_RESULT (v_may_defs, i));
726 for (phi = phi_nodes (first); phi; phi = PHI_CHAIN (phi))
727 if (param == SSA_NAME_VAR (PHI_RESULT (phi)))
728 break;
/* No phi node for this variable yet: create one whose result is the
former default definition, fed on the entry edge by a new default
definition. */
730 if (!phi)
732 tree name = var_ann (param)->default_def;
733 tree new_name;
735 if (!name)
737 /* It may happen that the tag does not have a default_def in case
738 when all uses of it are dominated by a MUST_DEF. This however
739 means that it is not necessary to add a phi node for this
740 tag. */
741 continue;
743 new_name = make_ssa_name (param, SSA_NAME_DEF_STMT (name));
745 var_ann (param)->default_def = new_name;
746 phi = create_phi_node (name, first);
747 SSA_NAME_DEF_STMT (name) = phi;
748 add_phi_arg (&phi, new_name, ENTRY_BLOCK_PTR->succ);
750 /* For all calls the same set of variables should be clobbered. This
751 means that there always should be the appropriate phi node except
752 for the first time we eliminate the call. */
753 if (first->pred->pred_next->pred_next)
754 abort ();
757 add_phi_arg (&phi, V_MAY_DEF_OP (v_may_defs, i), e);
760 /* Update the values of accumulators. */
761 adjust_accumulator_values (t->call_bsi, t->mult, t->add, e);
763 call = bsi_stmt (t->call_bsi);
764 if (TREE_CODE (call) == MODIFY_EXPR)
766 rslt = TREE_OPERAND (call, 0);
768 /* Result of the call will no longer be defined. So adjust the
769 SSA_NAME_DEF_STMT accordingly. */
770 SSA_NAME_DEF_STMT (rslt) = build_empty_stmt ();
/* Finally remove the call statement itself. */
773 bsi_remove (&t->call_bsi);
776 /* Optimizes the tailcall described by T. If OPT_TAILCALLS is true, also
777 mark the tailcalls for the sibcall optimization. */
779 static bool
780 optimize_tail_call (struct tailcall *t, bool opt_tailcalls)
782 if (t->tail_recursion)
784 eliminate_tail_call (t);
785 return true;
788 if (opt_tailcalls)
790 tree stmt = bsi_stmt (t->call_bsi);
792 stmt = get_call_expr_in (stmt);
793 CALL_EXPR_TAILCALL (stmt) = 1;
794 if (dump_file && (dump_flags & TDF_DETAILS))
796 fprintf (dump_file, "Found tail call ");
797 print_generic_expr (dump_file, stmt, dump_flags);
798 fprintf (dump_file, " in bb %i\n", t->call_block->index);
802 return false;
805 /* Optimizes tail calls in the function, turning the tail recursion
806 into iteration. When OPT_TAILCALLS is true and the function passes
suitable_for_tail_call_opt_p, the remaining tail calls are also marked
for the sibcall optimization. */
808 static void
809 tree_optimize_tail_calls_1 (bool opt_tailcalls)
811 edge e;
812 bool phis_constructed = false;
813 struct tailcall *tailcalls = NULL, *act, *next;
814 bool changed = false;
815 basic_block first = ENTRY_BLOCK_PTR->succ->dest;
816 tree stmt, param, ret_type, tmp, phi;
818 if (!suitable_for_tail_opt_p ())
819 return;
820 if (opt_tailcalls)
821 opt_tailcalls = suitable_for_tail_call_opt_p ();
/* Collect the tail call candidates, starting from every block that
ends with a return. */
823 for (e = EXIT_BLOCK_PTR->pred; e; e = e->pred_next)
825 /* Only traverse the normal exits, i.e. those that end with return
826 statement. */
827 stmt = last_stmt (e->src);
829 if (stmt
830 && TREE_CODE (stmt) == RETURN_EXPR)
831 find_tail_calls (e->src, &tailcalls);
834 /* Construct the phi nodes and accumulators if necessary. */
835 a_acc = m_acc = NULL_TREE;
836 for (act = tailcalls; act; act = act->next)
838 if (!act->tail_recursion)
839 continue;
/* The parameter phi nodes are built once, for the first tail
recursive call found. */
841 if (!phis_constructed)
843 /* Ensure that there is only one predecessor of the block. */
844 if (first->pred->pred_next)
845 first = split_edge (ENTRY_BLOCK_PTR->succ);
847 /* Copy the args if needed. */
848 for (param = DECL_ARGUMENTS (current_function_decl);
849 param;
850 param = TREE_CHAIN (param))
851 if (var_ann (param)
852 /* Also parameters that are only defined but never used need not
853 be copied. */
854 && (var_ann (param)->default_def
855 && TREE_CODE (var_ann (param)->default_def) == SSA_NAME))
/* The former default definition becomes the result of a new phi node
in FIRST, fed on the entry edge by a fresh default definition. */
857 tree name = var_ann (param)->default_def;
858 tree new_name = make_ssa_name (param, SSA_NAME_DEF_STMT (name));
859 tree phi;
861 var_ann (param)->default_def = new_name;
862 phi = create_phi_node (name, first);
863 SSA_NAME_DEF_STMT (name) = phi;
864 add_phi_arg (&phi, new_name, first->pred);
866 phis_constructed = true;
/* Create the additive accumulator, with the value 0 on entry, the
first time a call needs it. */
869 if (act->add && !a_acc)
871 ret_type = TREE_TYPE (DECL_RESULT (current_function_decl));
873 tmp = create_tmp_var (ret_type, "add_acc");
874 add_referenced_tmp_var (tmp);
876 phi = create_phi_node (tmp, first);
877 add_phi_arg (&phi, fold_convert (ret_type, integer_zero_node),
878 first->pred);
879 a_acc = PHI_RESULT (phi);
/* Likewise the multiplicative accumulator, with the value 1 on entry. */
882 if (act->mult && !m_acc)
884 ret_type = TREE_TYPE (DECL_RESULT (current_function_decl));
886 tmp = create_tmp_var (ret_type, "mult_acc");
887 add_referenced_tmp_var (tmp);
889 phi = create_phi_node (tmp, first);
890 add_phi_arg (&phi, fold_convert (ret_type, integer_one_node),
891 first->pred);
892 m_acc = PHI_RESULT (phi);
/* Process every candidate and release the list as we go. */
896 for (; tailcalls; tailcalls = next)
898 next = tailcalls->next;
899 changed |= optimize_tail_call (tailcalls, opt_tailcalls);
900 free (tailcalls);
903 if (a_acc || m_acc)
905 /* Modify the remaining return statements. */
906 for (e = EXIT_BLOCK_PTR->pred; e; e = e->pred_next)
908 stmt = last_stmt (e->src);
910 if (stmt
911 && TREE_CODE (stmt) == RETURN_EXPR)
912 adjust_return_value (e->src, m_acc, a_acc);
/* If a call was eliminated, drop the dominance information and clean
up the CFG. */
916 if (changed)
918 free_dominance_info (CDI_DOMINATORS);
919 cleanup_tree_cfg ();
/* Entry point of the tail recursion pass: eliminate tail recursion
   without marking any other tail calls.  */

static void
execute_tail_recursion (void)
{
  const bool mark_tail_calls = false;

  tree_optimize_tail_calls_1 (mark_tail_calls);
}
929 static bool
930 gate_tail_calls (void)
932 return flag_optimize_sibling_calls != 0;
/* Entry point of the tail call pass: eliminate tail recursion and also
   request marking of the other tail calls.  */

static void
execute_tail_calls (void)
{
  const bool mark_tail_calls = true;

  tree_optimize_tail_calls_1 (mark_tail_calls);
}
/* Descriptor of the "tailr" pass. Its execute hook is
execute_tail_recursion and no gate function is supplied. It requires
PROP_cfg, PROP_ssa and PROP_alias, and requests TODO_dump_func and
TODO_verify_ssa when it finishes. */
941 struct tree_opt_pass pass_tail_recursion =
943 "tailr", /* name */
944 NULL, /* gate */
945 execute_tail_recursion, /* execute */
946 NULL, /* sub */
947 NULL, /* next */
948 0, /* static_pass_number */
949 0, /* tv_id */
950 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
951 0, /* properties_provided */
952 0, /* properties_destroyed */
953 0, /* todo_flags_start */
954 TODO_dump_func | TODO_verify_ssa /* todo_flags_finish */
/* Descriptor of the "tailc" pass. Its gate is gate_tail_calls and its
execute hook is execute_tail_calls. It requires PROP_cfg, PROP_ssa and
PROP_alias, and requests TODO_dump_func and TODO_verify_ssa when it
finishes. */
957 struct tree_opt_pass pass_tail_calls =
959 "tailc", /* name */
960 gate_tail_calls, /* gate */
961 execute_tail_calls, /* execute */
962 NULL, /* sub */
963 NULL, /* next */
964 0, /* static_pass_number */
965 0, /* tv_id */
966 PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
967 0, /* properties_provided */
968 0, /* properties_destroyed */
969 0, /* todo_flags_start */
970 TODO_dump_func | TODO_verify_ssa /* todo_flags_finish */