* loop-iv.c (simplify_using_initial_values): Store e->src in a
[official-gcc.git] / gcc / loop-iv.c
blob2dcbb820ddb73611e442504ef1137890838cbea0
1 /* Rtl-level induction variable analysis.
2 Copyright (C) 2004 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it
7 under the terms of the GNU General Public License as published by the
8 Free Software Foundation; either version 2, or (at your option) any
9 later version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT
12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING. If not, write to the Free
18 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
19 02111-1307, USA. */
21 /* This is just a very simplistic analysis of induction variables of the loop.
22 The major use is for determining the number of iterations of a loop for
23 loop unrolling, doloop optimization and branch prediction. For this we
24 are only interested in bivs and a fairly limited set of givs that are
25 needed in the exit condition. We also only compute the iv information on
26 demand.
28 The interesting registers are determined. A register is interesting if
30 -- it is set only in the blocks that dominate the latch of the current loop
31 -- all its sets are simple -- i.e. in the form we understand
33 We also number the insns sequentially in each basic block. For a use of the
34 interesting reg, it is now easy to find a reaching definition (there may be
35 only one).
37 Induction variable is then simply analyzed by walking the use-def
38 chains.
40 Usage:
42 iv_analysis_loop_init (loop);
43 insn = iv_get_reaching_def (where, reg);
44 if (iv_analyze (insn, reg, &iv))
46 ...
48 iv_analysis_done (); */
50 #include "config.h"
51 #include "system.h"
52 #include "coretypes.h"
53 #include "tm.h"
54 #include "rtl.h"
55 #include "hard-reg-set.h"
56 #include "basic-block.h"
57 #include "cfgloop.h"
58 #include "expr.h"
59 #include "output.h"
61 /* The insn information. */
63 struct insn_info
65 /* Id of the insn. */
66 unsigned luid;
68 /* The previous definition of the register defined by the single
69 set in the insn. */
70 rtx prev_def;
72 /* The description of the iv. */
73 struct rtx_iv iv;
76 static struct insn_info *insn_info;
78 /* The last definition of register. */
80 static rtx *last_def;
82 /* The bivs. */
84 static struct rtx_iv *bivs;
86 /* Maximal insn number for that there is place in insn_info array. */
88 static unsigned max_insn_no;
90 /* Maximal register number for that there is place in bivs and last_def
91 arrays. */
93 static unsigned max_reg_no;
95 /* Dumps information about IV to FILE. */
97 extern void dump_iv_info (FILE *, struct rtx_iv *);
98 void
99 dump_iv_info (FILE *file, struct rtx_iv *iv)
101 if (!iv->base)
103 fprintf (file, "not simple");
104 return;
107 if (iv->step == const0_rtx
108 && !iv->first_special)
109 fprintf (file, "invariant ");
111 print_rtl (file, iv->base);
112 if (iv->step != const0_rtx)
114 fprintf (file, " + ");
115 print_rtl (file, iv->step);
116 fprintf (file, " * iteration");
118 fprintf (file, " (in %s)", GET_MODE_NAME (iv->mode));
120 if (iv->mode != iv->extend_mode)
121 fprintf (file, " %s to %s",
122 rtx_name[iv->extend],
123 GET_MODE_NAME (iv->extend_mode));
125 if (iv->mult != const1_rtx)
127 fprintf (file, " * ");
128 print_rtl (file, iv->mult);
130 if (iv->delta != const0_rtx)
132 fprintf (file, " + ");
133 print_rtl (file, iv->delta);
135 if (iv->first_special)
136 fprintf (file, " (first special)");
139 /* Assigns luids to insns in basic block BB. */
141 static void
142 assign_luids (basic_block bb)
144 unsigned i = 0, uid;
145 rtx insn;
147 FOR_BB_INSNS (bb, insn)
149 uid = INSN_UID (insn);
150 insn_info[uid].luid = i++;
151 insn_info[uid].prev_def = NULL_RTX;
152 insn_info[uid].iv.analysed = false;
156 /* Generates a subreg to get the least significant part of EXPR (in mode
157 INNER_MODE) to OUTER_MODE. */
159 static rtx
160 lowpart_subreg (enum machine_mode outer_mode, rtx expr,
161 enum machine_mode inner_mode)
163 return simplify_gen_subreg (outer_mode, expr, inner_mode,
164 subreg_lowpart_offset (outer_mode, inner_mode));
167 /* Checks whether REG is a well-behaved register. */
169 static bool
170 simple_reg_p (rtx reg)
172 unsigned r;
174 if (GET_CODE (reg) == SUBREG)
176 if (!subreg_lowpart_p (reg))
177 return false;
178 reg = SUBREG_REG (reg);
181 if (!REG_P (reg))
182 return false;
184 r = REGNO (reg);
185 if (HARD_REGISTER_NUM_P (r))
186 return false;
188 if (GET_MODE_CLASS (GET_MODE (reg)) != MODE_INT)
189 return false;
191 if (last_def[r] == const0_rtx)
192 return false;
194 return true;
197 /* Checks whether assignment LHS = RHS is simple enough for us to process. */
199 static bool
200 simple_set_p (rtx lhs, rtx rhs)
202 rtx op0, op1;
204 if (!REG_P (lhs)
205 || !simple_reg_p (lhs))
206 return false;
208 if (CONSTANT_P (rhs))
209 return true;
211 switch (GET_CODE (rhs))
213 case SUBREG:
214 case REG:
215 return simple_reg_p (rhs);
217 case SIGN_EXTEND:
218 case ZERO_EXTEND:
219 case NEG:
220 return simple_reg_p (XEXP (rhs, 0));
222 case PLUS:
223 case MINUS:
224 case MULT:
225 case ASHIFT:
226 op0 = XEXP (rhs, 0);
227 op1 = XEXP (rhs, 1);
229 if (!simple_reg_p (op0)
230 && !CONSTANT_P (op0))
231 return false;
233 if (!simple_reg_p (op1)
234 && !CONSTANT_P (op1))
235 return false;
237 if (GET_CODE (rhs) == MULT
238 && !CONSTANT_P (op0)
239 && !CONSTANT_P (op1))
240 return false;
242 if (GET_CODE (rhs) == ASHIFT
243 && CONSTANT_P (op0))
244 return false;
246 return true;
248 default:
249 return false;
253 /* Mark single SET in INSN. */
255 static rtx
256 mark_single_set (rtx insn, rtx set)
258 rtx def = SET_DEST (set), src;
259 unsigned regno, uid;
261 src = find_reg_equal_equiv_note (insn);
262 if (src)
263 src = XEXP (src, 0);
264 else
265 src = SET_SRC (set);
267 if (!simple_set_p (SET_DEST (set), src))
268 return NULL_RTX;
270 regno = REGNO (def);
271 uid = INSN_UID (insn);
273 bivs[regno].analysed = false;
274 insn_info[uid].prev_def = last_def[regno];
275 last_def[regno] = insn;
277 return def;
280 /* Invalidate register REG unless it is equal to EXCEPT. */
282 static void
283 kill_sets (rtx reg, rtx by ATTRIBUTE_UNUSED, void *except)
285 if (GET_CODE (reg) == SUBREG)
286 reg = SUBREG_REG (reg);
287 if (!REG_P (reg))
288 return;
289 if (reg == except)
290 return;
292 last_def[REGNO (reg)] = const0_rtx;
295 /* Marks sets in basic block BB. If DOM is true, BB dominates the loop
296 latch. */
298 static void
299 mark_sets (basic_block bb, bool dom)
301 rtx insn, set, def;
303 FOR_BB_INSNS (bb, insn)
305 if (!INSN_P (insn))
306 continue;
308 if (dom
309 && (set = single_set (insn)))
310 def = mark_single_set (insn, set);
311 else
312 def = NULL_RTX;
314 note_stores (PATTERN (insn), kill_sets, def);
318 /* Prepare the data for an induction variable analysis of a LOOP. */
320 void
321 iv_analysis_loop_init (struct loop *loop)
323 basic_block *body = get_loop_body_in_dom_order (loop);
324 unsigned b;
326 if ((unsigned) get_max_uid () >= max_insn_no)
328 /* Add some reserve for insns and registers produced in optimizations. */
329 max_insn_no = get_max_uid () + 100;
330 if (insn_info)
331 free (insn_info);
332 insn_info = xmalloc (max_insn_no * sizeof (struct insn_info));
335 if ((unsigned) max_reg_num () >= max_reg_no)
337 max_reg_no = max_reg_num () + 100;
338 if (last_def)
339 free (last_def);
340 last_def = xmalloc (max_reg_no * sizeof (rtx));
341 if (bivs)
342 free (bivs);
343 bivs = xmalloc (max_reg_no * sizeof (struct rtx_iv));
346 memset (last_def, 0, max_reg_num () * sizeof (rtx));
348 for (b = 0; b < loop->num_nodes; b++)
350 assign_luids (body[b]);
351 mark_sets (body[b], just_once_each_iteration_p (loop, body[b]));
354 free (body);
357 /* Gets definition of REG reaching the INSN. If REG is not simple, const0_rtx
358 is returned. If INSN is before the first def in the loop, NULL_RTX is
359 returned. */
362 iv_get_reaching_def (rtx insn, rtx reg)
364 unsigned regno, luid, auid;
365 rtx ainsn;
366 basic_block bb, abb;
368 if (GET_CODE (reg) == SUBREG)
370 if (!subreg_lowpart_p (reg))
371 return const0_rtx;
372 reg = SUBREG_REG (reg);
374 if (!REG_P (reg))
375 return NULL_RTX;
377 regno = REGNO (reg);
378 if (!last_def[regno]
379 || last_def[regno] == const0_rtx)
380 return last_def[regno];
382 bb = BLOCK_FOR_INSN (insn);
383 luid = insn_info[INSN_UID (insn)].luid;
385 ainsn = last_def[regno];
386 while (1)
388 abb = BLOCK_FOR_INSN (ainsn);
390 if (dominated_by_p (CDI_DOMINATORS, bb, abb))
391 break;
393 auid = INSN_UID (ainsn);
394 ainsn = insn_info[auid].prev_def;
396 if (!ainsn)
397 return NULL_RTX;
400 while (1)
402 abb = BLOCK_FOR_INSN (ainsn);
403 if (abb != bb)
404 return ainsn;
406 auid = INSN_UID (ainsn);
407 if (luid > insn_info[auid].luid)
408 return ainsn;
410 ainsn = insn_info[auid].prev_def;
411 if (!ainsn)
412 return NULL_RTX;
416 /* Sets IV to invariant CST in MODE. Always returns true (just for
417 consistency with other iv manipulation functions that may fail). */
419 static bool
420 iv_constant (struct rtx_iv *iv, rtx cst, enum machine_mode mode)
422 if (mode == VOIDmode)
423 mode = GET_MODE (cst);
425 iv->analysed = true;
426 iv->mode = mode;
427 iv->base = cst;
428 iv->step = const0_rtx;
429 iv->first_special = false;
430 iv->extend = UNKNOWN;
431 iv->extend_mode = iv->mode;
432 iv->delta = const0_rtx;
433 iv->mult = const1_rtx;
435 return true;
438 /* Evaluates application of subreg to MODE on IV. */
440 static bool
441 iv_subreg (struct rtx_iv *iv, enum machine_mode mode)
443 /* If iv is invariant, just calculate the new value. */
444 if (iv->step == const0_rtx
445 && !iv->first_special)
447 rtx val = get_iv_value (iv, const0_rtx);
448 val = lowpart_subreg (mode, val, iv->extend_mode);
450 iv->base = val;
451 iv->extend = UNKNOWN;
452 iv->mode = iv->extend_mode = mode;
453 iv->delta = const0_rtx;
454 iv->mult = const1_rtx;
455 return true;
458 if (iv->extend_mode == mode)
459 return true;
461 if (GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (iv->mode))
462 return false;
464 iv->extend = UNKNOWN;
465 iv->mode = mode;
467 iv->base = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta,
468 simplify_gen_binary (MULT, iv->extend_mode,
469 iv->base, iv->mult));
470 iv->step = simplify_gen_binary (MULT, iv->extend_mode, iv->step, iv->mult);
471 iv->mult = const1_rtx;
472 iv->delta = const0_rtx;
473 iv->first_special = false;
475 return true;
478 /* Evaluates application of EXTEND to MODE on IV. */
480 static bool
481 iv_extend (struct rtx_iv *iv, enum rtx_code extend, enum machine_mode mode)
483 /* If iv is invariant, just calculate the new value. */
484 if (iv->step == const0_rtx
485 && !iv->first_special)
487 rtx val = get_iv_value (iv, const0_rtx);
488 val = simplify_gen_unary (extend, mode, val, iv->extend_mode);
490 iv->base = val;
491 iv->extend = UNKNOWN;
492 iv->mode = iv->extend_mode = mode;
493 iv->delta = const0_rtx;
494 iv->mult = const1_rtx;
495 return true;
498 if (mode != iv->extend_mode)
499 return false;
501 if (iv->extend != UNKNOWN
502 && iv->extend != extend)
503 return false;
505 iv->extend = extend;
507 return true;
510 /* Evaluates negation of IV. */
512 static bool
513 iv_neg (struct rtx_iv *iv)
515 if (iv->extend == UNKNOWN)
517 iv->base = simplify_gen_unary (NEG, iv->extend_mode,
518 iv->base, iv->extend_mode);
519 iv->step = simplify_gen_unary (NEG, iv->extend_mode,
520 iv->step, iv->extend_mode);
522 else
524 iv->delta = simplify_gen_unary (NEG, iv->extend_mode,
525 iv->delta, iv->extend_mode);
526 iv->mult = simplify_gen_unary (NEG, iv->extend_mode,
527 iv->mult, iv->extend_mode);
530 return true;
533 /* Evaluates addition or subtraction (according to OP) of IV1 to IV0. */
535 static bool
536 iv_add (struct rtx_iv *iv0, struct rtx_iv *iv1, enum rtx_code op)
538 enum machine_mode mode;
539 rtx arg;
541 /* Extend the constant to extend_mode of the other operand if necessary. */
542 if (iv0->extend == UNKNOWN
543 && iv0->mode == iv0->extend_mode
544 && iv0->step == const0_rtx
545 && GET_MODE_SIZE (iv0->extend_mode) < GET_MODE_SIZE (iv1->extend_mode))
547 iv0->extend_mode = iv1->extend_mode;
548 iv0->base = simplify_gen_unary (ZERO_EXTEND, iv0->extend_mode,
549 iv0->base, iv0->mode);
551 if (iv1->extend == UNKNOWN
552 && iv1->mode == iv1->extend_mode
553 && iv1->step == const0_rtx
554 && GET_MODE_SIZE (iv1->extend_mode) < GET_MODE_SIZE (iv0->extend_mode))
556 iv1->extend_mode = iv0->extend_mode;
557 iv1->base = simplify_gen_unary (ZERO_EXTEND, iv1->extend_mode,
558 iv1->base, iv1->mode);
561 mode = iv0->extend_mode;
562 if (mode != iv1->extend_mode)
563 return false;
565 if (iv0->extend == UNKNOWN && iv1->extend == UNKNOWN)
567 if (iv0->mode != iv1->mode)
568 return false;
570 iv0->base = simplify_gen_binary (op, mode, iv0->base, iv1->base);
571 iv0->step = simplify_gen_binary (op, mode, iv0->step, iv1->step);
573 return true;
576 /* Handle addition of constant. */
577 if (iv1->extend == UNKNOWN
578 && iv1->mode == mode
579 && iv1->step == const0_rtx)
581 iv0->delta = simplify_gen_binary (op, mode, iv0->delta, iv1->base);
582 return true;
585 if (iv0->extend == UNKNOWN
586 && iv0->mode == mode
587 && iv0->step == const0_rtx)
589 arg = iv0->base;
590 *iv0 = *iv1;
591 if (op == MINUS
592 && !iv_neg (iv0))
593 return false;
595 iv0->delta = simplify_gen_binary (PLUS, mode, iv0->delta, arg);
596 return true;
599 return false;
602 /* Evaluates multiplication of IV by constant CST. */
604 static bool
605 iv_mult (struct rtx_iv *iv, rtx mby)
607 enum machine_mode mode = iv->extend_mode;
609 if (GET_MODE (mby) != VOIDmode
610 && GET_MODE (mby) != mode)
611 return false;
613 if (iv->extend == UNKNOWN)
615 iv->base = simplify_gen_binary (MULT, mode, iv->base, mby);
616 iv->step = simplify_gen_binary (MULT, mode, iv->step, mby);
618 else
620 iv->delta = simplify_gen_binary (MULT, mode, iv->delta, mby);
621 iv->mult = simplify_gen_binary (MULT, mode, iv->mult, mby);
624 return true;
627 /* Evaluates shift of IV by constant CST. */
629 static bool
630 iv_shift (struct rtx_iv *iv, rtx mby)
632 enum machine_mode mode = iv->extend_mode;
634 if (GET_MODE (mby) != VOIDmode
635 && GET_MODE (mby) != mode)
636 return false;
638 if (iv->extend == UNKNOWN)
640 iv->base = simplify_gen_binary (ASHIFT, mode, iv->base, mby);
641 iv->step = simplify_gen_binary (ASHIFT, mode, iv->step, mby);
643 else
645 iv->delta = simplify_gen_binary (ASHIFT, mode, iv->delta, mby);
646 iv->mult = simplify_gen_binary (ASHIFT, mode, iv->mult, mby);
649 return true;
652 /* The recursive part of get_biv_step. Gets the value of the single value
653 defined in INSN wrto initial value of REG inside loop, in shape described
654 at get_biv_step. */
656 static bool
657 get_biv_step_1 (rtx insn, rtx reg,
658 rtx *inner_step, enum machine_mode *inner_mode,
659 enum rtx_code *extend, enum machine_mode outer_mode,
660 rtx *outer_step)
662 rtx set, lhs, rhs, op0 = NULL_RTX, op1 = NULL_RTX;
663 rtx next, nextr, def_insn, tmp;
664 enum rtx_code code;
666 set = single_set (insn);
667 rhs = find_reg_equal_equiv_note (insn);
668 if (rhs)
669 rhs = XEXP (rhs, 0);
670 else
671 rhs = SET_SRC (set);
672 lhs = SET_DEST (set);
674 code = GET_CODE (rhs);
675 switch (code)
677 case SUBREG:
678 case REG:
679 next = rhs;
680 break;
682 case PLUS:
683 case MINUS:
684 op0 = XEXP (rhs, 0);
685 op1 = XEXP (rhs, 1);
687 if (code == PLUS && CONSTANT_P (op0))
689 tmp = op0; op0 = op1; op1 = tmp;
692 if (!simple_reg_p (op0)
693 || !CONSTANT_P (op1))
694 return false;
696 if (GET_MODE (rhs) != outer_mode)
698 /* ppc64 uses expressions like
700 (set x:SI (plus:SI (subreg:SI y:DI) 1)).
702 this is equivalent to
704 (set x':DI (plus:DI y:DI 1))
705 (set x:SI (subreg:SI (x':DI)). */
706 if (GET_CODE (op0) != SUBREG)
707 return false;
708 if (GET_MODE (SUBREG_REG (op0)) != outer_mode)
709 return false;
712 next = op0;
713 break;
715 case SIGN_EXTEND:
716 case ZERO_EXTEND:
717 if (GET_MODE (rhs) != outer_mode)
718 return false;
720 op0 = XEXP (rhs, 0);
721 if (!simple_reg_p (op0))
722 return false;
724 next = op0;
725 break;
727 default:
728 return false;
731 if (GET_CODE (next) == SUBREG)
733 if (!subreg_lowpart_p (next))
734 return false;
736 nextr = SUBREG_REG (next);
737 if (GET_MODE (nextr) != outer_mode)
738 return false;
740 else
741 nextr = next;
743 def_insn = iv_get_reaching_def (insn, nextr);
744 if (def_insn == const0_rtx)
745 return false;
747 if (!def_insn)
749 if (!rtx_equal_p (nextr, reg))
750 return false;
752 *inner_step = const0_rtx;
753 *extend = UNKNOWN;
754 *inner_mode = outer_mode;
755 *outer_step = const0_rtx;
757 else if (!get_biv_step_1 (def_insn, reg,
758 inner_step, inner_mode, extend, outer_mode,
759 outer_step))
760 return false;
762 if (GET_CODE (next) == SUBREG)
764 enum machine_mode amode = GET_MODE (next);
766 if (GET_MODE_SIZE (amode) > GET_MODE_SIZE (*inner_mode))
767 return false;
769 *inner_mode = amode;
770 *inner_step = simplify_gen_binary (PLUS, outer_mode,
771 *inner_step, *outer_step);
772 *outer_step = const0_rtx;
773 *extend = UNKNOWN;
776 switch (code)
778 case REG:
779 case SUBREG:
780 break;
782 case PLUS:
783 case MINUS:
784 if (*inner_mode == outer_mode
785 /* See comment in previous switch. */
786 || GET_MODE (rhs) != outer_mode)
787 *inner_step = simplify_gen_binary (code, outer_mode,
788 *inner_step, op1);
789 else
790 *outer_step = simplify_gen_binary (code, outer_mode,
791 *outer_step, op1);
792 break;
794 case SIGN_EXTEND:
795 case ZERO_EXTEND:
796 if (GET_MODE (op0) != *inner_mode
797 || *extend != UNKNOWN
798 || *outer_step != const0_rtx)
799 abort ();
801 *extend = code;
802 break;
804 default:
805 abort ();
808 return true;
811 /* Gets the operation on register REG inside loop, in shape
813 OUTER_STEP + EXTEND_{OUTER_MODE} (SUBREG_{INNER_MODE} (REG + INNER_STEP))
815 If the operation cannot be described in this shape, return false. */
817 static bool
818 get_biv_step (rtx reg, rtx *inner_step, enum machine_mode *inner_mode,
819 enum rtx_code *extend, enum machine_mode *outer_mode,
820 rtx *outer_step)
822 *outer_mode = GET_MODE (reg);
824 if (!get_biv_step_1 (last_def[REGNO (reg)], reg,
825 inner_step, inner_mode, extend, *outer_mode,
826 outer_step))
827 return false;
829 if (*inner_mode != *outer_mode
830 && *extend == UNKNOWN)
831 abort ();
833 if (*inner_mode == *outer_mode
834 && *extend != UNKNOWN)
835 abort ();
837 if (*inner_mode == *outer_mode
838 && *outer_step != const0_rtx)
839 abort ();
841 return true;
844 /* Determines whether DEF is a biv and if so, stores its description
845 to *IV. */
847 static bool
848 iv_analyze_biv (rtx def, struct rtx_iv *iv)
850 unsigned regno;
851 rtx inner_step, outer_step;
852 enum machine_mode inner_mode, outer_mode;
853 enum rtx_code extend;
855 if (dump_file)
857 fprintf (dump_file, "Analysing ");
858 print_rtl (dump_file, def);
859 fprintf (dump_file, " for bivness.\n");
862 if (!REG_P (def))
864 if (!CONSTANT_P (def))
865 return false;
867 return iv_constant (iv, def, VOIDmode);
870 regno = REGNO (def);
871 if (last_def[regno] == const0_rtx)
873 if (dump_file)
874 fprintf (dump_file, " not simple.\n");
875 return false;
878 if (last_def[regno] && bivs[regno].analysed)
880 if (dump_file)
881 fprintf (dump_file, " already analysed.\n");
883 *iv = bivs[regno];
884 return iv->base != NULL_RTX;
887 if (!last_def[regno])
889 iv_constant (iv, def, VOIDmode);
890 goto end;
893 iv->analysed = true;
894 if (!get_biv_step (def, &inner_step, &inner_mode, &extend,
895 &outer_mode, &outer_step))
897 iv->base = NULL_RTX;
898 goto end;
901 /* Loop transforms base to es (base + inner_step) + outer_step,
902 where es means extend of subreg between inner_mode and outer_mode.
903 The corresponding induction variable is
905 es ((base - outer_step) + i * (inner_step + outer_step)) + outer_step */
907 iv->base = simplify_gen_binary (MINUS, outer_mode, def, outer_step);
908 iv->step = simplify_gen_binary (PLUS, outer_mode, inner_step, outer_step);
909 iv->mode = inner_mode;
910 iv->extend_mode = outer_mode;
911 iv->extend = extend;
912 iv->mult = const1_rtx;
913 iv->delta = outer_step;
914 iv->first_special = inner_mode != outer_mode;
916 end:
917 if (dump_file)
919 fprintf (dump_file, " ");
920 dump_iv_info (dump_file, iv);
921 fprintf (dump_file, "\n");
924 bivs[regno] = *iv;
926 return iv->base != NULL_RTX;
929 /* Analyzes operand OP of INSN and stores the result to *IV. */
931 static bool
932 iv_analyze_op (rtx insn, rtx op, struct rtx_iv *iv)
934 rtx def_insn;
935 unsigned regno;
936 bool inv = CONSTANT_P (op);
938 if (dump_file)
940 fprintf (dump_file, "Analysing operand ");
941 print_rtl (dump_file, op);
942 fprintf (dump_file, " of insn ");
943 print_rtl_single (dump_file, insn);
946 if (GET_CODE (op) == SUBREG)
948 if (!subreg_lowpart_p (op))
949 return false;
951 if (!iv_analyze_op (insn, SUBREG_REG (op), iv))
952 return false;
954 return iv_subreg (iv, GET_MODE (op));
957 if (!inv)
959 regno = REGNO (op);
960 if (!last_def[regno])
961 inv = true;
962 else if (last_def[regno] == const0_rtx)
964 if (dump_file)
965 fprintf (dump_file, " not simple.\n");
966 return false;
970 if (inv)
972 iv_constant (iv, op, VOIDmode);
974 if (dump_file)
976 fprintf (dump_file, " ");
977 dump_iv_info (dump_file, iv);
978 fprintf (dump_file, "\n");
980 return true;
983 def_insn = iv_get_reaching_def (insn, op);
984 if (def_insn == const0_rtx)
986 if (dump_file)
987 fprintf (dump_file, " not simple.\n");
988 return false;
991 return iv_analyze (def_insn, op, iv);
994 /* Analyzes iv DEF defined in INSN and stores the result to *IV. */
996 bool
997 iv_analyze (rtx insn, rtx def, struct rtx_iv *iv)
999 unsigned uid;
1000 rtx set, rhs, mby = NULL_RTX, tmp;
1001 rtx op0 = NULL_RTX, op1 = NULL_RTX;
1002 struct rtx_iv iv0, iv1;
1003 enum machine_mode amode;
1004 enum rtx_code code;
1006 if (insn == const0_rtx)
1007 return false;
1009 if (GET_CODE (def) == SUBREG)
1011 if (!subreg_lowpart_p (def))
1012 return false;
1014 if (!iv_analyze (insn, SUBREG_REG (def), iv))
1015 return false;
1017 return iv_subreg (iv, GET_MODE (def));
1020 if (!insn)
1021 return iv_analyze_biv (def, iv);
1023 if (dump_file)
1025 fprintf (dump_file, "Analysing def of ");
1026 print_rtl (dump_file, def);
1027 fprintf (dump_file, " in insn ");
1028 print_rtl_single (dump_file, insn);
1031 uid = INSN_UID (insn);
1032 if (insn_info[uid].iv.analysed)
1034 if (dump_file)
1035 fprintf (dump_file, " already analysed.\n");
1036 *iv = insn_info[uid].iv;
1037 return iv->base != NULL_RTX;
1040 iv->mode = VOIDmode;
1041 iv->base = NULL_RTX;
1042 iv->step = NULL_RTX;
1044 set = single_set (insn);
1045 rhs = find_reg_equal_equiv_note (insn);
1046 if (rhs)
1047 rhs = XEXP (rhs, 0);
1048 else
1049 rhs = SET_SRC (set);
1050 code = GET_CODE (rhs);
1052 if (CONSTANT_P (rhs))
1054 op0 = rhs;
1055 amode = GET_MODE (def);
1057 else
1059 switch (code)
1061 case SUBREG:
1062 if (!subreg_lowpart_p (rhs))
1063 goto end;
1064 op0 = rhs;
1065 break;
1067 case REG:
1068 op0 = rhs;
1069 break;
1071 case SIGN_EXTEND:
1072 case ZERO_EXTEND:
1073 case NEG:
1074 op0 = XEXP (rhs, 0);
1075 break;
1077 case PLUS:
1078 case MINUS:
1079 op0 = XEXP (rhs, 0);
1080 op1 = XEXP (rhs, 1);
1081 break;
1083 case MULT:
1084 op0 = XEXP (rhs, 0);
1085 mby = XEXP (rhs, 1);
1086 if (!CONSTANT_P (mby))
1088 if (!CONSTANT_P (op0))
1089 abort ();
1090 tmp = op0;
1091 op0 = mby;
1092 mby = tmp;
1094 break;
1096 case ASHIFT:
1097 if (CONSTANT_P (XEXP (rhs, 0)))
1098 abort ();
1099 op0 = XEXP (rhs, 0);
1100 mby = XEXP (rhs, 1);
1101 break;
1103 default:
1104 abort ();
1107 amode = GET_MODE (rhs);
1110 if (op0)
1112 if (!iv_analyze_op (insn, op0, &iv0))
1113 goto end;
1115 if (iv0.mode == VOIDmode)
1117 iv0.mode = amode;
1118 iv0.extend_mode = amode;
1122 if (op1)
1124 if (!iv_analyze_op (insn, op1, &iv1))
1125 goto end;
1127 if (iv1.mode == VOIDmode)
1129 iv1.mode = amode;
1130 iv1.extend_mode = amode;
1134 switch (code)
1136 case SIGN_EXTEND:
1137 case ZERO_EXTEND:
1138 if (!iv_extend (&iv0, code, amode))
1139 goto end;
1140 break;
1142 case NEG:
1143 if (!iv_neg (&iv0))
1144 goto end;
1145 break;
1147 case PLUS:
1148 case MINUS:
1149 if (!iv_add (&iv0, &iv1, code))
1150 goto end;
1151 break;
1153 case MULT:
1154 if (!iv_mult (&iv0, mby))
1155 goto end;
1156 break;
1158 case ASHIFT:
1159 if (!iv_shift (&iv0, mby))
1160 goto end;
1161 break;
1163 default:
1164 break;
1167 *iv = iv0;
1169 end:
1170 iv->analysed = true;
1171 insn_info[uid].iv = *iv;
1173 if (dump_file)
1175 print_rtl (dump_file, def);
1176 fprintf (dump_file, " in insn ");
1177 print_rtl_single (dump_file, insn);
1178 fprintf (dump_file, " is ");
1179 dump_iv_info (dump_file, iv);
1180 fprintf (dump_file, "\n");
1183 return iv->base != NULL_RTX;
1186 /* Calculates value of IV at ITERATION-th iteration. */
1189 get_iv_value (struct rtx_iv *iv, rtx iteration)
1191 rtx val;
1193 /* We would need to generate some if_then_else patterns, and so far
1194 it is not needed anywhere. */
1195 if (iv->first_special)
1196 abort ();
1198 if (iv->step != const0_rtx && iteration != const0_rtx)
1199 val = simplify_gen_binary (PLUS, iv->extend_mode, iv->base,
1200 simplify_gen_binary (MULT, iv->extend_mode,
1201 iv->step, iteration));
1202 else
1203 val = iv->base;
1205 if (iv->extend_mode == iv->mode)
1206 return val;
1208 val = lowpart_subreg (iv->mode, val, iv->extend_mode);
1210 if (iv->extend == UNKNOWN)
1211 return val;
1213 val = simplify_gen_unary (iv->extend, iv->extend_mode, val, iv->mode);
1214 val = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta,
1215 simplify_gen_binary (MULT, iv->extend_mode,
1216 iv->mult, val));
1218 return val;
1221 /* Free the data for an induction variable analysis. */
1223 void
1224 iv_analysis_done (void)
1226 max_insn_no = 0;
1227 max_reg_no = 0;
1228 if (insn_info)
1230 free (insn_info);
1231 insn_info = NULL;
1233 if (last_def)
1235 free (last_def);
1236 last_def = NULL;
1238 if (bivs)
1240 free (bivs);
1241 bivs = NULL;
1245 /* Computes inverse to X modulo (1 << MOD). */
1247 static unsigned HOST_WIDEST_INT
1248 inverse (unsigned HOST_WIDEST_INT x, int mod)
1250 unsigned HOST_WIDEST_INT mask =
1251 ((unsigned HOST_WIDEST_INT) 1 << (mod - 1) << 1) - 1;
1252 unsigned HOST_WIDEST_INT rslt = 1;
1253 int i;
1255 for (i = 0; i < mod - 1; i++)
1257 rslt = (rslt * x) & mask;
1258 x = (x * x) & mask;
1261 return rslt;
1264 /* Tries to estimate the maximum number of iterations. */
1266 static unsigned HOST_WIDEST_INT
1267 determine_max_iter (struct niter_desc *desc)
1269 rtx niter = desc->niter_expr;
1270 rtx mmin, mmax, left, right;
1271 unsigned HOST_WIDEST_INT nmax, inc;
1273 if (GET_CODE (niter) == AND
1274 && GET_CODE (XEXP (niter, 0)) == CONST_INT)
1276 nmax = INTVAL (XEXP (niter, 0));
1277 if (!(nmax & (nmax + 1)))
1279 desc->niter_max = nmax;
1280 return nmax;
1284 get_mode_bounds (desc->mode, desc->signed_p, desc->mode, &mmin, &mmax);
1285 nmax = INTVAL (mmax) - INTVAL (mmin);
1287 if (GET_CODE (niter) == UDIV)
1289 if (GET_CODE (XEXP (niter, 1)) != CONST_INT)
1291 desc->niter_max = nmax;
1292 return nmax;
1294 inc = INTVAL (XEXP (niter, 1));
1295 niter = XEXP (niter, 0);
1297 else
1298 inc = 1;
1300 if (GET_CODE (niter) == PLUS)
1302 left = XEXP (niter, 0);
1303 right = XEXP (niter, 0);
1305 if (GET_CODE (right) == CONST_INT)
1306 right = GEN_INT (-INTVAL (right));
1308 else if (GET_CODE (niter) == MINUS)
1310 left = XEXP (niter, 0);
1311 right = XEXP (niter, 0);
1313 else
1315 left = niter;
1316 right = mmin;
1319 if (GET_CODE (left) == CONST_INT)
1320 mmax = left;
1321 if (GET_CODE (right) == CONST_INT)
1322 mmin = right;
1323 nmax = INTVAL (mmax) - INTVAL (mmin);
1325 desc->niter_max = nmax / inc;
1326 return nmax / inc;
1329 /* Checks whether register *REG is in set ALT. Callback for for_each_rtx. */
1331 static int
1332 altered_reg_used (rtx *reg, void *alt)
1334 if (!REG_P (*reg))
1335 return 0;
1337 return REGNO_REG_SET_P (alt, REGNO (*reg));
1340 /* Marks registers altered by EXPR in set ALT. */
1342 static void
1343 mark_altered (rtx expr, rtx by ATTRIBUTE_UNUSED, void *alt)
1345 if (GET_CODE (expr) == SUBREG)
1346 expr = SUBREG_REG (expr);
1347 if (!REG_P (expr))
1348 return;
1350 SET_REGNO_REG_SET (alt, REGNO (expr));
1353 /* Checks whether RHS is simple enough to process. */
1355 static bool
1356 simple_rhs_p (rtx rhs)
1358 rtx op0, op1;
1360 if (CONSTANT_P (rhs)
1361 || REG_P (rhs))
1362 return true;
1364 switch (GET_CODE (rhs))
1366 case PLUS:
1367 case MINUS:
1368 op0 = XEXP (rhs, 0);
1369 op1 = XEXP (rhs, 1);
1370 /* Allow reg + const sets only. */
1371 if (REG_P (op0) && CONSTANT_P (op1))
1372 return true;
1373 if (REG_P (op1) && CONSTANT_P (op0))
1374 return true;
1376 return false;
1378 default:
1379 return false;
1383 /* Simplifies *EXPR using assignment in INSN. ALTERED is the set of registers
1384 altered so far. */
1386 static void
1387 simplify_using_assignment (rtx insn, rtx *expr, regset altered)
1389 rtx set = single_set (insn);
1390 rtx lhs = NULL_RTX, rhs;
1391 bool ret = false;
1393 if (set)
1395 lhs = SET_DEST (set);
1396 if (!REG_P (lhs)
1397 || altered_reg_used (&lhs, altered))
1398 ret = true;
1400 else
1401 ret = true;
1403 note_stores (PATTERN (insn), mark_altered, altered);
1404 if (CALL_P (insn))
1406 int i;
1408 /* Kill all call clobbered registers. */
1409 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1410 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i))
1411 SET_REGNO_REG_SET (altered, i);
1414 if (ret)
1415 return;
1417 rhs = find_reg_equal_equiv_note (insn);
1418 if (rhs)
1419 rhs = XEXP (rhs, 0);
1420 else
1421 rhs = SET_SRC (set);
1423 if (!simple_rhs_p (rhs))
1424 return;
1426 if (for_each_rtx (&rhs, altered_reg_used, altered))
1427 return;
1429 *expr = simplify_replace_rtx (*expr, lhs, rhs);
1432 /* Checks whether A implies B. */
1434 static bool
1435 implies_p (rtx a, rtx b)
1437 rtx op0, op1, opb0, opb1, r;
1438 enum machine_mode mode;
1440 if (GET_CODE (a) == EQ)
1442 op0 = XEXP (a, 0);
1443 op1 = XEXP (a, 1);
1445 if (REG_P (op0))
1447 r = simplify_replace_rtx (b, op0, op1);
1448 if (r == const_true_rtx)
1449 return true;
1452 if (REG_P (op1))
1454 r = simplify_replace_rtx (b, op1, op0);
1455 if (r == const_true_rtx)
1456 return true;
1460 /* A < B implies A + 1 <= B. */
1461 if ((GET_CODE (a) == GT || GET_CODE (a) == LT)
1462 && (GET_CODE (b) == GE || GET_CODE (b) == LE))
1464 op0 = XEXP (a, 0);
1465 op1 = XEXP (a, 1);
1466 opb0 = XEXP (b, 0);
1467 opb1 = XEXP (b, 1);
1469 if (GET_CODE (a) == GT)
1471 r = op0;
1472 op0 = op1;
1473 op1 = r;
1476 if (GET_CODE (b) == GE)
1478 r = opb0;
1479 opb0 = opb1;
1480 opb1 = r;
1483 mode = GET_MODE (op0);
1484 if (mode != GET_MODE (opb0))
1485 mode = VOIDmode;
1486 else if (mode == VOIDmode)
1488 mode = GET_MODE (op1);
1489 if (mode != GET_MODE (opb1))
1490 mode = VOIDmode;
1493 if (mode != VOIDmode
1494 && rtx_equal_p (op1, opb1)
1495 && simplify_gen_binary (MINUS, mode, opb0, op0) == const1_rtx)
1496 return true;
1499 return false;
1502 /* Canonicalizes COND so that
1504 (1) Ensure that operands are ordered according to
1505 swap_commutative_operands_p.
1506 (2) (LE x const) will be replaced with (LT x <const+1>) and similarly
1507 for GE, GEU, and LEU. */
1510 canon_condition (rtx cond)
1512 rtx tem;
1513 rtx op0, op1;
1514 enum rtx_code code;
1515 enum machine_mode mode;
1517 code = GET_CODE (cond);
1518 op0 = XEXP (cond, 0);
1519 op1 = XEXP (cond, 1);
1521 if (swap_commutative_operands_p (op0, op1))
1523 code = swap_condition (code);
1524 tem = op0;
1525 op0 = op1;
1526 op1 = tem;
1529 mode = GET_MODE (op0);
1530 if (mode == VOIDmode)
1531 mode = GET_MODE (op1);
1532 if (mode == VOIDmode)
1533 abort ();
1535 if (GET_CODE (op1) == CONST_INT
1536 && GET_MODE_CLASS (mode) != MODE_CC
1537 && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
1539 HOST_WIDE_INT const_val = INTVAL (op1);
1540 unsigned HOST_WIDE_INT uconst_val = const_val;
1541 unsigned HOST_WIDE_INT max_val
1542 = (unsigned HOST_WIDE_INT) GET_MODE_MASK (mode);
1544 switch (code)
1546 case LE:
1547 if ((unsigned HOST_WIDE_INT) const_val != max_val >> 1)
1548 code = LT, op1 = gen_int_mode (const_val + 1, GET_MODE (op0));
1549 break;
1551 /* When cross-compiling, const_val might be sign-extended from
1552 BITS_PER_WORD to HOST_BITS_PER_WIDE_INT */
1553 case GE:
1554 if ((HOST_WIDE_INT) (const_val & max_val)
1555 != (((HOST_WIDE_INT) 1
1556 << (GET_MODE_BITSIZE (GET_MODE (op0)) - 1))))
1557 code = GT, op1 = gen_int_mode (const_val - 1, mode);
1558 break;
1560 case LEU:
1561 if (uconst_val < max_val)
1562 code = LTU, op1 = gen_int_mode (uconst_val + 1, mode);
1563 break;
1565 case GEU:
1566 if (uconst_val != 0)
1567 code = GTU, op1 = gen_int_mode (uconst_val - 1, mode);
1568 break;
1570 default:
1571 break;
1575 if (op0 != XEXP (cond, 0)
1576 || op1 != XEXP (cond, 1)
1577 || code != GET_CODE (cond)
1578 || GET_MODE (cond) != SImode)
1579 cond = gen_rtx_fmt_ee (code, SImode, op0, op1);
1581 return cond;
1584 /* Tries to use the fact that COND holds to simplify EXPR. ALTERED is the
1585 set of altered regs. */
1587 void
1588 simplify_using_condition (rtx cond, rtx *expr, regset altered)
1590 rtx rev, reve, exp = *expr;
1592 if (!COMPARISON_P (exp))
1593 return;
1595 /* If some register gets altered later, we do not really speak about its
1596 value at the time of comparison. */
1597 if (altered
1598 && for_each_rtx (&cond, altered_reg_used, altered))
1599 return;
1601 rev = reversed_condition (cond);
1602 reve = reversed_condition (exp);
1604 cond = canon_condition (cond);
1605 exp = canon_condition (exp);
1606 if (rev)
1607 rev = canon_condition (rev);
1608 if (reve)
1609 reve = canon_condition (reve);
1611 if (rtx_equal_p (exp, cond))
1613 *expr = const_true_rtx;
1614 return;
1618 if (rev && rtx_equal_p (exp, rev))
1620 *expr = const0_rtx;
1621 return;
1624 if (implies_p (cond, exp))
1626 *expr = const_true_rtx;
1627 return;
1630 if (reve && implies_p (cond, reve))
1632 *expr = const0_rtx;
1633 return;
1636 /* A proof by contradiction. If *EXPR implies (not cond), *EXPR must
1637 be false. */
1638 if (rev && implies_p (exp, rev))
1640 *expr = const0_rtx;
1641 return;
1644 /* Similarly, If (not *EXPR) implies (not cond), *EXPR must be true. */
1645 if (rev && reve && implies_p (reve, rev))
1647 *expr = const_true_rtx;
1648 return;
1651 /* We would like to have some other tests here. TODO. */
1653 return;
1656 /* Use relationship between A and *B to eventually eliminate *B.
1657 OP is the operation we consider. */
1659 static void
1660 eliminate_implied_condition (enum rtx_code op, rtx a, rtx *b)
1662 if (op == AND)
1664 /* If A implies *B, we may replace *B by true. */
1665 if (implies_p (a, *b))
1666 *b = const_true_rtx;
1668 else if (op == IOR)
1670 /* If *B implies A, we may replace *B by false. */
1671 if (implies_p (*b, a))
1672 *b = const0_rtx;
1674 else
1675 abort ();
1678 /* Eliminates the conditions in TAIL that are implied by HEAD. OP is the
1679 operation we consider. */
1681 static void
1682 eliminate_implied_conditions (enum rtx_code op, rtx *head, rtx tail)
1684 rtx elt;
1686 for (elt = tail; elt; elt = XEXP (elt, 1))
1687 eliminate_implied_condition (op, *head, &XEXP (elt, 0));
1688 for (elt = tail; elt; elt = XEXP (elt, 1))
1689 eliminate_implied_condition (op, XEXP (elt, 0), head);
1692 /* Simplifies *EXPR using initial values at the start of the LOOP. If *EXPR
1693 is a list, its elements are assumed to be combined using OP. */
1695 static void
1696 simplify_using_initial_values (struct loop *loop, enum rtx_code op, rtx *expr)
1698 rtx head, tail, insn;
1699 rtx neutral, aggr;
1700 regset altered;
1701 regset_head altered_head;
1702 edge e;
1704 if (!*expr)
1705 return;
1707 if (CONSTANT_P (*expr))
1708 return;
1710 if (GET_CODE (*expr) == EXPR_LIST)
1712 head = XEXP (*expr, 0);
1713 tail = XEXP (*expr, 1);
1715 eliminate_implied_conditions (op, &head, tail);
1717 if (op == AND)
1719 neutral = const_true_rtx;
1720 aggr = const0_rtx;
1722 else if (op == IOR)
1724 neutral = const0_rtx;
1725 aggr = const_true_rtx;
1727 else
1728 abort ();
1730 simplify_using_initial_values (loop, UNKNOWN, &head);
1731 if (head == aggr)
1733 XEXP (*expr, 0) = aggr;
1734 XEXP (*expr, 1) = NULL_RTX;
1735 return;
1737 else if (head == neutral)
1739 *expr = tail;
1740 simplify_using_initial_values (loop, op, expr);
1741 return;
1743 simplify_using_initial_values (loop, op, &tail);
1745 if (tail && XEXP (tail, 0) == aggr)
1747 *expr = tail;
1748 return;
1751 XEXP (*expr, 0) = head;
1752 XEXP (*expr, 1) = tail;
1753 return;
1756 if (op != UNKNOWN)
1757 abort ();
1759 e = loop_preheader_edge (loop);
1760 if (e->src == ENTRY_BLOCK_PTR)
1761 return;
1763 altered = INITIALIZE_REG_SET (altered_head);
1765 while (1)
1767 basic_block tmp_bb;
1769 insn = BB_END (e->src);
1770 if (any_condjump_p (insn))
1772 rtx cond = get_condition (BB_END (e->src), NULL, false, true);
1774 if (cond && (e->flags & EDGE_FALLTHRU))
1775 cond = reversed_condition (cond);
1776 if (cond)
1778 simplify_using_condition (cond, expr, altered);
1779 if (CONSTANT_P (*expr))
1781 FREE_REG_SET (altered);
1782 return;
1787 FOR_BB_INSNS_REVERSE (e->src, insn)
1789 if (!INSN_P (insn))
1790 continue;
1792 simplify_using_assignment (insn, expr, altered);
1793 if (CONSTANT_P (*expr))
1795 FREE_REG_SET (altered);
1796 return;
1800 /* This is a bit subtle. Store away e->src in tmp_bb, since we
1801 modify `e' and this can invalidate the subsequent count of
1802 e->src's predecessors by looking at the wrong block. */
1803 tmp_bb = e->src;
1804 e = EDGE_PRED (tmp_bb, 0);
1805 if (EDGE_COUNT (tmp_bb->preds) > 1
1806 || e->src == ENTRY_BLOCK_PTR)
1807 break;
1810 FREE_REG_SET (altered);
1813 /* Transforms invariant IV into MODE. Adds assumptions based on the fact
1814 that IV occurs as left operands of comparison COND and its signedness
1815 is SIGNED_P to DESC. */
1817 static void
1818 shorten_into_mode (struct rtx_iv *iv, enum machine_mode mode,
1819 enum rtx_code cond, bool signed_p, struct niter_desc *desc)
1821 rtx mmin, mmax, cond_over, cond_under;
1823 get_mode_bounds (mode, signed_p, iv->extend_mode, &mmin, &mmax);
1824 cond_under = simplify_gen_relational (LT, SImode, iv->extend_mode,
1825 iv->base, mmin);
1826 cond_over = simplify_gen_relational (GT, SImode, iv->extend_mode,
1827 iv->base, mmax);
1829 switch (cond)
1831 case LE:
1832 case LT:
1833 case LEU:
1834 case LTU:
1835 if (cond_under != const0_rtx)
1836 desc->infinite =
1837 alloc_EXPR_LIST (0, cond_under, desc->infinite);
1838 if (cond_over != const0_rtx)
1839 desc->noloop_assumptions =
1840 alloc_EXPR_LIST (0, cond_over, desc->noloop_assumptions);
1841 break;
1843 case GE:
1844 case GT:
1845 case GEU:
1846 case GTU:
1847 if (cond_over != const0_rtx)
1848 desc->infinite =
1849 alloc_EXPR_LIST (0, cond_over, desc->infinite);
1850 if (cond_under != const0_rtx)
1851 desc->noloop_assumptions =
1852 alloc_EXPR_LIST (0, cond_under, desc->noloop_assumptions);
1853 break;
1855 case NE:
1856 if (cond_over != const0_rtx)
1857 desc->infinite =
1858 alloc_EXPR_LIST (0, cond_over, desc->infinite);
1859 if (cond_under != const0_rtx)
1860 desc->infinite =
1861 alloc_EXPR_LIST (0, cond_under, desc->infinite);
1862 break;
1864 default:
1865 abort ();
1868 iv->mode = mode;
1869 iv->extend = signed_p ? SIGN_EXTEND : ZERO_EXTEND;
1872 /* Transforms IV0 and IV1 compared by COND so that they are both compared as
1873 subregs of the same mode if possible (sometimes it is necessary to add
1874 some assumptions to DESC). */
1876 static bool
1877 canonicalize_iv_subregs (struct rtx_iv *iv0, struct rtx_iv *iv1,
1878 enum rtx_code cond, struct niter_desc *desc)
1880 enum machine_mode comp_mode;
1881 bool signed_p;
1883 /* If the ivs behave specially in the first iteration, or are
1884 added/multiplied after extending, we ignore them. */
1885 if (iv0->first_special || iv0->mult != const1_rtx || iv0->delta != const0_rtx)
1886 return false;
1887 if (iv1->first_special || iv1->mult != const1_rtx || iv1->delta != const0_rtx)
1888 return false;
1890 /* If there is some extend, it must match signedness of the comparison. */
1891 switch (cond)
1893 case LE:
1894 case LT:
1895 if (iv0->extend == ZERO_EXTEND
1896 || iv1->extend == ZERO_EXTEND)
1897 return false;
1898 signed_p = true;
1899 break;
1901 case LEU:
1902 case LTU:
1903 if (iv0->extend == SIGN_EXTEND
1904 || iv1->extend == SIGN_EXTEND)
1905 return false;
1906 signed_p = false;
1907 break;
1909 case NE:
1910 if (iv0->extend != UNKNOWN
1911 && iv1->extend != UNKNOWN
1912 && iv0->extend != iv1->extend)
1913 return false;
1915 signed_p = false;
1916 if (iv0->extend != UNKNOWN)
1917 signed_p = iv0->extend == SIGN_EXTEND;
1918 if (iv1->extend != UNKNOWN)
1919 signed_p = iv1->extend == SIGN_EXTEND;
1920 break;
1922 default:
1923 abort ();
1926 /* Values of both variables should be computed in the same mode. These
1927 might indeed be different, if we have comparison like
1929 (compare (subreg:SI (iv0)) (subreg:SI (iv1)))
1931 and iv0 and iv1 are both ivs iterating in SI mode, but calculated
1932 in different modes. This does not seem impossible to handle, but
1933 it hardly ever occurs in practice.
1935 The only exception is the case when one of operands is invariant.
1936 For example pentium 3 generates comparisons like
1937 (lt (subreg:HI (reg:SI)) 100). Here we assign HImode to 100, but we
1938 definitely do not want this prevent the optimization. */
1939 comp_mode = iv0->extend_mode;
1940 if (GET_MODE_BITSIZE (comp_mode) < GET_MODE_BITSIZE (iv1->extend_mode))
1941 comp_mode = iv1->extend_mode;
1943 if (iv0->extend_mode != comp_mode)
1945 if (iv0->mode != iv0->extend_mode
1946 || iv0->step != const0_rtx)
1947 return false;
1949 iv0->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND,
1950 comp_mode, iv0->base, iv0->mode);
1951 iv0->extend_mode = comp_mode;
1954 if (iv1->extend_mode != comp_mode)
1956 if (iv1->mode != iv1->extend_mode
1957 || iv1->step != const0_rtx)
1958 return false;
1960 iv1->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND,
1961 comp_mode, iv1->base, iv1->mode);
1962 iv1->extend_mode = comp_mode;
1965 /* Check that both ivs belong to a range of a single mode. If one of the
1966 operands is an invariant, we may need to shorten it into the common
1967 mode. */
1968 if (iv0->mode == iv0->extend_mode
1969 && iv0->step == const0_rtx
1970 && iv0->mode != iv1->mode)
1971 shorten_into_mode (iv0, iv1->mode, cond, signed_p, desc);
1973 if (iv1->mode == iv1->extend_mode
1974 && iv1->step == const0_rtx
1975 && iv0->mode != iv1->mode)
1976 shorten_into_mode (iv1, iv0->mode, swap_condition (cond), signed_p, desc);
1978 if (iv0->mode != iv1->mode)
1979 return false;
1981 desc->mode = iv0->mode;
1982 desc->signed_p = signed_p;
1984 return true;
1987 /* Computes number of iterations of the CONDITION in INSN in LOOP and stores
1988 the result into DESC. Very similar to determine_number_of_iterations
1989 (basically its rtl version), complicated by things like subregs. */
1991 void
1992 iv_number_of_iterations (struct loop *loop, rtx insn, rtx condition,
1993 struct niter_desc *desc)
1995 rtx op0, op1, delta, step, bound, may_xform, def_insn, tmp, tmp0, tmp1;
1996 struct rtx_iv iv0, iv1, tmp_iv;
1997 rtx assumption, may_not_xform;
1998 enum rtx_code cond;
1999 enum machine_mode mode, comp_mode;
2000 rtx mmin, mmax, mode_mmin, mode_mmax;
2001 unsigned HOST_WIDEST_INT s, size, d, inv;
2002 HOST_WIDEST_INT up, down, inc;
2003 int was_sharp = false;
2004 rtx old_niter;
2006 /* The meaning of these assumptions is this:
2007 if !assumptions
2008 then the rest of information does not have to be valid
2009 if noloop_assumptions then the loop does not roll
2010 if infinite then this exit is never used */
2012 desc->assumptions = NULL_RTX;
2013 desc->noloop_assumptions = NULL_RTX;
2014 desc->infinite = NULL_RTX;
2015 desc->simple_p = true;
2017 desc->const_iter = false;
2018 desc->niter_expr = NULL_RTX;
2019 desc->niter_max = 0;
2021 cond = GET_CODE (condition);
2022 if (!COMPARISON_P (condition))
2023 abort ();
2025 mode = GET_MODE (XEXP (condition, 0));
2026 if (mode == VOIDmode)
2027 mode = GET_MODE (XEXP (condition, 1));
2028 /* The constant comparisons should be folded. */
2029 if (mode == VOIDmode)
2030 abort ();
2032 /* We only handle integers or pointers. */
2033 if (GET_MODE_CLASS (mode) != MODE_INT
2034 && GET_MODE_CLASS (mode) != MODE_PARTIAL_INT)
2035 goto fail;
2037 op0 = XEXP (condition, 0);
2038 def_insn = iv_get_reaching_def (insn, op0);
2039 if (!iv_analyze (def_insn, op0, &iv0))
2040 goto fail;
2041 if (iv0.extend_mode == VOIDmode)
2042 iv0.mode = iv0.extend_mode = mode;
2044 op1 = XEXP (condition, 1);
2045 def_insn = iv_get_reaching_def (insn, op1);
2046 if (!iv_analyze (def_insn, op1, &iv1))
2047 goto fail;
2048 if (iv1.extend_mode == VOIDmode)
2049 iv1.mode = iv1.extend_mode = mode;
2051 if (GET_MODE_BITSIZE (iv0.extend_mode) > HOST_BITS_PER_WIDE_INT
2052 || GET_MODE_BITSIZE (iv1.extend_mode) > HOST_BITS_PER_WIDE_INT)
2053 goto fail;
2055 /* Check condition and normalize it. */
2057 switch (cond)
2059 case GE:
2060 case GT:
2061 case GEU:
2062 case GTU:
2063 tmp_iv = iv0; iv0 = iv1; iv1 = tmp_iv;
2064 cond = swap_condition (cond);
2065 break;
2066 case NE:
2067 case LE:
2068 case LEU:
2069 case LT:
2070 case LTU:
2071 break;
2072 default:
2073 goto fail;
2076 /* Handle extends. This is relatively nontrivial, so we only try in some
2077 easy cases, when we can canonicalize the ivs (possibly by adding some
2078 assumptions) to shape subreg (base + i * step). This function also fills
2079 in desc->mode and desc->signed_p. */
2081 if (!canonicalize_iv_subregs (&iv0, &iv1, cond, desc))
2082 goto fail;
2084 comp_mode = iv0.extend_mode;
2085 mode = iv0.mode;
2086 size = GET_MODE_BITSIZE (mode);
2087 get_mode_bounds (mode, (cond == LE || cond == LT), comp_mode, &mmin, &mmax);
2088 mode_mmin = lowpart_subreg (mode, mmin, comp_mode);
2089 mode_mmax = lowpart_subreg (mode, mmax, comp_mode);
2091 if (GET_CODE (iv0.step) != CONST_INT || GET_CODE (iv1.step) != CONST_INT)
2092 goto fail;
2094 /* We can take care of the case of two induction variables chasing each other
2095 if the test is NE. I have never seen a loop using it, but still it is
2096 cool. */
2097 if (iv0.step != const0_rtx && iv1.step != const0_rtx)
2099 if (cond != NE)
2100 goto fail;
2102 iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step);
2103 iv1.step = const0_rtx;
2106 /* This is either infinite loop or the one that ends immediately, depending
2107 on initial values. Unswitching should remove this kind of conditions. */
2108 if (iv0.step == const0_rtx && iv1.step == const0_rtx)
2109 goto fail;
2111 /* Ignore loops of while (i-- < 10) type. */
2112 if (cond != NE
2113 && (INTVAL (iv0.step) < 0 || INTVAL (iv1.step) > 0))
2114 goto fail;
2116 /* Some more condition normalization. We must record some assumptions
2117 due to overflows. */
2118 switch (cond)
2120 case LT:
2121 case LTU:
2122 /* We want to take care only of non-sharp relationals; this is easy,
2123 as in cases the overflow would make the transformation unsafe
2124 the loop does not roll. Seemingly it would make more sense to want
2125 to take care of sharp relationals instead, as NE is more similar to
2126 them, but the problem is that here the transformation would be more
2127 difficult due to possibly infinite loops. */
2128 if (iv0.step == const0_rtx)
2130 tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2131 assumption = simplify_gen_relational (EQ, SImode, mode, tmp,
2132 mode_mmax);
2133 if (assumption == const_true_rtx)
2134 goto zero_iter;
2135 iv0.base = simplify_gen_binary (PLUS, comp_mode,
2136 iv0.base, const1_rtx);
2138 else
2140 tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2141 assumption = simplify_gen_relational (EQ, SImode, mode, tmp,
2142 mode_mmin);
2143 if (assumption == const_true_rtx)
2144 goto zero_iter;
2145 iv1.base = simplify_gen_binary (PLUS, comp_mode,
2146 iv1.base, constm1_rtx);
2149 if (assumption != const0_rtx)
2150 desc->noloop_assumptions =
2151 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2152 cond = (cond == LT) ? LE : LEU;
2154 /* It will be useful to be able to tell the difference once more in
2155 LE -> NE reduction. */
2156 was_sharp = true;
2157 break;
2158 default: ;
2161 /* Take care of trivially infinite loops. */
2162 if (cond != NE)
2164 if (iv0.step == const0_rtx)
2166 tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2167 if (rtx_equal_p (tmp, mode_mmin))
2169 desc->infinite =
2170 alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX);
2171 return;
2174 else
2176 tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2177 if (rtx_equal_p (tmp, mode_mmax))
2179 desc->infinite =
2180 alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX);
2181 return;
2186 /* If we can we want to take care of NE conditions instead of size
2187 comparisons, as they are much more friendly (most importantly
2188 this takes care of special handling of loops with step 1). We can
2189 do it if we first check that upper bound is greater or equal to
2190 lower bound, their difference is constant c modulo step and that
2191 there is not an overflow. */
2192 if (cond != NE)
2194 if (iv0.step == const0_rtx)
2195 step = simplify_gen_unary (NEG, comp_mode, iv1.step, comp_mode);
2196 else
2197 step = iv0.step;
2198 delta = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base);
2199 delta = lowpart_subreg (mode, delta, comp_mode);
2200 delta = simplify_gen_binary (UMOD, mode, delta, step);
2201 may_xform = const0_rtx;
2202 may_not_xform = const_true_rtx;
2204 if (GET_CODE (delta) == CONST_INT)
2206 if (was_sharp && INTVAL (delta) == INTVAL (step) - 1)
2208 /* A special case. We have transformed condition of type
2209 for (i = 0; i < 4; i += 4)
2210 into
2211 for (i = 0; i <= 3; i += 4)
2212 obviously if the test for overflow during that transformation
2213 passed, we cannot overflow here. Most importantly any
2214 loop with sharp end condition and step 1 falls into this
2215 category, so handling this case specially is definitely
2216 worth the troubles. */
2217 may_xform = const_true_rtx;
2219 else if (iv0.step == const0_rtx)
2221 bound = simplify_gen_binary (PLUS, comp_mode, mmin, step);
2222 bound = simplify_gen_binary (MINUS, comp_mode, bound, delta);
2223 bound = lowpart_subreg (mode, bound, comp_mode);
2224 tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2225 may_xform = simplify_gen_relational (cond, SImode, mode,
2226 bound, tmp);
2227 may_not_xform = simplify_gen_relational (reverse_condition (cond),
2228 SImode, mode,
2229 bound, tmp);
2231 else
2233 bound = simplify_gen_binary (MINUS, comp_mode, mmax, step);
2234 bound = simplify_gen_binary (PLUS, comp_mode, bound, delta);
2235 bound = lowpart_subreg (mode, bound, comp_mode);
2236 tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2237 may_xform = simplify_gen_relational (cond, SImode, mode,
2238 tmp, bound);
2239 may_not_xform = simplify_gen_relational (reverse_condition (cond),
2240 SImode, mode,
2241 tmp, bound);
2245 if (may_xform != const0_rtx)
2247 /* We perform the transformation always provided that it is not
2248 completely senseless. This is OK, as we would need this assumption
2249 to determine the number of iterations anyway. */
2250 if (may_xform != const_true_rtx)
2252 /* If the step is a power of two and the final value we have
2253 computed overflows, the cycle is infinite. Otherwise it
2254 is nontrivial to compute the number of iterations. */
2255 s = INTVAL (step);
2256 if ((s & (s - 1)) == 0)
2257 desc->infinite = alloc_EXPR_LIST (0, may_not_xform,
2258 desc->infinite);
2259 else
2260 desc->assumptions = alloc_EXPR_LIST (0, may_xform,
2261 desc->assumptions);
2264 /* We are going to lose some information about upper bound on
2265 number of iterations in this step, so record the information
2266 here. */
2267 inc = INTVAL (iv0.step) - INTVAL (iv1.step);
2268 if (GET_CODE (iv1.base) == CONST_INT)
2269 up = INTVAL (iv1.base);
2270 else
2271 up = INTVAL (mode_mmax) - inc;
2272 down = INTVAL (GET_CODE (iv0.base) == CONST_INT
2273 ? iv0.base
2274 : mode_mmin);
2275 desc->niter_max = (up - down) / inc + 1;
2277 if (iv0.step == const0_rtx)
2279 iv0.base = simplify_gen_binary (PLUS, comp_mode, iv0.base, delta);
2280 iv0.base = simplify_gen_binary (MINUS, comp_mode, iv0.base, step);
2282 else
2284 iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, delta);
2285 iv1.base = simplify_gen_binary (PLUS, comp_mode, iv1.base, step);
2288 tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2289 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2290 assumption = simplify_gen_relational (reverse_condition (cond),
2291 SImode, mode, tmp0, tmp1);
2292 if (assumption == const_true_rtx)
2293 goto zero_iter;
2294 else if (assumption != const0_rtx)
2295 desc->noloop_assumptions =
2296 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2297 cond = NE;
2301 /* Count the number of iterations. */
2302 if (cond == NE)
2304 /* Everything we do here is just arithmetics modulo size of mode. This
2305 makes us able to do more involved computations of number of iterations
2306 than in other cases. First transform the condition into shape
2307 s * i <> c, with s positive. */
2308 iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base);
2309 iv0.base = const0_rtx;
2310 iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step);
2311 iv1.step = const0_rtx;
2312 if (INTVAL (iv0.step) < 0)
2314 iv0.step = simplify_gen_unary (NEG, comp_mode, iv0.step, mode);
2315 iv1.base = simplify_gen_unary (NEG, comp_mode, iv1.base, mode);
2317 iv0.step = lowpart_subreg (mode, iv0.step, comp_mode);
2319 /* Let nsd (s, size of mode) = d. If d does not divide c, the loop
2320 is infinite. Otherwise, the number of iterations is
2321 (inverse(s/d) * (c/d)) mod (size of mode/d). */
2322 s = INTVAL (iv0.step); d = 1;
2323 while (s % 2 != 1)
2325 s /= 2;
2326 d *= 2;
2327 size--;
2329 bound = GEN_INT (((unsigned HOST_WIDEST_INT) 1 << (size - 1 ) << 1) - 1);
2331 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2332 tmp = simplify_gen_binary (UMOD, mode, tmp1, GEN_INT (d));
2333 assumption = simplify_gen_relational (NE, SImode, mode, tmp, const0_rtx);
2334 desc->infinite = alloc_EXPR_LIST (0, assumption, desc->infinite);
2336 tmp = simplify_gen_binary (UDIV, mode, tmp1, GEN_INT (d));
2337 inv = inverse (s, size);
2338 inv = trunc_int_for_mode (inv, mode);
2339 tmp = simplify_gen_binary (MULT, mode, tmp, GEN_INT (inv));
2340 desc->niter_expr = simplify_gen_binary (AND, mode, tmp, bound);
2342 else
2344 if (iv1.step == const0_rtx)
2345 /* Condition in shape a + s * i <= b
2346 We must know that b + s does not overflow and a <= b + s and then we
2347 can compute number of iterations as (b + s - a) / s. (It might
2348 seem that we in fact could be more clever about testing the b + s
2349 overflow condition using some information about b - a mod s,
2350 but it was already taken into account during LE -> NE transform). */
2352 step = iv0.step;
2353 tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2354 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2356 bound = simplify_gen_binary (MINUS, mode, mode_mmax,
2357 lowpart_subreg (mode, step, comp_mode));
2358 assumption = simplify_gen_relational (cond, SImode, mode,
2359 tmp1, bound);
2360 desc->assumptions =
2361 alloc_EXPR_LIST (0, assumption, desc->assumptions);
2363 tmp = simplify_gen_binary (PLUS, comp_mode, iv1.base, iv0.step);
2364 tmp = lowpart_subreg (mode, tmp, comp_mode);
2365 assumption = simplify_gen_relational (reverse_condition (cond),
2366 SImode, mode, tmp0, tmp);
2368 delta = simplify_gen_binary (PLUS, mode, tmp1, step);
2369 delta = simplify_gen_binary (MINUS, mode, delta, tmp0);
2371 else
2373 /* Condition in shape a <= b - s * i
2374 We must know that a - s does not overflow and a - s <= b and then
2375 we can again compute number of iterations as (b - (a - s)) / s. */
2376 step = simplify_gen_unary (NEG, mode, iv1.step, mode);
2377 tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2378 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2380 bound = simplify_gen_binary (MINUS, mode, mode_mmin,
2381 lowpart_subreg (mode, step, comp_mode));
2382 assumption = simplify_gen_relational (cond, SImode, mode,
2383 bound, tmp0);
2384 desc->assumptions =
2385 alloc_EXPR_LIST (0, assumption, desc->assumptions);
2387 tmp = simplify_gen_binary (PLUS, comp_mode, iv0.base, iv1.step);
2388 tmp = lowpart_subreg (mode, tmp, comp_mode);
2389 assumption = simplify_gen_relational (reverse_condition (cond),
2390 SImode, mode,
2391 tmp, tmp1);
2392 delta = simplify_gen_binary (MINUS, mode, tmp0, step);
2393 delta = simplify_gen_binary (MINUS, mode, tmp1, delta);
2395 if (assumption == const_true_rtx)
2396 goto zero_iter;
2397 else if (assumption != const0_rtx)
2398 desc->noloop_assumptions =
2399 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2400 delta = simplify_gen_binary (UDIV, mode, delta, step);
2401 desc->niter_expr = delta;
2404 old_niter = desc->niter_expr;
2406 simplify_using_initial_values (loop, AND, &desc->assumptions);
2407 if (desc->assumptions
2408 && XEXP (desc->assumptions, 0) == const0_rtx)
2409 goto fail;
2410 simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions);
2411 simplify_using_initial_values (loop, IOR, &desc->infinite);
2412 simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr);
2414 /* Rerun the simplification. Consider code (created by copying loop headers)
2416 i = 0;
2418 if (0 < n)
2422 i++;
2423 } while (i < n);
2426 The first pass determines that i = 0, the second pass uses it to eliminate
2427 noloop assumption. */
2429 simplify_using_initial_values (loop, AND, &desc->assumptions);
2430 if (desc->assumptions
2431 && XEXP (desc->assumptions, 0) == const0_rtx)
2432 goto fail;
2433 simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions);
2434 simplify_using_initial_values (loop, IOR, &desc->infinite);
2435 simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr);
2437 if (desc->noloop_assumptions
2438 && XEXP (desc->noloop_assumptions, 0) == const_true_rtx)
2439 goto zero_iter;
2441 if (GET_CODE (desc->niter_expr) == CONST_INT)
2443 unsigned HOST_WIDEST_INT val = INTVAL (desc->niter_expr);
2445 desc->const_iter = true;
2446 desc->niter_max = desc->niter = val & GET_MODE_MASK (desc->mode);
2448 else
2450 if (!desc->niter_max)
2451 desc->niter_max = determine_max_iter (desc);
2453 /* simplify_using_initial_values does a copy propagation on the registers
2454 in the expression for the number of iterations. This prolongs life
2455 ranges of registers and increases register pressure, and usually
2456 brings no gain (and if it happens to do, the cse pass will take care
2457 of it anyway). So prevent this behavior, unless it enabled us to
2458 derive that the number of iterations is a constant. */
2459 desc->niter_expr = old_niter;
2462 return;
2464 fail:
2465 desc->simple_p = false;
2466 return;
2468 zero_iter:
2469 desc->const_iter = true;
2470 desc->niter = 0;
2471 desc->niter_max = 0;
2472 desc->niter_expr = const0_rtx;
2473 return;
2476 /* Checks whether E is a simple exit from LOOP and stores its description
2477 into DESC. */
2479 static void
2480 check_simple_exit (struct loop *loop, edge e, struct niter_desc *desc)
2482 basic_block exit_bb;
2483 rtx condition, at;
2484 edge ei;
2486 exit_bb = e->src;
2487 desc->simple_p = false;
2489 /* It must belong directly to the loop. */
2490 if (exit_bb->loop_father != loop)
2491 return;
2493 /* It must be tested (at least) once during any iteration. */
2494 if (!dominated_by_p (CDI_DOMINATORS, loop->latch, exit_bb))
2495 return;
2497 /* It must end in a simple conditional jump. */
2498 if (!any_condjump_p (BB_END (exit_bb)))
2499 return;
2501 ei = EDGE_SUCC (exit_bb, 0);
2502 if (ei == e)
2503 ei = EDGE_SUCC (exit_bb, 1);
2505 desc->out_edge = e;
2506 desc->in_edge = ei;
2508 /* Test whether the condition is suitable. */
2509 if (!(condition = get_condition (BB_END (ei->src), &at, false, false)))
2510 return;
2512 if (ei->flags & EDGE_FALLTHRU)
2514 condition = reversed_condition (condition);
2515 if (!condition)
2516 return;
2519 /* Check that we are able to determine number of iterations and fill
2520 in information about it. */
2521 iv_number_of_iterations (loop, at, condition, desc);
2524 /* Finds a simple exit of LOOP and stores its description into DESC. */
2526 void
2527 find_simple_exit (struct loop *loop, struct niter_desc *desc)
2529 unsigned i;
2530 basic_block *body;
2531 edge e;
2532 struct niter_desc act;
2533 bool any = false;
2535 desc->simple_p = false;
2536 body = get_loop_body (loop);
2538 for (i = 0; i < loop->num_nodes; i++)
2540 FOR_EACH_EDGE (e, body[i]->succs)
2542 if (flow_bb_inside_loop_p (loop, e->dest))
2543 continue;
2545 check_simple_exit (loop, e, &act);
2546 if (!act.simple_p)
2547 continue;
2549 /* Prefer constant iterations; the less the better. */
2550 if (!any)
2551 any = true;
2552 else if (!act.const_iter
2553 || (desc->const_iter && act.niter >= desc->niter))
2554 continue;
2555 *desc = act;
2557 END_FOR_EACH_EDGE;
2560 if (dump_file)
2562 if (desc->simple_p)
2564 fprintf (dump_file, "Loop %d is simple:\n", loop->num);
2565 fprintf (dump_file, " simple exit %d -> %d\n",
2566 desc->out_edge->src->index,
2567 desc->out_edge->dest->index);
2568 if (desc->assumptions)
2570 fprintf (dump_file, " assumptions: ");
2571 print_rtl (dump_file, desc->assumptions);
2572 fprintf (dump_file, "\n");
2574 if (desc->noloop_assumptions)
2576 fprintf (dump_file, " does not roll if: ");
2577 print_rtl (dump_file, desc->noloop_assumptions);
2578 fprintf (dump_file, "\n");
2580 if (desc->infinite)
2582 fprintf (dump_file, " infinite if: ");
2583 print_rtl (dump_file, desc->infinite);
2584 fprintf (dump_file, "\n");
2587 fprintf (dump_file, " number of iterations: ");
2588 print_rtl (dump_file, desc->niter_expr);
2589 fprintf (dump_file, "\n");
2591 fprintf (dump_file, " upper bound: ");
2592 fprintf (dump_file, HOST_WIDEST_INT_PRINT_DEC, desc->niter_max);
2593 fprintf (dump_file, "\n");
2595 else
2596 fprintf (dump_file, "Loop %d is not simple.\n", loop->num);
2599 free (body);
2602 /* Creates a simple loop description of LOOP if it was not computed
2603 already. */
2605 struct niter_desc *
2606 get_simple_loop_desc (struct loop *loop)
2608 struct niter_desc *desc = simple_loop_desc (loop);
2610 if (desc)
2611 return desc;
2613 desc = xmalloc (sizeof (struct niter_desc));
2614 iv_analysis_loop_init (loop);
2615 find_simple_exit (loop, desc);
2616 loop->aux = desc;
2618 return desc;
2621 /* Releases simple loop description for LOOP. */
2623 void
2624 free_simple_loop_desc (struct loop *loop)
2626 struct niter_desc *desc = simple_loop_desc (loop);
2628 if (!desc)
2629 return;
2631 free (desc);
2632 loop->aux = NULL;