* config/arm/elf.h (ASM_OUTPUT_ALIGNED_COMMON): Remove definition.
[official-gcc.git] / gcc / regmove.c
blob2639ebd54f418003265eafb50b80abe5e45f67de
1 /* Move registers around to reduce number of move instructions needed.
2 Copyright (C) 1987, 1988, 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998,
3 1999, 2000, 2001, 2002, 2003 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
23 /* This module looks for cases where matching constraints would force
24 an instruction to need a reload, and this reload would be a register
25 to register move. It then attempts to change the registers used by the
26 instruction to avoid the move instruction. */
28 #include "config.h"
29 #include "system.h"
30 #include "coretypes.h"
31 #include "tm.h"
32 #include "rtl.h" /* stdio.h must precede rtl.h for FFS. */
33 #include "tm_p.h"
34 #include "insn-config.h"
35 #include "recog.h"
36 #include "output.h"
37 #include "regs.h"
38 #include "hard-reg-set.h"
39 #include "flags.h"
40 #include "function.h"
41 #include "expr.h"
42 #include "basic-block.h"
43 #include "except.h"
44 #include "toplev.h"
45 #include "reload.h"
48 /* Turn STACK_GROWS_DOWNWARD into a boolean. */
49 #ifdef STACK_GROWS_DOWNWARD
50 #undef STACK_GROWS_DOWNWARD
51 #define STACK_GROWS_DOWNWARD 1
52 #else
53 #define STACK_GROWS_DOWNWARD 0
54 #endif
56 static int perhaps_ends_bb_p PARAMS ((rtx));
57 static int optimize_reg_copy_1 PARAMS ((rtx, rtx, rtx));
58 static void optimize_reg_copy_2 PARAMS ((rtx, rtx, rtx));
59 static void optimize_reg_copy_3 PARAMS ((rtx, rtx, rtx));
60 static void copy_src_to_dest PARAMS ((rtx, rtx, rtx, int));
61 static int *regmove_bb_head;
63 struct match {
64 int with[MAX_RECOG_OPERANDS];
65 enum { READ, WRITE, READWRITE } use[MAX_RECOG_OPERANDS];
66 int commutative[MAX_RECOG_OPERANDS];
67 int early_clobber[MAX_RECOG_OPERANDS];
70 static rtx discover_flags_reg PARAMS ((void));
71 static void mark_flags_life_zones PARAMS ((rtx));
72 static void flags_set_1 PARAMS ((rtx, rtx, void *));
74 static int try_auto_increment PARAMS ((rtx, rtx, rtx, rtx, HOST_WIDE_INT, int));
75 static int find_matches PARAMS ((rtx, struct match *));
76 static void replace_in_call_usage PARAMS ((rtx *, unsigned int, rtx, rtx));
77 static int fixup_match_1 PARAMS ((rtx, rtx, rtx, rtx, rtx, int, int, int, FILE *))
79 static int reg_is_remote_constant_p PARAMS ((rtx, rtx, rtx));
80 static int stable_and_no_regs_but_for_p PARAMS ((rtx, rtx, rtx));
81 static int regclass_compatible_p PARAMS ((int, int));
82 static int replacement_quality PARAMS ((rtx));
83 static int fixup_match_2 PARAMS ((rtx, rtx, rtx, rtx, FILE *));
85 /* Return nonzero if registers with CLASS1 and CLASS2 can be merged without
86 causing too much register allocation problems. */
87 static int
88 regclass_compatible_p (class0, class1)
89 int class0, class1;
91 return (class0 == class1
92 || (reg_class_subset_p (class0, class1)
93 && ! CLASS_LIKELY_SPILLED_P (class0))
94 || (reg_class_subset_p (class1, class0)
95 && ! CLASS_LIKELY_SPILLED_P (class1)));
98 /* INC_INSN is an instruction that adds INCREMENT to REG.
99 Try to fold INC_INSN as a post/pre in/decrement into INSN.
100 Iff INC_INSN_SET is nonzero, inc_insn has a destination different from src.
101 Return nonzero for success. */
102 static int
103 try_auto_increment (insn, inc_insn, inc_insn_set, reg, increment, pre)
104 rtx reg, insn, inc_insn ,inc_insn_set;
105 HOST_WIDE_INT increment;
106 int pre;
108 enum rtx_code inc_code;
110 rtx pset = single_set (insn);
111 if (pset)
113 /* Can't use the size of SET_SRC, we might have something like
114 (sign_extend:SI (mem:QI ... */
115 rtx use = find_use_as_address (pset, reg, 0);
116 if (use != 0 && use != (rtx) (size_t) 1)
118 int size = GET_MODE_SIZE (GET_MODE (use));
119 if (0
120 || (HAVE_POST_INCREMENT
121 && pre == 0 && (inc_code = POST_INC, increment == size))
122 || (HAVE_PRE_INCREMENT
123 && pre == 1 && (inc_code = PRE_INC, increment == size))
124 || (HAVE_POST_DECREMENT
125 && pre == 0 && (inc_code = POST_DEC, increment == -size))
126 || (HAVE_PRE_DECREMENT
127 && pre == 1 && (inc_code = PRE_DEC, increment == -size))
130 if (inc_insn_set)
131 validate_change
132 (inc_insn,
133 &SET_SRC (inc_insn_set),
134 XEXP (SET_SRC (inc_insn_set), 0), 1);
135 validate_change (insn, &XEXP (use, 0),
136 gen_rtx_fmt_e (inc_code, Pmode, reg), 1);
137 if (apply_change_group ())
139 /* If there is a REG_DEAD note on this insn, we must
140 change this not to REG_UNUSED meaning that the register
141 is set, but the value is dead. Failure to do so will
142 result in a sched1 abort -- when it recomputes lifetime
143 information, the number of REG_DEAD notes will have
144 changed. */
145 rtx note = find_reg_note (insn, REG_DEAD, reg);
146 if (note)
147 PUT_MODE (note, REG_UNUSED);
149 REG_NOTES (insn)
150 = gen_rtx_EXPR_LIST (REG_INC,
151 reg, REG_NOTES (insn));
152 if (! inc_insn_set)
153 delete_insn (inc_insn);
154 return 1;
159 return 0;
162 /* Determine if the pattern generated by add_optab has a clobber,
163 such as might be issued for a flags hard register. To make the
164 code elsewhere simpler, we handle cc0 in this same framework.
166 Return the register if one was discovered. Return NULL_RTX if
167 if no flags were found. Return pc_rtx if we got confused. */
169 static rtx
170 discover_flags_reg ()
172 rtx tmp;
173 tmp = gen_rtx_REG (word_mode, 10000);
174 tmp = gen_add3_insn (tmp, tmp, GEN_INT (2));
176 /* If we get something that isn't a simple set, or a
177 [(set ..) (clobber ..)], this whole function will go wrong. */
178 if (GET_CODE (tmp) == SET)
179 return NULL_RTX;
180 else if (GET_CODE (tmp) == PARALLEL)
182 int found;
184 if (XVECLEN (tmp, 0) != 2)
185 return pc_rtx;
186 tmp = XVECEXP (tmp, 0, 1);
187 if (GET_CODE (tmp) != CLOBBER)
188 return pc_rtx;
189 tmp = XEXP (tmp, 0);
191 /* Don't do anything foolish if the md wanted to clobber a
192 scratch or something. We only care about hard regs.
193 Moreover we don't like the notion of subregs of hard regs. */
194 if (GET_CODE (tmp) == SUBREG
195 && GET_CODE (SUBREG_REG (tmp)) == REG
196 && REGNO (SUBREG_REG (tmp)) < FIRST_PSEUDO_REGISTER)
197 return pc_rtx;
198 found = (GET_CODE (tmp) == REG && REGNO (tmp) < FIRST_PSEUDO_REGISTER);
200 return (found ? tmp : NULL_RTX);
203 return pc_rtx;
206 /* It is a tedious task identifying when the flags register is live and
207 when it is safe to optimize. Since we process the instruction stream
208 multiple times, locate and record these live zones by marking the
209 mode of the instructions --
211 QImode is used on the instruction at which the flags becomes live.
213 HImode is used within the range (exclusive) that the flags are
214 live. Thus the user of the flags is not marked.
216 All other instructions are cleared to VOIDmode. */
218 /* Used to communicate with flags_set_1. */
219 static rtx flags_set_1_rtx;
220 static int flags_set_1_set;
222 static void
223 mark_flags_life_zones (flags)
224 rtx flags;
226 int flags_regno;
227 int flags_nregs;
228 basic_block block;
230 #ifdef HAVE_cc0
231 /* If we found a flags register on a cc0 host, bail. */
232 if (flags == NULL_RTX)
233 flags = cc0_rtx;
234 else if (flags != cc0_rtx)
235 flags = pc_rtx;
236 #endif
238 /* Simple cases first: if no flags, clear all modes. If confusing,
239 mark the entire function as being in a flags shadow. */
240 if (flags == NULL_RTX || flags == pc_rtx)
242 enum machine_mode mode = (flags ? HImode : VOIDmode);
243 rtx insn;
244 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
245 PUT_MODE (insn, mode);
246 return;
249 #ifdef HAVE_cc0
250 flags_regno = -1;
251 flags_nregs = 1;
252 #else
253 flags_regno = REGNO (flags);
254 flags_nregs = HARD_REGNO_NREGS (flags_regno, GET_MODE (flags));
255 #endif
256 flags_set_1_rtx = flags;
258 /* Process each basic block. */
259 FOR_EACH_BB_REVERSE (block)
261 rtx insn, end;
262 int live;
264 insn = block->head;
265 end = block->end;
267 /* Look out for the (unlikely) case of flags being live across
268 basic block boundaries. */
269 live = 0;
270 #ifndef HAVE_cc0
272 int i;
273 for (i = 0; i < flags_nregs; ++i)
274 live |= REGNO_REG_SET_P (block->global_live_at_start,
275 flags_regno + i);
277 #endif
279 while (1)
281 /* Process liveness in reverse order of importance --
282 alive, death, birth. This lets more important info
283 overwrite the mode of lesser info. */
285 if (INSN_P (insn))
287 #ifdef HAVE_cc0
288 /* In the cc0 case, death is not marked in reg notes,
289 but is instead the mere use of cc0 when it is alive. */
290 if (live && reg_mentioned_p (cc0_rtx, PATTERN (insn)))
291 live = 0;
292 #else
293 /* In the hard reg case, we watch death notes. */
294 if (live && find_regno_note (insn, REG_DEAD, flags_regno))
295 live = 0;
296 #endif
297 PUT_MODE (insn, (live ? HImode : VOIDmode));
299 /* In either case, birth is denoted simply by it's presence
300 as the destination of a set. */
301 flags_set_1_set = 0;
302 note_stores (PATTERN (insn), flags_set_1, NULL);
303 if (flags_set_1_set)
305 live = 1;
306 PUT_MODE (insn, QImode);
309 else
310 PUT_MODE (insn, (live ? HImode : VOIDmode));
312 if (insn == end)
313 break;
314 insn = NEXT_INSN (insn);
319 /* A subroutine of mark_flags_life_zones, called through note_stores. */
321 static void
322 flags_set_1 (x, pat, data)
323 rtx x, pat;
324 void *data ATTRIBUTE_UNUSED;
326 if (GET_CODE (pat) == SET
327 && reg_overlap_mentioned_p (x, flags_set_1_rtx))
328 flags_set_1_set = 1;
331 static int *regno_src_regno;
333 /* Indicate how good a choice REG (which appears as a source) is to replace
334 a destination register with. The higher the returned value, the better
335 the choice. The main objective is to avoid using a register that is
336 a candidate for tying to a hard register, since the output might in
337 turn be a candidate to be tied to a different hard register. */
338 static int
339 replacement_quality (reg)
340 rtx reg;
342 int src_regno;
344 /* Bad if this isn't a register at all. */
345 if (GET_CODE (reg) != REG)
346 return 0;
348 /* If this register is not meant to get a hard register,
349 it is a poor choice. */
350 if (REG_LIVE_LENGTH (REGNO (reg)) < 0)
351 return 0;
353 src_regno = regno_src_regno[REGNO (reg)];
355 /* If it was not copied from another register, it is fine. */
356 if (src_regno < 0)
357 return 3;
359 /* Copied from a hard register? */
360 if (src_regno < FIRST_PSEUDO_REGISTER)
361 return 1;
363 /* Copied from a pseudo register - not as bad as from a hard register,
364 yet still cumbersome, since the register live length will be lengthened
365 when the registers get tied. */
366 return 2;
369 /* Return 1 if INSN might end a basic block. */
371 static int perhaps_ends_bb_p (insn)
372 rtx insn;
374 switch (GET_CODE (insn))
376 case CODE_LABEL:
377 case JUMP_INSN:
378 /* These always end a basic block. */
379 return 1;
381 case CALL_INSN:
382 /* A CALL_INSN might be the last insn of a basic block, if it is inside
383 an EH region or if there are nonlocal gotos. Note that this test is
384 very conservative. */
385 if (nonlocal_goto_handler_labels)
386 return 1;
387 /* FALLTHRU */
388 default:
389 return can_throw_internal (insn);
393 /* INSN is a copy from SRC to DEST, both registers, and SRC does not die
394 in INSN.
396 Search forward to see if SRC dies before either it or DEST is modified,
397 but don't scan past the end of a basic block. If so, we can replace SRC
398 with DEST and let SRC die in INSN.
400 This will reduce the number of registers live in that range and may enable
401 DEST to be tied to SRC, thus often saving one register in addition to a
402 register-register copy. */
404 static int
405 optimize_reg_copy_1 (insn, dest, src)
406 rtx insn;
407 rtx dest;
408 rtx src;
410 rtx p, q;
411 rtx note;
412 rtx dest_death = 0;
413 int sregno = REGNO (src);
414 int dregno = REGNO (dest);
416 /* We don't want to mess with hard regs if register classes are small. */
417 if (sregno == dregno
418 || (SMALL_REGISTER_CLASSES
419 && (sregno < FIRST_PSEUDO_REGISTER
420 || dregno < FIRST_PSEUDO_REGISTER))
421 /* We don't see all updates to SP if they are in an auto-inc memory
422 reference, so we must disallow this optimization on them. */
423 || sregno == STACK_POINTER_REGNUM || dregno == STACK_POINTER_REGNUM)
424 return 0;
426 for (p = NEXT_INSN (insn); p; p = NEXT_INSN (p))
428 /* ??? We can't scan past the end of a basic block without updating
429 the register lifetime info (REG_DEAD/basic_block_live_at_start). */
430 if (perhaps_ends_bb_p (p))
431 break;
432 else if (! INSN_P (p))
433 continue;
435 if (reg_set_p (src, p) || reg_set_p (dest, p)
436 /* If SRC is an asm-declared register, it must not be replaced
437 in any asm. Unfortunately, the REG_EXPR tree for the asm
438 variable may be absent in the SRC rtx, so we can't check the
439 actual register declaration easily (the asm operand will have
440 it, though). To avoid complicating the test for a rare case,
441 we just don't perform register replacement for a hard reg
442 mentioned in an asm. */
443 || (sregno < FIRST_PSEUDO_REGISTER
444 && asm_noperands (PATTERN (p)) >= 0
445 && reg_overlap_mentioned_p (src, PATTERN (p)))
446 /* Don't change a USE of a register. */
447 || (GET_CODE (PATTERN (p)) == USE
448 && reg_overlap_mentioned_p (src, XEXP (PATTERN (p), 0))))
449 break;
451 /* See if all of SRC dies in P. This test is slightly more
452 conservative than it needs to be. */
453 if ((note = find_regno_note (p, REG_DEAD, sregno)) != 0
454 && GET_MODE (XEXP (note, 0)) == GET_MODE (src))
456 int failed = 0;
457 int d_length = 0;
458 int s_length = 0;
459 int d_n_calls = 0;
460 int s_n_calls = 0;
462 /* We can do the optimization. Scan forward from INSN again,
463 replacing regs as we go. Set FAILED if a replacement can't
464 be done. In that case, we can't move the death note for SRC.
465 This should be rare. */
467 /* Set to stop at next insn. */
468 for (q = next_real_insn (insn);
469 q != next_real_insn (p);
470 q = next_real_insn (q))
472 if (reg_overlap_mentioned_p (src, PATTERN (q)))
474 /* If SRC is a hard register, we might miss some
475 overlapping registers with validate_replace_rtx,
476 so we would have to undo it. We can't if DEST is
477 present in the insn, so fail in that combination
478 of cases. */
479 if (sregno < FIRST_PSEUDO_REGISTER
480 && reg_mentioned_p (dest, PATTERN (q)))
481 failed = 1;
483 /* Replace all uses and make sure that the register
484 isn't still present. */
485 else if (validate_replace_rtx (src, dest, q)
486 && (sregno >= FIRST_PSEUDO_REGISTER
487 || ! reg_overlap_mentioned_p (src,
488 PATTERN (q))))
490 else
492 validate_replace_rtx (dest, src, q);
493 failed = 1;
497 /* For SREGNO, count the total number of insns scanned.
498 For DREGNO, count the total number of insns scanned after
499 passing the death note for DREGNO. */
500 s_length++;
501 if (dest_death)
502 d_length++;
504 /* If the insn in which SRC dies is a CALL_INSN, don't count it
505 as a call that has been crossed. Otherwise, count it. */
506 if (q != p && GET_CODE (q) == CALL_INSN)
508 /* Similarly, total calls for SREGNO, total calls beyond
509 the death note for DREGNO. */
510 s_n_calls++;
511 if (dest_death)
512 d_n_calls++;
515 /* If DEST dies here, remove the death note and save it for
516 later. Make sure ALL of DEST dies here; again, this is
517 overly conservative. */
518 if (dest_death == 0
519 && (dest_death = find_regno_note (q, REG_DEAD, dregno)) != 0)
521 if (GET_MODE (XEXP (dest_death, 0)) != GET_MODE (dest))
522 failed = 1, dest_death = 0;
523 else
524 remove_note (q, dest_death);
528 if (! failed)
530 /* These counters need to be updated if and only if we are
531 going to move the REG_DEAD note. */
532 if (sregno >= FIRST_PSEUDO_REGISTER)
534 if (REG_LIVE_LENGTH (sregno) >= 0)
536 REG_LIVE_LENGTH (sregno) -= s_length;
537 /* REG_LIVE_LENGTH is only an approximation after
538 combine if sched is not run, so make sure that we
539 still have a reasonable value. */
540 if (REG_LIVE_LENGTH (sregno) < 2)
541 REG_LIVE_LENGTH (sregno) = 2;
544 REG_N_CALLS_CROSSED (sregno) -= s_n_calls;
547 /* Move death note of SRC from P to INSN. */
548 remove_note (p, note);
549 XEXP (note, 1) = REG_NOTES (insn);
550 REG_NOTES (insn) = note;
553 /* DEST is also dead if INSN has a REG_UNUSED note for DEST. */
554 if (! dest_death
555 && (dest_death = find_regno_note (insn, REG_UNUSED, dregno)))
557 PUT_REG_NOTE_KIND (dest_death, REG_DEAD);
558 remove_note (insn, dest_death);
561 /* Put death note of DEST on P if we saw it die. */
562 if (dest_death)
564 XEXP (dest_death, 1) = REG_NOTES (p);
565 REG_NOTES (p) = dest_death;
567 if (dregno >= FIRST_PSEUDO_REGISTER)
569 /* If and only if we are moving the death note for DREGNO,
570 then we need to update its counters. */
571 if (REG_LIVE_LENGTH (dregno) >= 0)
572 REG_LIVE_LENGTH (dregno) += d_length;
573 REG_N_CALLS_CROSSED (dregno) += d_n_calls;
577 return ! failed;
580 /* If SRC is a hard register which is set or killed in some other
581 way, we can't do this optimization. */
582 else if (sregno < FIRST_PSEUDO_REGISTER
583 && dead_or_set_p (p, src))
584 break;
586 return 0;
589 /* INSN is a copy of SRC to DEST, in which SRC dies. See if we now have
590 a sequence of insns that modify DEST followed by an insn that sets
591 SRC to DEST in which DEST dies, with no prior modification of DEST.
592 (There is no need to check if the insns in between actually modify
593 DEST. We should not have cases where DEST is not modified, but
594 the optimization is safe if no such modification is detected.)
595 In that case, we can replace all uses of DEST, starting with INSN and
596 ending with the set of SRC to DEST, with SRC. We do not do this
597 optimization if a CALL_INSN is crossed unless SRC already crosses a
598 call or if DEST dies before the copy back to SRC.
600 It is assumed that DEST and SRC are pseudos; it is too complicated to do
601 this for hard registers since the substitutions we may make might fail. */
603 static void
604 optimize_reg_copy_2 (insn, dest, src)
605 rtx insn;
606 rtx dest;
607 rtx src;
609 rtx p, q;
610 rtx set;
611 int sregno = REGNO (src);
612 int dregno = REGNO (dest);
614 for (p = NEXT_INSN (insn); p; p = NEXT_INSN (p))
616 /* ??? We can't scan past the end of a basic block without updating
617 the register lifetime info (REG_DEAD/basic_block_live_at_start). */
618 if (perhaps_ends_bb_p (p))
619 break;
620 else if (! INSN_P (p))
621 continue;
623 set = single_set (p);
624 if (set && SET_SRC (set) == dest && SET_DEST (set) == src
625 && find_reg_note (p, REG_DEAD, dest))
627 /* We can do the optimization. Scan forward from INSN again,
628 replacing regs as we go. */
630 /* Set to stop at next insn. */
631 for (q = insn; q != NEXT_INSN (p); q = NEXT_INSN (q))
632 if (INSN_P (q))
634 if (reg_mentioned_p (dest, PATTERN (q)))
635 PATTERN (q) = replace_rtx (PATTERN (q), dest, src);
638 if (GET_CODE (q) == CALL_INSN)
640 REG_N_CALLS_CROSSED (dregno)--;
641 REG_N_CALLS_CROSSED (sregno)++;
645 remove_note (p, find_reg_note (p, REG_DEAD, dest));
646 REG_N_DEATHS (dregno)--;
647 remove_note (insn, find_reg_note (insn, REG_DEAD, src));
648 REG_N_DEATHS (sregno)--;
649 return;
652 if (reg_set_p (src, p)
653 || find_reg_note (p, REG_DEAD, dest)
654 || (GET_CODE (p) == CALL_INSN && REG_N_CALLS_CROSSED (sregno) == 0))
655 break;
658 /* INSN is a ZERO_EXTEND or SIGN_EXTEND of SRC to DEST.
659 Look if SRC dies there, and if it is only set once, by loading
660 it from memory. If so, try to incorporate the zero/sign extension
661 into the memory read, change SRC to the mode of DEST, and alter
662 the remaining accesses to use the appropriate SUBREG. This allows
663 SRC and DEST to be tied later. */
664 static void
665 optimize_reg_copy_3 (insn, dest, src)
666 rtx insn;
667 rtx dest;
668 rtx src;
670 rtx src_reg = XEXP (src, 0);
671 int src_no = REGNO (src_reg);
672 int dst_no = REGNO (dest);
673 rtx p, set, subreg;
674 enum machine_mode old_mode;
676 if (src_no < FIRST_PSEUDO_REGISTER
677 || dst_no < FIRST_PSEUDO_REGISTER
678 || ! find_reg_note (insn, REG_DEAD, src_reg)
679 || REG_N_DEATHS (src_no) != 1
680 || REG_N_SETS (src_no) != 1)
681 return;
682 for (p = PREV_INSN (insn); p && ! reg_set_p (src_reg, p); p = PREV_INSN (p))
683 /* ??? We can't scan past the end of a basic block without updating
684 the register lifetime info (REG_DEAD/basic_block_live_at_start). */
685 if (perhaps_ends_bb_p (p))
686 break;
688 if (! p)
689 return;
691 if (! (set = single_set (p))
692 || GET_CODE (SET_SRC (set)) != MEM
693 /* If there's a REG_EQUIV note, this must be an insn that loads an
694 argument. Prefer keeping the note over doing this optimization. */
695 || find_reg_note (p, REG_EQUIV, NULL_RTX)
696 || SET_DEST (set) != src_reg)
697 return;
699 /* Be conservative: although this optimization is also valid for
700 volatile memory references, that could cause trouble in later passes. */
701 if (MEM_VOLATILE_P (SET_SRC (set)))
702 return;
704 /* Do not use a SUBREG to truncate from one mode to another if truncation
705 is not a nop. */
706 if (GET_MODE_BITSIZE (GET_MODE (src_reg)) <= GET_MODE_BITSIZE (GET_MODE (src))
707 && !TRULY_NOOP_TRUNCATION (GET_MODE_BITSIZE (GET_MODE (src)),
708 GET_MODE_BITSIZE (GET_MODE (src_reg))))
709 return;
711 old_mode = GET_MODE (src_reg);
712 PUT_MODE (src_reg, GET_MODE (src));
713 XEXP (src, 0) = SET_SRC (set);
715 /* Include this change in the group so that it's easily undone if
716 one of the changes in the group is invalid. */
717 validate_change (p, &SET_SRC (set), src, 1);
719 /* Now walk forward making additional replacements. We want to be able
720 to undo all the changes if a later substitution fails. */
721 subreg = gen_lowpart_SUBREG (old_mode, src_reg);
722 while (p = NEXT_INSN (p), p != insn)
724 if (! INSN_P (p))
725 continue;
727 /* Make a tenative change. */
728 validate_replace_rtx_group (src_reg, subreg, p);
731 validate_replace_rtx_group (src, src_reg, insn);
733 /* Now see if all the changes are valid. */
734 if (! apply_change_group ())
736 /* One or more changes were no good. Back out everything. */
737 PUT_MODE (src_reg, old_mode);
738 XEXP (src, 0) = src_reg;
740 else
742 rtx note = find_reg_note (p, REG_EQUAL, NULL_RTX);
743 if (note)
744 remove_note (p, note);
749 /* If we were not able to update the users of src to use dest directly, try
750 instead moving the value to dest directly before the operation. */
752 static void
753 copy_src_to_dest (insn, src, dest, old_max_uid)
754 rtx insn;
755 rtx src;
756 rtx dest;
757 int old_max_uid;
759 rtx seq;
760 rtx link;
761 rtx next;
762 rtx set;
763 rtx move_insn;
764 rtx *p_insn_notes;
765 rtx *p_move_notes;
766 int src_regno;
767 int dest_regno;
768 int bb;
769 int insn_uid;
770 int move_uid;
772 /* A REG_LIVE_LENGTH of -1 indicates the register is equivalent to a constant
773 or memory location and is used infrequently; a REG_LIVE_LENGTH of -2 is
774 parameter when there is no frame pointer that is not allocated a register.
775 For now, we just reject them, rather than incrementing the live length. */
777 if (GET_CODE (src) == REG
778 && REG_LIVE_LENGTH (REGNO (src)) > 0
779 && GET_CODE (dest) == REG
780 && !RTX_UNCHANGING_P (dest)
781 && REG_LIVE_LENGTH (REGNO (dest)) > 0
782 && (set = single_set (insn)) != NULL_RTX
783 && !reg_mentioned_p (dest, SET_SRC (set))
784 && GET_MODE (src) == GET_MODE (dest))
786 int old_num_regs = reg_rtx_no;
788 /* Generate the src->dest move. */
789 start_sequence ();
790 emit_move_insn (dest, src);
791 seq = get_insns ();
792 end_sequence ();
793 /* If this sequence uses new registers, we may not use it. */
794 if (old_num_regs != reg_rtx_no
795 || ! validate_replace_rtx (src, dest, insn))
797 /* We have to restore reg_rtx_no to its old value, lest
798 recompute_reg_usage will try to compute the usage of the
799 new regs, yet reg_n_info is not valid for them. */
800 reg_rtx_no = old_num_regs;
801 return;
803 emit_insn_before (seq, insn);
804 move_insn = PREV_INSN (insn);
805 p_move_notes = &REG_NOTES (move_insn);
806 p_insn_notes = &REG_NOTES (insn);
808 /* Move any notes mentioning src to the move instruction. */
809 for (link = REG_NOTES (insn); link != NULL_RTX; link = next)
811 next = XEXP (link, 1);
812 if (XEXP (link, 0) == src)
814 *p_move_notes = link;
815 p_move_notes = &XEXP (link, 1);
817 else
819 *p_insn_notes = link;
820 p_insn_notes = &XEXP (link, 1);
824 *p_move_notes = NULL_RTX;
825 *p_insn_notes = NULL_RTX;
827 /* Is the insn the head of a basic block? If so extend it. */
828 insn_uid = INSN_UID (insn);
829 move_uid = INSN_UID (move_insn);
830 if (insn_uid < old_max_uid)
832 bb = regmove_bb_head[insn_uid];
833 if (bb >= 0)
835 BLOCK_HEAD (bb) = move_insn;
836 regmove_bb_head[insn_uid] = -1;
840 /* Update the various register tables. */
841 dest_regno = REGNO (dest);
842 REG_N_SETS (dest_regno) ++;
843 REG_LIVE_LENGTH (dest_regno)++;
844 if (REGNO_FIRST_UID (dest_regno) == insn_uid)
845 REGNO_FIRST_UID (dest_regno) = move_uid;
847 src_regno = REGNO (src);
848 if (! find_reg_note (move_insn, REG_DEAD, src))
849 REG_LIVE_LENGTH (src_regno)++;
851 if (REGNO_FIRST_UID (src_regno) == insn_uid)
852 REGNO_FIRST_UID (src_regno) = move_uid;
854 if (REGNO_LAST_UID (src_regno) == insn_uid)
855 REGNO_LAST_UID (src_regno) = move_uid;
857 if (REGNO_LAST_NOTE_UID (src_regno) == insn_uid)
858 REGNO_LAST_NOTE_UID (src_regno) = move_uid;
863 /* Return whether REG is set in only one location, and is set to a
864 constant, but is set in a different basic block from INSN (an
865 instructions which uses REG). In this case REG is equivalent to a
866 constant, and we don't want to break that equivalence, because that
867 may increase register pressure and make reload harder. If REG is
868 set in the same basic block as INSN, we don't worry about it,
869 because we'll probably need a register anyhow (??? but what if REG
870 is used in a different basic block as well as this one?). FIRST is
871 the first insn in the function. */
873 static int
874 reg_is_remote_constant_p (reg, insn, first)
875 rtx reg;
876 rtx insn;
877 rtx first;
879 rtx p;
881 if (REG_N_SETS (REGNO (reg)) != 1)
882 return 0;
884 /* Look for the set. */
885 for (p = LOG_LINKS (insn); p; p = XEXP (p, 1))
887 rtx s;
889 if (REG_NOTE_KIND (p) != 0)
890 continue;
891 s = single_set (XEXP (p, 0));
892 if (s != 0
893 && GET_CODE (SET_DEST (s)) == REG
894 && REGNO (SET_DEST (s)) == REGNO (reg))
896 /* The register is set in the same basic block. */
897 return 0;
901 for (p = first; p && p != insn; p = NEXT_INSN (p))
903 rtx s;
905 if (! INSN_P (p))
906 continue;
907 s = single_set (p);
908 if (s != 0
909 && GET_CODE (SET_DEST (s)) == REG
910 && REGNO (SET_DEST (s)) == REGNO (reg))
912 /* This is the instruction which sets REG. If there is a
913 REG_EQUAL note, then REG is equivalent to a constant. */
914 if (find_reg_note (p, REG_EQUAL, NULL_RTX))
915 return 1;
916 return 0;
920 return 0;
923 /* INSN is adding a CONST_INT to a REG. We search backwards looking for
924 another add immediate instruction with the same source and dest registers,
925 and if we find one, we change INSN to an increment, and return 1. If
926 no changes are made, we return 0.
928 This changes
929 (set (reg100) (plus reg1 offset1))
931 (set (reg100) (plus reg1 offset2))
933 (set (reg100) (plus reg1 offset1))
935 (set (reg100) (plus reg100 offset2-offset1)) */
937 /* ??? What does this comment mean? */
938 /* cse disrupts preincrement / postdecrement sequences when it finds a
939 hard register as ultimate source, like the frame pointer. */
941 static int
942 fixup_match_2 (insn, dst, src, offset, regmove_dump_file)
943 rtx insn, dst, src, offset;
944 FILE *regmove_dump_file;
946 rtx p, dst_death = 0;
947 int length, num_calls = 0;
949 /* If SRC dies in INSN, we'd have to move the death note. This is
950 considered to be very unlikely, so we just skip the optimization
951 in this case. */
952 if (find_regno_note (insn, REG_DEAD, REGNO (src)))
953 return 0;
955 /* Scan backward to find the first instruction that sets DST. */
957 for (length = 0, p = PREV_INSN (insn); p; p = PREV_INSN (p))
959 rtx pset;
961 /* ??? We can't scan past the end of a basic block without updating
962 the register lifetime info (REG_DEAD/basic_block_live_at_start). */
963 if (perhaps_ends_bb_p (p))
964 break;
965 else if (! INSN_P (p))
966 continue;
968 if (find_regno_note (p, REG_DEAD, REGNO (dst)))
969 dst_death = p;
970 if (! dst_death)
971 length++;
973 pset = single_set (p);
974 if (pset && SET_DEST (pset) == dst
975 && GET_CODE (SET_SRC (pset)) == PLUS
976 && XEXP (SET_SRC (pset), 0) == src
977 && GET_CODE (XEXP (SET_SRC (pset), 1)) == CONST_INT)
979 HOST_WIDE_INT newconst
980 = INTVAL (offset) - INTVAL (XEXP (SET_SRC (pset), 1));
981 rtx add = gen_add3_insn (dst, dst, GEN_INT (newconst));
983 if (add && validate_change (insn, &PATTERN (insn), add, 0))
985 /* Remove the death note for DST from DST_DEATH. */
986 if (dst_death)
988 remove_death (REGNO (dst), dst_death);
989 REG_LIVE_LENGTH (REGNO (dst)) += length;
990 REG_N_CALLS_CROSSED (REGNO (dst)) += num_calls;
993 if (regmove_dump_file)
994 fprintf (regmove_dump_file,
995 "Fixed operand of insn %d.\n",
996 INSN_UID (insn));
998 #ifdef AUTO_INC_DEC
999 for (p = PREV_INSN (insn); p; p = PREV_INSN (p))
1001 if (GET_CODE (p) == CODE_LABEL
1002 || GET_CODE (p) == JUMP_INSN)
1003 break;
1004 if (! INSN_P (p))
1005 continue;
1006 if (reg_overlap_mentioned_p (dst, PATTERN (p)))
1008 if (try_auto_increment (p, insn, 0, dst, newconst, 0))
1009 return 1;
1010 break;
1013 for (p = NEXT_INSN (insn); p; p = NEXT_INSN (p))
1015 if (GET_CODE (p) == CODE_LABEL
1016 || GET_CODE (p) == JUMP_INSN)
1017 break;
1018 if (! INSN_P (p))
1019 continue;
1020 if (reg_overlap_mentioned_p (dst, PATTERN (p)))
1022 try_auto_increment (p, insn, 0, dst, newconst, 1);
1023 break;
1026 #endif
1027 return 1;
1031 if (reg_set_p (dst, PATTERN (p)))
1032 break;
1034 /* If we have passed a call instruction, and the
1035 pseudo-reg SRC is not already live across a call,
1036 then don't perform the optimization. */
1037 /* reg_set_p is overly conservative for CALL_INSNS, thinks that all
1038 hard regs are clobbered. Thus, we only use it for src for
1039 non-call insns. */
1040 if (GET_CODE (p) == CALL_INSN)
1042 if (! dst_death)
1043 num_calls++;
1045 if (REG_N_CALLS_CROSSED (REGNO (src)) == 0)
1046 break;
1048 if (call_used_regs [REGNO (dst)]
1049 || find_reg_fusage (p, CLOBBER, dst))
1050 break;
1052 else if (reg_set_p (src, PATTERN (p)))
1053 break;
1056 return 0;
1059 /* Main entry for the register move optimization.
1060 F is the first instruction.
1061 NREGS is one plus the highest pseudo-reg number used in the instruction.
1062 REGMOVE_DUMP_FILE is a stream for output of a trace of actions taken
1063 (or 0 if none should be output). */
1065 void
1066 regmove_optimize (f, nregs, regmove_dump_file)
1067 rtx f;
1068 int nregs;
1069 FILE *regmove_dump_file;
1071 int old_max_uid = get_max_uid ();
1072 rtx insn;
1073 struct match match;
1074 int pass;
1075 int i;
1076 rtx copy_src, copy_dst;
1077 basic_block bb;
1079 /* ??? Hack. Regmove doesn't examine the CFG, and gets mightily
1080 confused by non-call exceptions ending blocks. */
1081 if (flag_non_call_exceptions)
1082 return;
1084 /* Find out where a potential flags register is live, and so that we
1085 can suppress some optimizations in those zones. */
1086 mark_flags_life_zones (discover_flags_reg ());
1088 regno_src_regno = (int *) xmalloc (sizeof *regno_src_regno * nregs);
1089 for (i = nregs; --i >= 0; ) regno_src_regno[i] = -1;
1091 regmove_bb_head = (int *) xmalloc (sizeof (int) * (old_max_uid + 1));
1092 for (i = old_max_uid; i >= 0; i--) regmove_bb_head[i] = -1;
1093 FOR_EACH_BB (bb)
1094 regmove_bb_head[INSN_UID (bb->head)] = bb->index;
1096 /* A forward/backward pass. Replace output operands with input operands. */
1098 for (pass = 0; pass <= 2; pass++)
1100 if (! flag_regmove && pass >= flag_expensive_optimizations)
1101 goto done;
1103 if (regmove_dump_file)
1104 fprintf (regmove_dump_file, "Starting %s pass...\n",
1105 pass ? "backward" : "forward");
1107 for (insn = pass ? get_last_insn () : f; insn;
1108 insn = pass ? PREV_INSN (insn) : NEXT_INSN (insn))
1110 rtx set;
1111 int op_no, match_no;
1113 set = single_set (insn);
1114 if (! set)
1115 continue;
1117 if (flag_expensive_optimizations && ! pass
1118 && (GET_CODE (SET_SRC (set)) == SIGN_EXTEND
1119 || GET_CODE (SET_SRC (set)) == ZERO_EXTEND)
1120 && GET_CODE (XEXP (SET_SRC (set), 0)) == REG
1121 && GET_CODE (SET_DEST (set)) == REG)
1122 optimize_reg_copy_3 (insn, SET_DEST (set), SET_SRC (set));
1124 if (flag_expensive_optimizations && ! pass
1125 && GET_CODE (SET_SRC (set)) == REG
1126 && GET_CODE (SET_DEST (set)) == REG)
1128 /* If this is a register-register copy where SRC is not dead,
1129 see if we can optimize it. If this optimization succeeds,
1130 it will become a copy where SRC is dead. */
1131 if ((find_reg_note (insn, REG_DEAD, SET_SRC (set))
1132 || optimize_reg_copy_1 (insn, SET_DEST (set), SET_SRC (set)))
1133 && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
1135 /* Similarly for a pseudo-pseudo copy when SRC is dead. */
1136 if (REGNO (SET_SRC (set)) >= FIRST_PSEUDO_REGISTER)
1137 optimize_reg_copy_2 (insn, SET_DEST (set), SET_SRC (set));
1138 if (regno_src_regno[REGNO (SET_DEST (set))] < 0
1139 && SET_SRC (set) != SET_DEST (set))
1141 int srcregno = REGNO (SET_SRC (set));
1142 if (regno_src_regno[srcregno] >= 0)
1143 srcregno = regno_src_regno[srcregno];
1144 regno_src_regno[REGNO (SET_DEST (set))] = srcregno;
1148 if (! flag_regmove)
1149 continue;
1151 if (! find_matches (insn, &match))
1152 continue;
1154 /* Now scan through the operands looking for a source operand
1155 which is supposed to match the destination operand.
1156 Then scan forward for an instruction which uses the dest
1157 operand.
1158 If it dies there, then replace the dest in both operands with
1159 the source operand. */
1161 for (op_no = 0; op_no < recog_data.n_operands; op_no++)
1163 rtx src, dst, src_subreg;
1164 enum reg_class src_class, dst_class;
1166 match_no = match.with[op_no];
1168 /* Nothing to do if the two operands aren't supposed to match. */
1169 if (match_no < 0)
1170 continue;
1172 src = recog_data.operand[op_no];
1173 dst = recog_data.operand[match_no];
1175 if (GET_CODE (src) != REG)
1176 continue;
1178 src_subreg = src;
1179 if (GET_CODE (dst) == SUBREG
1180 && GET_MODE_SIZE (GET_MODE (dst))
1181 >= GET_MODE_SIZE (GET_MODE (SUBREG_REG (dst))))
1183 src_subreg
1184 = gen_rtx_SUBREG (GET_MODE (SUBREG_REG (dst)),
1185 src, SUBREG_BYTE (dst));
1186 dst = SUBREG_REG (dst);
1188 if (GET_CODE (dst) != REG
1189 || REGNO (dst) < FIRST_PSEUDO_REGISTER)
1190 continue;
1192 if (REGNO (src) < FIRST_PSEUDO_REGISTER)
1194 if (match.commutative[op_no] < op_no)
1195 regno_src_regno[REGNO (dst)] = REGNO (src);
1196 continue;
1199 if (REG_LIVE_LENGTH (REGNO (src)) < 0)
1200 continue;
1202 /* op_no/src must be a read-only operand, and
1203 match_operand/dst must be a write-only operand. */
1204 if (match.use[op_no] != READ
1205 || match.use[match_no] != WRITE)
1206 continue;
1208 if (match.early_clobber[match_no]
1209 && count_occurrences (PATTERN (insn), src, 0) > 1)
1210 continue;
1212 /* Make sure match_operand is the destination. */
1213 if (recog_data.operand[match_no] != SET_DEST (set))
1214 continue;
1216 /* If the operands already match, then there is nothing to do. */
1217 if (operands_match_p (src, dst))
1218 continue;
1220 /* But in the commutative case, we might find a better match. */
1221 if (match.commutative[op_no] >= 0)
1223 rtx comm = recog_data.operand[match.commutative[op_no]];
1224 if (operands_match_p (comm, dst)
1225 && (replacement_quality (comm)
1226 >= replacement_quality (src)))
1227 continue;
1230 src_class = reg_preferred_class (REGNO (src));
1231 dst_class = reg_preferred_class (REGNO (dst));
1232 if (! regclass_compatible_p (src_class, dst_class))
1233 continue;
1235 if (GET_MODE (src) != GET_MODE (dst))
1236 continue;
1238 if (fixup_match_1 (insn, set, src, src_subreg, dst, pass,
1239 op_no, match_no,
1240 regmove_dump_file))
1241 break;
1246 /* A backward pass. Replace input operands with output operands. */
1248 if (regmove_dump_file)
1249 fprintf (regmove_dump_file, "Starting backward pass...\n");
1251 for (insn = get_last_insn (); insn; insn = PREV_INSN (insn))
1253 if (INSN_P (insn))
1255 int op_no, match_no;
1256 int success = 0;
1258 if (! find_matches (insn, &match))
1259 continue;
1261 /* Now scan through the operands looking for a destination operand
1262 which is supposed to match a source operand.
1263 Then scan backward for an instruction which sets the source
1264 operand. If safe, then replace the source operand with the
1265 dest operand in both instructions. */
1267 copy_src = NULL_RTX;
1268 copy_dst = NULL_RTX;
1269 for (op_no = 0; op_no < recog_data.n_operands; op_no++)
1271 rtx set, p, src, dst;
1272 rtx src_note, dst_note;
1273 int num_calls = 0;
1274 enum reg_class src_class, dst_class;
1275 int length;
1277 match_no = match.with[op_no];
1279 /* Nothing to do if the two operands aren't supposed to match. */
1280 if (match_no < 0)
1281 continue;
1283 dst = recog_data.operand[match_no];
1284 src = recog_data.operand[op_no];
1286 if (GET_CODE (src) != REG)
1287 continue;
1289 if (GET_CODE (dst) != REG
1290 || REGNO (dst) < FIRST_PSEUDO_REGISTER
1291 || REG_LIVE_LENGTH (REGNO (dst)) < 0
1292 || RTX_UNCHANGING_P (dst))
1293 continue;
1295 /* If the operands already match, then there is nothing to do. */
1296 if (operands_match_p (src, dst))
1297 continue;
1299 if (match.commutative[op_no] >= 0)
1301 rtx comm = recog_data.operand[match.commutative[op_no]];
1302 if (operands_match_p (comm, dst))
1303 continue;
1306 set = single_set (insn);
1307 if (! set)
1308 continue;
1310 /* Note that single_set ignores parts of a parallel set for
1311 which one of the destinations is REG_UNUSED. We can't
1312 handle that here, since we can wind up rewriting things
1313 such that a single register is set twice within a single
1314 parallel. */
1315 if (reg_set_p (src, insn))
1316 continue;
1318 /* match_no/dst must be a write-only operand, and
1319 operand_operand/src must be a read-only operand. */
1320 if (match.use[op_no] != READ
1321 || match.use[match_no] != WRITE)
1322 continue;
1324 if (match.early_clobber[match_no]
1325 && count_occurrences (PATTERN (insn), src, 0) > 1)
1326 continue;
1328 /* Make sure match_no is the destination. */
1329 if (recog_data.operand[match_no] != SET_DEST (set))
1330 continue;
1332 if (REGNO (src) < FIRST_PSEUDO_REGISTER)
1334 if (GET_CODE (SET_SRC (set)) == PLUS
1335 && GET_CODE (XEXP (SET_SRC (set), 1)) == CONST_INT
1336 && XEXP (SET_SRC (set), 0) == src
1337 && fixup_match_2 (insn, dst, src,
1338 XEXP (SET_SRC (set), 1),
1339 regmove_dump_file))
1340 break;
1341 continue;
1343 src_class = reg_preferred_class (REGNO (src));
1344 dst_class = reg_preferred_class (REGNO (dst));
1346 if (! (src_note = find_reg_note (insn, REG_DEAD, src)))
1348 /* We used to force the copy here like in other cases, but
1349 it produces worse code, as it eliminates no copy
1350 instructions and the copy emitted will be produced by
1351 reload anyway. On patterns with multiple alternatives,
1352 there may be better solution available.
1354 In particular this change produced slower code for numeric
1355 i387 programs. */
1357 continue;
1360 if (! regclass_compatible_p (src_class, dst_class))
1362 if (!copy_src)
1364 copy_src = src;
1365 copy_dst = dst;
1367 continue;
1370 /* Can not modify an earlier insn to set dst if this insn
1371 uses an old value in the source. */
1372 if (reg_overlap_mentioned_p (dst, SET_SRC (set)))
1374 if (!copy_src)
1376 copy_src = src;
1377 copy_dst = dst;
1379 continue;
1382 /* If src is set once in a different basic block,
1383 and is set equal to a constant, then do not use
1384 it for this optimization, as this would make it
1385 no longer equivalent to a constant. */
1387 if (reg_is_remote_constant_p (src, insn, f))
1389 if (!copy_src)
1391 copy_src = src;
1392 copy_dst = dst;
1394 continue;
1398 if (regmove_dump_file)
1399 fprintf (regmove_dump_file,
1400 "Could fix operand %d of insn %d matching operand %d.\n",
1401 op_no, INSN_UID (insn), match_no);
1403 /* Scan backward to find the first instruction that uses
1404 the input operand. If the operand is set here, then
1405 replace it in both instructions with match_no. */
1407 for (length = 0, p = PREV_INSN (insn); p; p = PREV_INSN (p))
1409 rtx pset;
1411 /* ??? We can't scan past the end of a basic block without
1412 updating the register lifetime info
1413 (REG_DEAD/basic_block_live_at_start). */
1414 if (perhaps_ends_bb_p (p))
1415 break;
1416 else if (! INSN_P (p))
1417 continue;
1419 length++;
1421 /* ??? See if all of SRC is set in P. This test is much
1422 more conservative than it needs to be. */
1423 pset = single_set (p);
1424 if (pset && SET_DEST (pset) == src)
1426 /* We use validate_replace_rtx, in case there
1427 are multiple identical source operands. All of
1428 them have to be changed at the same time. */
1429 if (validate_replace_rtx (src, dst, insn))
1431 if (validate_change (p, &SET_DEST (pset),
1432 dst, 0))
1433 success = 1;
1434 else
1436 /* Change all source operands back.
1437 This modifies the dst as a side-effect. */
1438 validate_replace_rtx (dst, src, insn);
1439 /* Now make sure the dst is right. */
1440 validate_change (insn,
1441 recog_data.operand_loc[match_no],
1442 dst, 0);
1445 break;
1448 if (reg_overlap_mentioned_p (src, PATTERN (p))
1449 || reg_overlap_mentioned_p (dst, PATTERN (p)))
1450 break;
1452 /* If we have passed a call instruction, and the
1453 pseudo-reg DST is not already live across a call,
1454 then don't perform the optimization. */
1455 if (GET_CODE (p) == CALL_INSN)
1457 num_calls++;
1459 if (REG_N_CALLS_CROSSED (REGNO (dst)) == 0)
1460 break;
1464 if (success)
1466 int dstno, srcno;
1468 /* Remove the death note for SRC from INSN. */
1469 remove_note (insn, src_note);
1470 /* Move the death note for SRC to P if it is used
1471 there. */
1472 if (reg_overlap_mentioned_p (src, PATTERN (p)))
1474 XEXP (src_note, 1) = REG_NOTES (p);
1475 REG_NOTES (p) = src_note;
1477 /* If there is a REG_DEAD note for DST on P, then remove
1478 it, because DST is now set there. */
1479 if ((dst_note = find_reg_note (p, REG_DEAD, dst)))
1480 remove_note (p, dst_note);
1482 dstno = REGNO (dst);
1483 srcno = REGNO (src);
1485 REG_N_SETS (dstno)++;
1486 REG_N_SETS (srcno)--;
1488 REG_N_CALLS_CROSSED (dstno) += num_calls;
1489 REG_N_CALLS_CROSSED (srcno) -= num_calls;
1491 REG_LIVE_LENGTH (dstno) += length;
1492 if (REG_LIVE_LENGTH (srcno) >= 0)
1494 REG_LIVE_LENGTH (srcno) -= length;
1495 /* REG_LIVE_LENGTH is only an approximation after
1496 combine if sched is not run, so make sure that we
1497 still have a reasonable value. */
1498 if (REG_LIVE_LENGTH (srcno) < 2)
1499 REG_LIVE_LENGTH (srcno) = 2;
1502 if (regmove_dump_file)
1503 fprintf (regmove_dump_file,
1504 "Fixed operand %d of insn %d matching operand %d.\n",
1505 op_no, INSN_UID (insn), match_no);
1507 break;
1511 /* If we weren't able to replace any of the alternatives, try an
1512 alternative approach of copying the source to the destination. */
1513 if (!success && copy_src != NULL_RTX)
1514 copy_src_to_dest (insn, copy_src, copy_dst, old_max_uid);
1519 /* In fixup_match_1, some insns may have been inserted after basic block
1520 ends. Fix that here. */
1521 FOR_EACH_BB (bb)
1523 rtx end = bb->end;
1524 rtx new = end;
1525 rtx next = NEXT_INSN (new);
1526 while (next != 0 && INSN_UID (next) >= old_max_uid
1527 && (bb->next_bb == EXIT_BLOCK_PTR || bb->next_bb->head != next))
1528 new = next, next = NEXT_INSN (new);
1529 bb->end = new;
1532 done:
1533 /* Clean up. */
1534 free (regno_src_regno);
1535 free (regmove_bb_head);
1538 /* Returns nonzero if INSN's pattern has matching constraints for any operand.
1539 Returns 0 if INSN can't be recognized, or if the alternative can't be
1540 determined.
1542 Initialize the info in MATCHP based on the constraints. */
1544 static int
1545 find_matches (insn, matchp)
1546 rtx insn;
1547 struct match *matchp;
1549 int likely_spilled[MAX_RECOG_OPERANDS];
1550 int op_no;
1551 int any_matches = 0;
1553 extract_insn (insn);
1554 if (! constrain_operands (0))
1555 return 0;
1557 /* Must initialize this before main loop, because the code for
1558 the commutative case may set matches for operands other than
1559 the current one. */
1560 for (op_no = recog_data.n_operands; --op_no >= 0; )
1561 matchp->with[op_no] = matchp->commutative[op_no] = -1;
1563 for (op_no = 0; op_no < recog_data.n_operands; op_no++)
1565 const char *p;
1566 char c;
1567 int i = 0;
1569 p = recog_data.constraints[op_no];
1571 likely_spilled[op_no] = 0;
1572 matchp->use[op_no] = READ;
1573 matchp->early_clobber[op_no] = 0;
1574 if (*p == '=')
1575 matchp->use[op_no] = WRITE;
1576 else if (*p == '+')
1577 matchp->use[op_no] = READWRITE;
1579 for (;*p && i < which_alternative; p++)
1580 if (*p == ',')
1581 i++;
1583 while ((c = *p) != '\0' && c != ',')
1585 switch (c)
1587 case '=':
1588 break;
1589 case '+':
1590 break;
1591 case '&':
1592 matchp->early_clobber[op_no] = 1;
1593 break;
1594 case '%':
1595 matchp->commutative[op_no] = op_no + 1;
1596 matchp->commutative[op_no + 1] = op_no;
1597 break;
1599 case '0': case '1': case '2': case '3': case '4':
1600 case '5': case '6': case '7': case '8': case '9':
1602 char *end;
1603 unsigned long match_ul = strtoul (p, &end, 10);
1604 int match = match_ul;
1606 p = end;
1608 if (match < op_no && likely_spilled[match])
1609 continue;
1610 matchp->with[op_no] = match;
1611 any_matches = 1;
1612 if (matchp->commutative[op_no] >= 0)
1613 matchp->with[matchp->commutative[op_no]] = match;
1615 continue;
1617 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f': case 'h':
1618 case 'j': case 'k': case 'l': case 'p': case 'q': case 't': case 'u':
1619 case 'v': case 'w': case 'x': case 'y': case 'z': case 'A': case 'B':
1620 case 'C': case 'D': case 'W': case 'Y': case 'Z':
1621 if (CLASS_LIKELY_SPILLED_P (REG_CLASS_FROM_CONSTRAINT ((unsigned char) c, p) ))
1622 likely_spilled[op_no] = 1;
1623 break;
1625 p += CONSTRAINT_LEN (c, p);
1628 return any_matches;
1631 /* Try to replace all occurrences of DST_REG with SRC in LOC, that is
1632 assumed to be in INSN. */
1634 static void
1635 replace_in_call_usage (loc, dst_reg, src, insn)
1636 rtx *loc;
1637 unsigned int dst_reg;
1638 rtx src;
1639 rtx insn;
1641 rtx x = *loc;
1642 enum rtx_code code;
1643 const char *fmt;
1644 int i, j;
1646 if (! x)
1647 return;
1649 code = GET_CODE (x);
1650 if (code == REG)
1652 if (REGNO (x) != dst_reg)
1653 return;
1655 validate_change (insn, loc, src, 1);
1657 return;
1660 /* Process each of our operands recursively. */
1661 fmt = GET_RTX_FORMAT (code);
1662 for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
1663 if (*fmt == 'e')
1664 replace_in_call_usage (&XEXP (x, i), dst_reg, src, insn);
1665 else if (*fmt == 'E')
1666 for (j = 0; j < XVECLEN (x, i); j++)
1667 replace_in_call_usage (& XVECEXP (x, i, j), dst_reg, src, insn);
1670 /* Try to replace output operand DST in SET, with input operand SRC. SET is
1671 the only set in INSN. INSN has just been recognized and constrained.
1672 SRC is operand number OPERAND_NUMBER in INSN.
1673 DST is operand number MATCH_NUMBER in INSN.
1674 If BACKWARD is nonzero, we have been called in a backward pass.
1675 Return nonzero for success. */
1677 static int
1678 fixup_match_1 (insn, set, src, src_subreg, dst, backward, operand_number,
1679 match_number, regmove_dump_file)
1680 rtx insn, set, src, src_subreg, dst;
1681 int backward, operand_number, match_number;
1682 FILE *regmove_dump_file;
1684 rtx p;
1685 rtx post_inc = 0, post_inc_set = 0, search_end = 0;
1686 int success = 0;
1687 int num_calls = 0, s_num_calls = 0;
1688 enum rtx_code code = NOTE;
1689 HOST_WIDE_INT insn_const = 0, newconst = 0;
1690 rtx overlap = 0; /* need to move insn ? */
1691 rtx src_note = find_reg_note (insn, REG_DEAD, src), dst_note = NULL_RTX;
1692 int length, s_length;
1694 /* If SRC is marked as unchanging, we may not change it.
1695 ??? Maybe we could get better code by removing the unchanging bit
1696 instead, and changing it back if we don't succeed? */
1697 if (RTX_UNCHANGING_P (src))
1698 return 0;
1700 if (! src_note)
1702 /* Look for (set (regX) (op regA constX))
1703 (set (regY) (op regA constY))
1704 and change that to
1705 (set (regA) (op regA constX)).
1706 (set (regY) (op regA constY-constX)).
1707 This works for add and shift operations, if
1708 regA is dead after or set by the second insn. */
1710 code = GET_CODE (SET_SRC (set));
1711 if ((code == PLUS || code == LSHIFTRT
1712 || code == ASHIFT || code == ASHIFTRT)
1713 && XEXP (SET_SRC (set), 0) == src
1714 && GET_CODE (XEXP (SET_SRC (set), 1)) == CONST_INT)
1715 insn_const = INTVAL (XEXP (SET_SRC (set), 1));
1716 else if (! stable_and_no_regs_but_for_p (SET_SRC (set), src, dst))
1717 return 0;
1718 else
1719 /* We might find a src_note while scanning. */
1720 code = NOTE;
1723 if (regmove_dump_file)
1724 fprintf (regmove_dump_file,
1725 "Could fix operand %d of insn %d matching operand %d.\n",
1726 operand_number, INSN_UID (insn), match_number);
1728 /* If SRC is equivalent to a constant set in a different basic block,
1729 then do not use it for this optimization. We want the equivalence
1730 so that if we have to reload this register, we can reload the
1731 constant, rather than extending the lifespan of the register. */
1732 if (reg_is_remote_constant_p (src, insn, get_insns ()))
1733 return 0;
1735 /* Scan forward to find the next instruction that
1736 uses the output operand. If the operand dies here,
1737 then replace it in both instructions with
1738 operand_number. */
1740 for (length = s_length = 0, p = NEXT_INSN (insn); p; p = NEXT_INSN (p))
1742 if (GET_CODE (p) == CALL_INSN)
1743 replace_in_call_usage (& CALL_INSN_FUNCTION_USAGE (p),
1744 REGNO (dst), src, p);
1746 /* ??? We can't scan past the end of a basic block without updating
1747 the register lifetime info (REG_DEAD/basic_block_live_at_start). */
1748 if (perhaps_ends_bb_p (p))
1749 break;
1750 else if (! INSN_P (p))
1751 continue;
1753 length++;
1754 if (src_note)
1755 s_length++;
1757 if (reg_set_p (src, p) || reg_set_p (dst, p)
1758 || (GET_CODE (PATTERN (p)) == USE
1759 && reg_overlap_mentioned_p (src, XEXP (PATTERN (p), 0))))
1760 break;
1762 /* See if all of DST dies in P. This test is
1763 slightly more conservative than it needs to be. */
1764 if ((dst_note = find_regno_note (p, REG_DEAD, REGNO (dst)))
1765 && (GET_MODE (XEXP (dst_note, 0)) == GET_MODE (dst)))
1767 /* If we would be moving INSN, check that we won't move it
1768 into the shadow of a live a live flags register. */
1769 /* ??? We only try to move it in front of P, although
1770 we could move it anywhere between OVERLAP and P. */
1771 if (overlap && GET_MODE (PREV_INSN (p)) != VOIDmode)
1772 break;
1774 if (! src_note)
1776 rtx q;
1777 rtx set2 = NULL_RTX;
1779 /* If an optimization is done, the value of SRC while P
1780 is executed will be changed. Check that this is OK. */
1781 if (reg_overlap_mentioned_p (src, PATTERN (p)))
1782 break;
1783 for (q = p; q; q = NEXT_INSN (q))
1785 /* ??? We can't scan past the end of a basic block without
1786 updating the register lifetime info
1787 (REG_DEAD/basic_block_live_at_start). */
1788 if (perhaps_ends_bb_p (q))
1790 q = 0;
1791 break;
1793 else if (! INSN_P (q))
1794 continue;
1795 else if (reg_overlap_mentioned_p (src, PATTERN (q))
1796 || reg_set_p (src, q))
1797 break;
1799 if (q)
1800 set2 = single_set (q);
1801 if (! q || ! set2 || GET_CODE (SET_SRC (set2)) != code
1802 || XEXP (SET_SRC (set2), 0) != src
1803 || GET_CODE (XEXP (SET_SRC (set2), 1)) != CONST_INT
1804 || (SET_DEST (set2) != src
1805 && ! find_reg_note (q, REG_DEAD, src)))
1807 /* If this is a PLUS, we can still save a register by doing
1808 src += insn_const;
1810 src -= insn_const; .
1811 This also gives opportunities for subsequent
1812 optimizations in the backward pass, so do it there. */
1813 if (code == PLUS && backward
1814 /* Don't do this if we can likely tie DST to SET_DEST
1815 of P later; we can't do this tying here if we got a
1816 hard register. */
1817 && ! (dst_note && ! REG_N_CALLS_CROSSED (REGNO (dst))
1818 && single_set (p)
1819 && GET_CODE (SET_DEST (single_set (p))) == REG
1820 && (REGNO (SET_DEST (single_set (p)))
1821 < FIRST_PSEUDO_REGISTER))
1822 /* We may only emit an insn directly after P if we
1823 are not in the shadow of a live flags register. */
1824 && GET_MODE (p) == VOIDmode)
1826 search_end = q;
1827 q = insn;
1828 set2 = set;
1829 newconst = -insn_const;
1830 code = MINUS;
1832 else
1833 break;
1835 else
1837 newconst = INTVAL (XEXP (SET_SRC (set2), 1)) - insn_const;
1838 /* Reject out of range shifts. */
1839 if (code != PLUS
1840 && (newconst < 0
1841 || ((unsigned HOST_WIDE_INT) newconst
1842 >= (GET_MODE_BITSIZE (GET_MODE
1843 (SET_SRC (set2)))))))
1844 break;
1845 if (code == PLUS)
1847 post_inc = q;
1848 if (SET_DEST (set2) != src)
1849 post_inc_set = set2;
1852 /* We use 1 as last argument to validate_change so that all
1853 changes are accepted or rejected together by apply_change_group
1854 when it is called by validate_replace_rtx . */
1855 validate_change (q, &XEXP (SET_SRC (set2), 1),
1856 GEN_INT (newconst), 1);
1858 validate_change (insn, recog_data.operand_loc[match_number], src, 1);
1859 if (validate_replace_rtx (dst, src_subreg, p))
1860 success = 1;
1861 break;
1864 if (reg_overlap_mentioned_p (dst, PATTERN (p)))
1865 break;
1866 if (! src_note && reg_overlap_mentioned_p (src, PATTERN (p)))
1868 /* INSN was already checked to be movable wrt. the registers that it
1869 sets / uses when we found no REG_DEAD note for src on it, but it
1870 still might clobber the flags register. We'll have to check that
1871 we won't insert it into the shadow of a live flags register when
1872 we finally know where we are to move it. */
1873 overlap = p;
1874 src_note = find_reg_note (p, REG_DEAD, src);
1877 /* If we have passed a call instruction, and the pseudo-reg SRC is not
1878 already live across a call, then don't perform the optimization. */
1879 if (GET_CODE (p) == CALL_INSN)
1881 if (REG_N_CALLS_CROSSED (REGNO (src)) == 0)
1882 break;
1884 num_calls++;
1886 if (src_note)
1887 s_num_calls++;
1892 if (! success)
1893 return 0;
1895 /* Remove the death note for DST from P. */
1896 remove_note (p, dst_note);
1897 if (code == MINUS)
1899 post_inc = emit_insn_after (copy_rtx (PATTERN (insn)), p);
1900 if ((HAVE_PRE_INCREMENT || HAVE_PRE_DECREMENT)
1901 && search_end
1902 && try_auto_increment (search_end, post_inc, 0, src, newconst, 1))
1903 post_inc = 0;
1904 validate_change (insn, &XEXP (SET_SRC (set), 1), GEN_INT (insn_const), 0);
1905 REG_N_SETS (REGNO (src))++;
1906 REG_LIVE_LENGTH (REGNO (src))++;
1908 if (overlap)
1910 /* The lifetime of src and dest overlap,
1911 but we can change this by moving insn. */
1912 rtx pat = PATTERN (insn);
1913 if (src_note)
1914 remove_note (overlap, src_note);
1915 if ((HAVE_POST_INCREMENT || HAVE_POST_DECREMENT)
1916 && code == PLUS
1917 && try_auto_increment (overlap, insn, 0, src, insn_const, 0))
1918 insn = overlap;
1919 else
1921 rtx notes = REG_NOTES (insn);
1923 emit_insn_after_with_line_notes (pat, PREV_INSN (p), insn);
1924 delete_insn (insn);
1925 /* emit_insn_after_with_line_notes has no
1926 return value, so search for the new insn. */
1927 insn = p;
1928 while (! INSN_P (insn) || PATTERN (insn) != pat)
1929 insn = PREV_INSN (insn);
1931 REG_NOTES (insn) = notes;
1934 /* Sometimes we'd generate src = const; src += n;
1935 if so, replace the instruction that set src
1936 in the first place. */
1938 if (! overlap && (code == PLUS || code == MINUS))
1940 rtx note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
1941 rtx q, set2 = NULL_RTX;
1942 int num_calls2 = 0, s_length2 = 0;
1944 if (note && CONSTANT_P (XEXP (note, 0)))
1946 for (q = PREV_INSN (insn); q; q = PREV_INSN (q))
1948 /* ??? We can't scan past the end of a basic block without
1949 updating the register lifetime info
1950 (REG_DEAD/basic_block_live_at_start). */
1951 if (perhaps_ends_bb_p (q))
1953 q = 0;
1954 break;
1956 else if (! INSN_P (q))
1957 continue;
1959 s_length2++;
1960 if (reg_set_p (src, q))
1962 set2 = single_set (q);
1963 break;
1965 if (reg_overlap_mentioned_p (src, PATTERN (q)))
1967 q = 0;
1968 break;
1970 if (GET_CODE (p) == CALL_INSN)
1971 num_calls2++;
1973 if (q && set2 && SET_DEST (set2) == src && CONSTANT_P (SET_SRC (set2))
1974 && validate_change (insn, &SET_SRC (set), XEXP (note, 0), 0))
1976 delete_insn (q);
1977 REG_N_SETS (REGNO (src))--;
1978 REG_N_CALLS_CROSSED (REGNO (src)) -= num_calls2;
1979 REG_LIVE_LENGTH (REGNO (src)) -= s_length2;
1980 insn_const = 0;
1985 if ((HAVE_PRE_INCREMENT || HAVE_PRE_DECREMENT)
1986 && (code == PLUS || code == MINUS) && insn_const
1987 && try_auto_increment (p, insn, 0, src, insn_const, 1))
1988 insn = p;
1989 else if ((HAVE_POST_INCREMENT || HAVE_POST_DECREMENT)
1990 && post_inc
1991 && try_auto_increment (p, post_inc, post_inc_set, src, newconst, 0))
1992 post_inc = 0;
1993 /* If post_inc still prevails, try to find an
1994 insn where it can be used as a pre-in/decrement.
1995 If code is MINUS, this was already tried. */
1996 if (post_inc && code == PLUS
1997 /* Check that newconst is likely to be usable
1998 in a pre-in/decrement before starting the search. */
1999 && ((HAVE_PRE_INCREMENT && newconst > 0 && newconst <= MOVE_MAX)
2000 || (HAVE_PRE_DECREMENT && newconst < 0 && newconst >= -MOVE_MAX))
2001 && exact_log2 (newconst))
2003 rtx q, inc_dest;
2005 inc_dest = post_inc_set ? SET_DEST (post_inc_set) : src;
2006 for (q = post_inc; (q = NEXT_INSN (q)); )
2008 /* ??? We can't scan past the end of a basic block without updating
2009 the register lifetime info
2010 (REG_DEAD/basic_block_live_at_start). */
2011 if (perhaps_ends_bb_p (q))
2012 break;
2013 else if (! INSN_P (q))
2014 continue;
2015 else if (src != inc_dest
2016 && (reg_overlap_mentioned_p (src, PATTERN (q))
2017 || reg_set_p (src, q)))
2018 break;
2019 else if (reg_set_p (inc_dest, q))
2020 break;
2021 else if (reg_overlap_mentioned_p (inc_dest, PATTERN (q)))
2023 try_auto_increment (q, post_inc,
2024 post_inc_set, inc_dest, newconst, 1);
2025 break;
2030 /* Move the death note for DST to INSN if it is used
2031 there. */
2032 if (reg_overlap_mentioned_p (dst, PATTERN (insn)))
2034 XEXP (dst_note, 1) = REG_NOTES (insn);
2035 REG_NOTES (insn) = dst_note;
2038 if (src_note)
2040 /* Move the death note for SRC from INSN to P. */
2041 if (! overlap)
2042 remove_note (insn, src_note);
2043 XEXP (src_note, 1) = REG_NOTES (p);
2044 REG_NOTES (p) = src_note;
2046 REG_N_CALLS_CROSSED (REGNO (src)) += s_num_calls;
2049 REG_N_SETS (REGNO (src))++;
2050 REG_N_SETS (REGNO (dst))--;
2052 REG_N_CALLS_CROSSED (REGNO (dst)) -= num_calls;
2054 REG_LIVE_LENGTH (REGNO (src)) += s_length;
2055 if (REG_LIVE_LENGTH (REGNO (dst)) >= 0)
2057 REG_LIVE_LENGTH (REGNO (dst)) -= length;
2058 /* REG_LIVE_LENGTH is only an approximation after
2059 combine if sched is not run, so make sure that we
2060 still have a reasonable value. */
2061 if (REG_LIVE_LENGTH (REGNO (dst)) < 2)
2062 REG_LIVE_LENGTH (REGNO (dst)) = 2;
2064 if (regmove_dump_file)
2065 fprintf (regmove_dump_file,
2066 "Fixed operand %d of insn %d matching operand %d.\n",
2067 operand_number, INSN_UID (insn), match_number);
2068 return 1;
2072 /* return nonzero if X is stable and mentions no regsiters but for
2073 mentioning SRC or mentioning / changing DST . If in doubt, presume
2074 it is unstable.
2075 The rationale is that we want to check if we can move an insn easily
2076 while just paying attention to SRC and DST. A register is considered
2077 stable if it has the RTX_UNCHANGING_P bit set, but that would still
2078 leave the burden to update REG_DEAD / REG_UNUSED notes, so we don't
2079 want any registers but SRC and DST. */
2080 static int
2081 stable_and_no_regs_but_for_p (x, src, dst)
2082 rtx x, src, dst;
2084 RTX_CODE code = GET_CODE (x);
2085 switch (GET_RTX_CLASS (code))
2087 case '<': case '1': case 'c': case '2': case 'b': case '3':
2089 int i;
2090 const char *fmt = GET_RTX_FORMAT (code);
2091 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2092 if (fmt[i] == 'e'
2093 && ! stable_and_no_regs_but_for_p (XEXP (x, i), src, dst))
2094 return 0;
2095 return 1;
2097 case 'o':
2098 if (code == REG)
2099 return x == src || x == dst;
2100 /* If this is a MEM, look inside - there might be a register hidden in
2101 the address of an unchanging MEM. */
2102 if (code == MEM
2103 && ! stable_and_no_regs_but_for_p (XEXP (x, 0), src, dst))
2104 return 0;
2105 /* fall through */
2106 default:
2107 return ! rtx_unstable_p (x);
2111 /* Track stack adjustments and stack memory references. Attempt to
2112 reduce the number of stack adjustments by back-propagating across
2113 the memory references.
2115 This is intended primarily for use with targets that do not define
2116 ACCUMULATE_OUTGOING_ARGS. It is of significantly more value to
2117 targets that define PREFERRED_STACK_BOUNDARY more aligned than
2118 STACK_BOUNDARY (e.g. x86), or if not all registers can be pushed
2119 (e.g. x86 fp regs) which would ordinarily have to be implemented
2120 as a sub/mov pair due to restrictions in calls.c.
2122 Propagation stops when any of the insns that need adjusting are
2123 (a) no longer valid because we've exceeded their range, (b) a
2124 non-trivial push instruction, or (c) a call instruction.
2126 Restriction B is based on the assumption that push instructions
2127 are smaller or faster. If a port really wants to remove all
2128 pushes, it should have defined ACCUMULATE_OUTGOING_ARGS. The
2129 one exception that is made is for an add immediately followed
2130 by a push. */
2132 /* This structure records stack memory references between stack adjusting
2133 instructions. */
2135 struct csa_memlist
2137 HOST_WIDE_INT sp_offset;
2138 rtx insn, *mem;
2139 struct csa_memlist *next;
2142 static int stack_memref_p PARAMS ((rtx));
2143 static rtx single_set_for_csa PARAMS ((rtx));
2144 static void free_csa_memlist PARAMS ((struct csa_memlist *));
2145 static struct csa_memlist *record_one_stack_memref
2146 PARAMS ((rtx, rtx *, struct csa_memlist *));
2147 static int try_apply_stack_adjustment
2148 PARAMS ((rtx, struct csa_memlist *, HOST_WIDE_INT, HOST_WIDE_INT));
2149 static void combine_stack_adjustments_for_block PARAMS ((basic_block));
2150 static int record_stack_memrefs PARAMS ((rtx *, void *));
2153 /* Main entry point for stack adjustment combination. */
2155 void
2156 combine_stack_adjustments ()
2158 basic_block bb;
2160 FOR_EACH_BB (bb)
2161 combine_stack_adjustments_for_block (bb);
2164 /* Recognize a MEM of the form (sp) or (plus sp const). */
2166 static int
2167 stack_memref_p (x)
2168 rtx x;
2170 if (GET_CODE (x) != MEM)
2171 return 0;
2172 x = XEXP (x, 0);
2174 if (x == stack_pointer_rtx)
2175 return 1;
2176 if (GET_CODE (x) == PLUS
2177 && XEXP (x, 0) == stack_pointer_rtx
2178 && GET_CODE (XEXP (x, 1)) == CONST_INT)
2179 return 1;
2181 return 0;
2184 /* Recognize either normal single_set or the hack in i386.md for
2185 tying fp and sp adjustments. */
2187 static rtx
2188 single_set_for_csa (insn)
2189 rtx insn;
2191 int i;
2192 rtx tmp = single_set (insn);
2193 if (tmp)
2194 return tmp;
2196 if (GET_CODE (insn) != INSN
2197 || GET_CODE (PATTERN (insn)) != PARALLEL)
2198 return NULL_RTX;
2200 tmp = PATTERN (insn);
2201 if (GET_CODE (XVECEXP (tmp, 0, 0)) != SET)
2202 return NULL_RTX;
2204 for (i = 1; i < XVECLEN (tmp, 0); ++i)
2206 rtx this = XVECEXP (tmp, 0, i);
2208 /* The special case is allowing a no-op set. */
2209 if (GET_CODE (this) == SET
2210 && SET_SRC (this) == SET_DEST (this))
2212 else if (GET_CODE (this) != CLOBBER
2213 && GET_CODE (this) != USE)
2214 return NULL_RTX;
2217 return XVECEXP (tmp, 0, 0);
2220 /* Free the list of csa_memlist nodes. */
2222 static void
2223 free_csa_memlist (memlist)
2224 struct csa_memlist *memlist;
2226 struct csa_memlist *next;
2227 for (; memlist ; memlist = next)
2229 next = memlist->next;
2230 free (memlist);
2234 /* Create a new csa_memlist node from the given memory reference.
2235 It is already known that the memory is stack_memref_p. */
2237 static struct csa_memlist *
2238 record_one_stack_memref (insn, mem, next_memlist)
2239 rtx insn, *mem;
2240 struct csa_memlist *next_memlist;
2242 struct csa_memlist *ml;
2244 ml = (struct csa_memlist *) xmalloc (sizeof (*ml));
2246 if (XEXP (*mem, 0) == stack_pointer_rtx)
2247 ml->sp_offset = 0;
2248 else
2249 ml->sp_offset = INTVAL (XEXP (XEXP (*mem, 0), 1));
2251 ml->insn = insn;
2252 ml->mem = mem;
2253 ml->next = next_memlist;
2255 return ml;
2258 /* Attempt to apply ADJUST to the stack adjusting insn INSN, as well
2259 as each of the memories in MEMLIST. Return true on success. */
2261 static int
2262 try_apply_stack_adjustment (insn, memlist, new_adjust, delta)
2263 rtx insn;
2264 struct csa_memlist *memlist;
2265 HOST_WIDE_INT new_adjust, delta;
2267 struct csa_memlist *ml;
2268 rtx set;
2270 set = single_set_for_csa (insn);
2271 validate_change (insn, &XEXP (SET_SRC (set), 1), GEN_INT (new_adjust), 1);
2273 for (ml = memlist; ml ; ml = ml->next)
2274 validate_change
2275 (ml->insn, ml->mem,
2276 replace_equiv_address_nv (*ml->mem,
2277 plus_constant (stack_pointer_rtx,
2278 ml->sp_offset - delta)), 1);
2280 if (apply_change_group ())
2282 /* Succeeded. Update our knowledge of the memory references. */
2283 for (ml = memlist; ml ; ml = ml->next)
2284 ml->sp_offset -= delta;
2286 return 1;
2288 else
2289 return 0;
2292 /* Called via for_each_rtx and used to record all stack memory references in
2293 the insn and discard all other stack pointer references. */
2294 struct record_stack_memrefs_data
2296 rtx insn;
2297 struct csa_memlist *memlist;
2300 static int
2301 record_stack_memrefs (xp, data)
2302 rtx *xp;
2303 void *data;
2305 rtx x = *xp;
2306 struct record_stack_memrefs_data *d =
2307 (struct record_stack_memrefs_data *) data;
2308 if (!x)
2309 return 0;
2310 switch (GET_CODE (x))
2312 case MEM:
2313 if (!reg_mentioned_p (stack_pointer_rtx, x))
2314 return -1;
2315 /* We are not able to handle correctly all possible memrefs containing
2316 stack pointer, so this check is necessary. */
2317 if (stack_memref_p (x))
2319 d->memlist = record_one_stack_memref (d->insn, xp, d->memlist);
2320 return -1;
2322 return 1;
2323 case REG:
2324 /* ??? We want be able to handle non-memory stack pointer
2325 references later. For now just discard all insns refering to
2326 stack pointer outside mem expressions. We would probably
2327 want to teach validate_replace to simplify expressions first.
2329 We can't just compare with STACK_POINTER_RTX because the
2330 reference to the stack pointer might be in some other mode.
2331 In particular, an explicit clobber in an asm statement will
2332 result in a QImode clober. */
2333 if (REGNO (x) == STACK_POINTER_REGNUM)
2334 return 1;
2335 break;
2336 default:
2337 break;
2339 return 0;
2342 /* Subroutine of combine_stack_adjustments, called for each basic block. */
2344 static void
2345 combine_stack_adjustments_for_block (bb)
2346 basic_block bb;
2348 HOST_WIDE_INT last_sp_adjust = 0;
2349 rtx last_sp_set = NULL_RTX;
2350 struct csa_memlist *memlist = NULL;
2351 rtx insn, next, set;
2352 struct record_stack_memrefs_data data;
2353 bool end_of_block = false;
2355 for (insn = bb->head; !end_of_block ; insn = next)
2357 end_of_block = insn == bb->end;
2358 next = NEXT_INSN (insn);
2360 if (! INSN_P (insn))
2361 continue;
2363 set = single_set_for_csa (insn);
2364 if (set)
2366 rtx dest = SET_DEST (set);
2367 rtx src = SET_SRC (set);
2369 /* Find constant additions to the stack pointer. */
2370 if (dest == stack_pointer_rtx
2371 && GET_CODE (src) == PLUS
2372 && XEXP (src, 0) == stack_pointer_rtx
2373 && GET_CODE (XEXP (src, 1)) == CONST_INT)
2375 HOST_WIDE_INT this_adjust = INTVAL (XEXP (src, 1));
2377 /* If we've not seen an adjustment previously, record
2378 it now and continue. */
2379 if (! last_sp_set)
2381 last_sp_set = insn;
2382 last_sp_adjust = this_adjust;
2383 continue;
2386 /* If not all recorded memrefs can be adjusted, or the
2387 adjustment is now too large for a constant addition,
2388 we cannot merge the two stack adjustments.
2390 Also we need to be careful to not move stack pointer
2391 such that we create stack accesses outside the allocated
2392 area. We can combine an allocation into the first insn,
2393 or a deallocation into the second insn. We can not
2394 combine an allocation followed by a deallocation.
2396 The only somewhat frequent occurrence of the later is when
2397 a function allocates a stack frame but does not use it.
2398 For this case, we would need to analyze rtl stream to be
2399 sure that allocated area is really unused. This means not
2400 only checking the memory references, but also all registers
2401 or global memory references possibly containing a stack
2402 frame address.
2404 Perhaps the best way to address this problem is to teach
2405 gcc not to allocate stack for objects never used. */
2407 /* Combine an allocation into the first instruction. */
2408 if (STACK_GROWS_DOWNWARD ? this_adjust <= 0 : this_adjust >= 0)
2410 if (try_apply_stack_adjustment (last_sp_set, memlist,
2411 last_sp_adjust + this_adjust,
2412 this_adjust))
2414 /* It worked! */
2415 delete_insn (insn);
2416 last_sp_adjust += this_adjust;
2417 continue;
2421 /* Otherwise we have a deallocation. Do not combine with
2422 a previous allocation. Combine into the second insn. */
2423 else if (STACK_GROWS_DOWNWARD
2424 ? last_sp_adjust >= 0 : last_sp_adjust <= 0)
2426 if (try_apply_stack_adjustment (insn, memlist,
2427 last_sp_adjust + this_adjust,
2428 -last_sp_adjust))
2430 /* It worked! */
2431 delete_insn (last_sp_set);
2432 last_sp_set = insn;
2433 last_sp_adjust += this_adjust;
2434 free_csa_memlist (memlist);
2435 memlist = NULL;
2436 continue;
2440 /* Combination failed. Restart processing from here. If
2441 deallocation+allocation conspired to cancel, we can
2442 delete the old deallocation insn. */
2443 if (last_sp_set && last_sp_adjust == 0)
2444 delete_insn (insn);
2445 free_csa_memlist (memlist);
2446 memlist = NULL;
2447 last_sp_set = insn;
2448 last_sp_adjust = this_adjust;
2449 continue;
2452 /* Find a predecrement of exactly the previous adjustment and
2453 turn it into a direct store. Obviously we can't do this if
2454 there were any intervening uses of the stack pointer. */
2455 if (memlist == NULL
2456 && GET_CODE (dest) == MEM
2457 && ((GET_CODE (XEXP (dest, 0)) == PRE_DEC
2458 && (last_sp_adjust
2459 == (HOST_WIDE_INT) GET_MODE_SIZE (GET_MODE (dest))))
2460 || (GET_CODE (XEXP (dest, 0)) == PRE_MODIFY
2461 && GET_CODE (XEXP (XEXP (dest, 0), 1)) == PLUS
2462 && XEXP (XEXP (XEXP (dest, 0), 1), 0) == stack_pointer_rtx
2463 && (GET_CODE (XEXP (XEXP (XEXP (dest, 0), 1), 1))
2464 == CONST_INT)
2465 && (INTVAL (XEXP (XEXP (XEXP (dest, 0), 1), 1))
2466 == -last_sp_adjust)))
2467 && XEXP (XEXP (dest, 0), 0) == stack_pointer_rtx
2468 && ! reg_mentioned_p (stack_pointer_rtx, src)
2469 && memory_address_p (GET_MODE (dest), stack_pointer_rtx)
2470 && validate_change (insn, &SET_DEST (set),
2471 replace_equiv_address (dest,
2472 stack_pointer_rtx),
2475 delete_insn (last_sp_set);
2476 free_csa_memlist (memlist);
2477 memlist = NULL;
2478 last_sp_set = NULL_RTX;
2479 last_sp_adjust = 0;
2480 continue;
2484 data.insn = insn;
2485 data.memlist = memlist;
2486 if (GET_CODE (insn) != CALL_INSN && last_sp_set
2487 && !for_each_rtx (&PATTERN (insn), record_stack_memrefs, &data))
2489 memlist = data.memlist;
2490 continue;
2492 memlist = data.memlist;
2494 /* Otherwise, we were not able to process the instruction.
2495 Do not continue collecting data across such a one. */
2496 if (last_sp_set
2497 && (GET_CODE (insn) == CALL_INSN
2498 || reg_mentioned_p (stack_pointer_rtx, PATTERN (insn))))
2500 if (last_sp_set && last_sp_adjust == 0)
2501 delete_insn (last_sp_set);
2502 free_csa_memlist (memlist);
2503 memlist = NULL;
2504 last_sp_set = NULL_RTX;
2505 last_sp_adjust = 0;
2509 if (last_sp_set && last_sp_adjust == 0)
2510 delete_insn (last_sp_set);