/* Perform simple optimizations to clean up the result of reload.
   Copyright (C) 1987-2016 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "backend.h"
#include "target.h"
#include "rtl.h"
#include "tree.h"
#include "predict.h"
#include "df.h"
#include "memmodel.h"
#include "tm_p.h"
#include "optabs.h"
#include "regs.h"
#include "emit-rtl.h"
#include "recog.h"

#include "cfgrtl.h"
#include "cfgbuild.h"
#include "cfgcleanup.h"
#include "reload.h"
#include "cselib.h"
#include "tree-pass.h"
#include "dbgcnt.h"
static int reload_cse_noop_set_p (rtx);
static bool reload_cse_simplify (rtx_insn *, rtx);
static void reload_cse_regs_1 (void);
static int reload_cse_simplify_set (rtx, rtx_insn *);
static int reload_cse_simplify_operands (rtx_insn *, rtx);

static void reload_combine (void);
static void reload_combine_note_use (rtx *, rtx_insn *, int, rtx);
static void reload_combine_note_store (rtx, const_rtx, void *);

static bool reload_cse_move2add (rtx_insn *);
static void move2add_note_store (rtx, const_rtx, void *);
/* Call cse / combine like post-reload optimization phases.
   FIRST is the first instruction.  */

static void
reload_cse_regs (rtx_insn *first ATTRIBUTE_UNUSED)
{
  bool moves_converted;
  reload_cse_regs_1 ();
  reload_combine ();
  moves_converted = reload_cse_move2add (first);
  if (flag_expensive_optimizations)
    {
      if (moves_converted)
        reload_combine ();
      reload_cse_regs_1 ();
    }
}
/* See whether a single set SET is a noop.  */
static int
reload_cse_noop_set_p (rtx set)
{
  if (cselib_reg_set_mode (SET_DEST (set)) != GET_MODE (SET_DEST (set)))
    return 0;

  return rtx_equal_for_cselib_p (SET_DEST (set), SET_SRC (set));
}
/* Try to simplify INSN.  Return true if the CFG may have changed.  */
static bool
reload_cse_simplify (rtx_insn *insn, rtx testreg)
{
  rtx body = PATTERN (insn);
  basic_block insn_bb = BLOCK_FOR_INSN (insn);
  unsigned insn_bb_succs = EDGE_COUNT (insn_bb->succs);

  if (GET_CODE (body) == SET)
    {
      int count = 0;

      /* Simplify even if we may think it is a no-op.
         We may think a memory load of a value smaller than WORD_SIZE
         is redundant because we haven't taken into account possible
         implicit extension.  reload_cse_simplify_set () will bring
         this out, so it's safer to simplify before we delete.  */
      count += reload_cse_simplify_set (body, insn);

      if (!count && reload_cse_noop_set_p (body))
        {
          if (check_for_inc_dec (insn))
            delete_insn_and_edges (insn);
          /* We're done with this insn.  */
          goto done;
        }

      if (count > 0)
        apply_change_group ();
      else
        reload_cse_simplify_operands (insn, testreg);
    }
  else if (GET_CODE (body) == PARALLEL)
    {
      int i;
      int count = 0;
      rtx value = NULL_RTX;

      /* Registers mentioned in the clobber list for an asm cannot be reused
         within the body of the asm.  Invalidate those registers now so that
         we don't try to substitute values for them.  */
      if (asm_noperands (body) >= 0)
        {
          for (i = XVECLEN (body, 0) - 1; i >= 0; --i)
            {
              rtx part = XVECEXP (body, 0, i);
              if (GET_CODE (part) == CLOBBER && REG_P (XEXP (part, 0)))
                cselib_invalidate_rtx (XEXP (part, 0));
            }
        }

      /* If every action in a PARALLEL is a noop, we can delete
         the entire PARALLEL.  */
      for (i = XVECLEN (body, 0) - 1; i >= 0; --i)
        {
          rtx part = XVECEXP (body, 0, i);
          if (GET_CODE (part) == SET)
            {
              if (! reload_cse_noop_set_p (part))
                break;
              if (REG_P (SET_DEST (part))
                  && REG_FUNCTION_VALUE_P (SET_DEST (part)))
                {
                  if (value)
                    break;
                  value = SET_DEST (part);
                }
            }
          else if (GET_CODE (part) != CLOBBER
                   && GET_CODE (part) != USE)
            break;
        }

      if (i < 0)
        {
          if (check_for_inc_dec (insn))
            delete_insn_and_edges (insn);
          /* We're done with this insn.  */
          goto done;
        }

      /* It's not a no-op, but we can try to simplify it.  */
      for (i = XVECLEN (body, 0) - 1; i >= 0; --i)
        if (GET_CODE (XVECEXP (body, 0, i)) == SET)
          count += reload_cse_simplify_set (XVECEXP (body, 0, i), insn);

      if (count > 0)
        apply_change_group ();
      else
        reload_cse_simplify_operands (insn, testreg);
    }

 done:
  return (EDGE_COUNT (insn_bb->succs) != insn_bb_succs);
}
/* Do a very simple CSE pass over the hard registers.

   This function detects no-op moves where we happened to assign two
   different pseudo-registers to the same hard register, and then
   copied one to the other.  Reload will generate a useless
   instruction copying a register to itself.

   This function also detects cases where we load a value from memory
   into two different registers, and (if memory is more expensive than
   registers) changes it to simply copy the first register into the
   second register.

   Another optimization is performed that scans the operands of each
   instruction to see whether the value is already available in a
   hard register.  It then replaces the operand with the hard register
   if possible, much like an optional reload would.  */
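
/* A minimal illustration of the cases above, with hypothetical RTL and
   arbitrary register numbers.  A no-op move left by reload:
       (set (reg:SI 1) (reg:SI 1))
   gets deleted.  A second load of a value already in a register:
       (set (reg:SI 2) (mem:SI (reg:SI 3)))
   becomes, when the copy is cheaper than the load,
       (set (reg:SI 2) (reg:SI 1))
   where (reg:SI 1) is known (via cselib) to hold the same value.  */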
static void
reload_cse_regs_1 (void)
{
  bool cfg_changed = false;
  basic_block bb;
  rtx_insn *insn;
  rtx testreg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);

  cselib_init (CSELIB_RECORD_MEMORY);
  init_alias_analysis ();

  FOR_EACH_BB_FN (bb, cfun)
    FOR_BB_INSNS (bb, insn)
      {
        if (INSN_P (insn))
          cfg_changed |= reload_cse_simplify (insn, testreg);

        cselib_process_insn (insn);
      }

  /* Clean up.  */
  end_alias_analysis ();
  cselib_finish ();
  if (cfg_changed)
    cleanup_cfg (0);
}
/* Try to simplify a single SET instruction.  SET is the set pattern.
   INSN is the instruction it came from.
   This function only handles one case: if we set a register to a value
   which is not a register, we try to find that value in some other register
   and change the set into a register copy.  */
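
/* Hypothetical example: if cselib knows that (reg:SI 1) currently holds
   the constant 42, then
       (set (reg:SI 0) (const_int 42))
   may be turned into the register copy
       (set (reg:SI 0) (reg:SI 1))
   provided the copy costs no more than the original source.  */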
static int
reload_cse_simplify_set (rtx set, rtx_insn *insn)
{
  int did_change = 0;
  int dreg;
  rtx src;
  reg_class_t dclass;
  int old_cost;
  cselib_val *val;
  struct elt_loc_list *l;
  enum rtx_code extend_op = UNKNOWN;
  bool speed = optimize_bb_for_speed_p (BLOCK_FOR_INSN (insn));

  dreg = true_regnum (SET_DEST (set));
  if (dreg < 0)
    return 0;

  src = SET_SRC (set);
  if (side_effects_p (src) || true_regnum (src) >= 0)
    return 0;

  dclass = REGNO_REG_CLASS (dreg);

  /* When replacing a memory with a register, we need to honor assumptions
     that combine made wrt the contents of sign bits.  We'll do this by
     generating an extend instruction instead of a reg->reg copy.  Thus
     the destination must be a register that we can widen.  */
  if (MEM_P (src)
      && GET_MODE_BITSIZE (GET_MODE (src)) < BITS_PER_WORD
      && (extend_op = LOAD_EXTEND_OP (GET_MODE (src))) != UNKNOWN
      && !REG_P (SET_DEST (set)))
    return 0;

  val = cselib_lookup (src, GET_MODE (SET_DEST (set)), 0, VOIDmode);
  if (! val)
    return 0;

  /* If memory loads are cheaper than register copies, don't change them.  */
  if (MEM_P (src))
    old_cost = memory_move_cost (GET_MODE (src), dclass, true);
  else if (REG_P (src))
    old_cost = register_move_cost (GET_MODE (src),
                                   REGNO_REG_CLASS (REGNO (src)), dclass);
  else
    old_cost = set_src_cost (src, GET_MODE (SET_DEST (set)), speed);

  for (l = val->locs; l; l = l->next)
    {
      rtx this_rtx = l->loc;
      int this_cost;

      if (CONSTANT_P (this_rtx) && ! references_value_p (this_rtx, 0))
        {
          if (extend_op != UNKNOWN)
            {
              wide_int result;

              if (!CONST_SCALAR_INT_P (this_rtx))
                continue;

              switch (extend_op)
                {
                case ZERO_EXTEND:
                  result = wide_int::from (std::make_pair (this_rtx,
                                                           GET_MODE (src)),
                                           BITS_PER_WORD, UNSIGNED);
                  break;
                case SIGN_EXTEND:
                  result = wide_int::from (std::make_pair (this_rtx,
                                                           GET_MODE (src)),
                                           BITS_PER_WORD, SIGNED);
                  break;
                default:
                  gcc_unreachable ();
                }
              this_rtx = immed_wide_int_const (result, word_mode);
            }

          this_cost = set_src_cost (this_rtx, GET_MODE (SET_DEST (set)), speed);
        }
      else if (REG_P (this_rtx))
        {
          if (extend_op != UNKNOWN)
            {
              this_rtx = gen_rtx_fmt_e (extend_op, word_mode, this_rtx);
              this_cost = set_src_cost (this_rtx, word_mode, speed);
            }
          else
            this_cost = register_move_cost (GET_MODE (this_rtx),
                                            REGNO_REG_CLASS (REGNO (this_rtx)),
                                            dclass);
        }
      else
        continue;

      /* If equal costs, prefer registers over anything else.  That
         tends to lead to smaller instructions on some machines.  */
      if (this_cost < old_cost
          || (this_cost == old_cost
              && REG_P (this_rtx)
              && !REG_P (SET_SRC (set))))
        {
          if (GET_MODE_BITSIZE (GET_MODE (SET_DEST (set))) < BITS_PER_WORD
              && extend_op != UNKNOWN
#ifdef CANNOT_CHANGE_MODE_CLASS
              && !CANNOT_CHANGE_MODE_CLASS (GET_MODE (SET_DEST (set)),
                                            word_mode,
                                            REGNO_REG_CLASS (REGNO (SET_DEST (set))))
#endif
              )
            {
              rtx wide_dest = gen_rtx_REG (word_mode, REGNO (SET_DEST (set)));
              ORIGINAL_REGNO (wide_dest) = ORIGINAL_REGNO (SET_DEST (set));
              validate_change (insn, &SET_DEST (set), wide_dest, 1);
            }

          validate_unshare_change (insn, &SET_SRC (set), this_rtx, 1);
          old_cost = this_cost, did_change = 1;
        }
    }

  return did_change;
}
/* Try to replace operands in INSN with equivalent values that are already
   in registers.  This can be viewed as optional reloading.

   For each non-register operand in the insn, see if any hard regs are
   known to be equivalent to that operand.  Record the alternatives which
   can accept these hard registers.  Among all alternatives, select the
   ones which are better or equal to the one currently matching, where
   "better" is in terms of '?' and '!' constraints.  Among the remaining
   alternatives, select the one which replaces most operands with
   hard registers.  */
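
/* Sketch of the idea on a made-up insn: for an operand with constraints
   "r,m" that currently matches the "m" alternative, if some hard
   register is known to hold the operand's value, the "r" alternative
   can be chosen instead and the operand replaced by that register,
   as long as "r" is not penalized by '?' or '!' relative to the
   current alternative.  */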
static int
reload_cse_simplify_operands (rtx_insn *insn, rtx testreg)
{
  int i, j;

  /* For each operand, all registers that are equivalent to it.  */
  HARD_REG_SET equiv_regs[MAX_RECOG_OPERANDS];

  const char *constraints[MAX_RECOG_OPERANDS];

  /* Vector recording how bad an alternative is.  */
  int *alternative_reject;
  /* Vector recording how many registers can be introduced by choosing
     this alternative.  */
  int *alternative_nregs;
  /* Array of vectors recording, for each operand and each alternative,
     which hard register to substitute, or -1 if the operand should be
     left as it is.  */
  int *op_alt_regno[MAX_RECOG_OPERANDS];
  /* Array of alternatives, sorted in order of decreasing desirability.  */
  int *alternative_order;

  extract_constrain_insn (insn);

  if (recog_data.n_alternatives == 0 || recog_data.n_operands == 0)
    return 0;

  alternative_reject = XALLOCAVEC (int, recog_data.n_alternatives);
  alternative_nregs = XALLOCAVEC (int, recog_data.n_alternatives);
  alternative_order = XALLOCAVEC (int, recog_data.n_alternatives);
  memset (alternative_reject, 0, recog_data.n_alternatives * sizeof (int));
  memset (alternative_nregs, 0, recog_data.n_alternatives * sizeof (int));

  /* For each operand, find out which regs are equivalent.  */
  for (i = 0; i < recog_data.n_operands; i++)
    {
      cselib_val *v;
      struct elt_loc_list *l;
      rtx op;

      CLEAR_HARD_REG_SET (equiv_regs[i]);

      /* cselib blows up on CODE_LABELs.  Trying to fix that doesn't seem
         right, so avoid the problem here.  Likewise if we have a constant
         and the insn pattern doesn't tell us the mode we need.  */
      if (LABEL_P (recog_data.operand[i])
          || (CONSTANT_P (recog_data.operand[i])
              && recog_data.operand_mode[i] == VOIDmode))
        continue;

      op = recog_data.operand[i];
      if (MEM_P (op)
          && GET_MODE_BITSIZE (GET_MODE (op)) < BITS_PER_WORD
          && LOAD_EXTEND_OP (GET_MODE (op)) != UNKNOWN)
        {
          rtx set = single_set (insn);

          /* We might have multiple sets, some of which do implicit
             extension.  Punt on this for now.  */
          if (! set)
            continue;
          /* If the destination is also a MEM or a STRICT_LOW_PART, no
             extension applies.
             Also, if there is an explicit extension, we don't have to
             worry about an implicit one.  */
          else if (MEM_P (SET_DEST (set))
                   || GET_CODE (SET_DEST (set)) == STRICT_LOW_PART
                   || GET_CODE (SET_SRC (set)) == ZERO_EXTEND
                   || GET_CODE (SET_SRC (set)) == SIGN_EXTEND)
            ; /* Continue ordinary processing.  */
#ifdef CANNOT_CHANGE_MODE_CLASS
          /* If the register cannot change mode to word_mode, it follows that
             it cannot have been used in word_mode.  */
          else if (REG_P (SET_DEST (set))
                   && CANNOT_CHANGE_MODE_CLASS (GET_MODE (SET_DEST (set)),
                                                word_mode,
                                                REGNO_REG_CLASS (REGNO (SET_DEST (set)))))
            ; /* Continue ordinary processing.  */
#endif
          /* If this is a straight load, make the extension explicit.  */
          else if (REG_P (SET_DEST (set))
                   && recog_data.n_operands == 2
                   && SET_SRC (set) == op
                   && SET_DEST (set) == recog_data.operand[1-i])
            {
              validate_change (insn, recog_data.operand_loc[i],
                               gen_rtx_fmt_e (LOAD_EXTEND_OP (GET_MODE (op)),
                                              word_mode, op),
                               1);
              validate_change (insn, recog_data.operand_loc[1-i],
                               gen_rtx_REG (word_mode, REGNO (SET_DEST (set))),
                               1);
              if (! apply_change_group ())
                return 0;
              return reload_cse_simplify_operands (insn, testreg);
            }
          else
            /* ??? There might be arithmetic operations with memory that are
               safe to optimize, but is it worth the trouble?  */
            continue;
        }

      if (side_effects_p (op))
        continue;
      v = cselib_lookup (op, recog_data.operand_mode[i], 0, VOIDmode);
      if (! v)
        continue;

      for (l = v->locs; l; l = l->next)
        if (REG_P (l->loc))
          SET_HARD_REG_BIT (equiv_regs[i], REGNO (l->loc));
    }

  alternative_mask preferred = get_preferred_alternatives (insn);
  for (i = 0; i < recog_data.n_operands; i++)
    {
      machine_mode mode;
      int regno;
      const char *p;

      op_alt_regno[i] = XALLOCAVEC (int, recog_data.n_alternatives);
      for (j = 0; j < recog_data.n_alternatives; j++)
        op_alt_regno[i][j] = -1;

      p = constraints[i] = recog_data.constraints[i];
      mode = recog_data.operand_mode[i];

      /* Add the reject values for each alternative given by the constraints
         for this operand.  */
      j = 0;
      while (*p != '\0')
        {
          char c = *p++;
          if (c == ',')
            j++;
          else if (c == '?')
            alternative_reject[j] += 3;
          else if (c == '!')
            alternative_reject[j] += 300;
        }

      /* We won't change operands which are already registers.  We
         also don't want to modify output operands.  */
      regno = true_regnum (recog_data.operand[i]);
      if (regno >= 0
          || constraints[i][0] == '='
          || constraints[i][0] == '+')
        continue;

      for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
        {
          enum reg_class rclass = NO_REGS;

          if (! TEST_HARD_REG_BIT (equiv_regs[i], regno))
            continue;

          set_mode_and_regno (testreg, mode, regno);

          /* We found a register equal to this operand.  Now look for all
             alternatives that can accept this register and have not been
             assigned a register they can use yet.  */
          j = 0;
          p = constraints[i];
          for (;;)
            {
              char c = *p;

              switch (c)
                {
                case 'g':
                  rclass = reg_class_subunion[rclass][GENERAL_REGS];
                  break;

                default:
                  rclass
                    = (reg_class_subunion
                       [rclass]
                       [reg_class_for_constraint (lookup_constraint (p))]);
                  break;

                case ',': case '\0':
                  /* See if REGNO fits this alternative, and set it up as the
                     replacement register if we don't have one for this
                     alternative yet and the operand being replaced is not
                     a cheap CONST_INT.  */
                  if (op_alt_regno[i][j] == -1
                      && TEST_BIT (preferred, j)
                      && reg_fits_class_p (testreg, rclass, 0, mode)
                      && (!CONST_INT_P (recog_data.operand[i])
                          || (set_src_cost (recog_data.operand[i], mode,
                                            optimize_bb_for_speed_p
                                             (BLOCK_FOR_INSN (insn)))
                              > set_src_cost (testreg, mode,
                                              optimize_bb_for_speed_p
                                               (BLOCK_FOR_INSN (insn))))))
                    {
                      alternative_nregs[j]++;
                      op_alt_regno[i][j] = regno;
                    }
                  j++;
                  rclass = NO_REGS;
                  break;
                }
              p += CONSTRAINT_LEN (c, p);

              if (c == '\0')
                break;
            }
        }
    }

  /* Record all alternatives which are better or equal to the currently
     matching one in the alternative_order array.  */
  for (i = j = 0; i < recog_data.n_alternatives; i++)
    if (alternative_reject[i] <= alternative_reject[which_alternative])
      alternative_order[j++] = i;
  recog_data.n_alternatives = j;

  /* Sort it.  Given a small number of alternatives, a dumb algorithm
     won't hurt too much.  */
  for (i = 0; i < recog_data.n_alternatives - 1; i++)
    {
      int best = i;
      int best_reject = alternative_reject[alternative_order[i]];
      int best_nregs = alternative_nregs[alternative_order[i]];

      for (j = i + 1; j < recog_data.n_alternatives; j++)
        {
          int this_reject = alternative_reject[alternative_order[j]];
          int this_nregs = alternative_nregs[alternative_order[j]];

          if (this_reject < best_reject
              || (this_reject == best_reject && this_nregs > best_nregs))
            {
              best = j;
              best_reject = this_reject;
              best_nregs = this_nregs;
            }
        }

      std::swap (alternative_order[best], alternative_order[i]);
    }

  /* Substitute the operands as determined by op_alt_regno for the best
     alternative.  */
  j = alternative_order[0];

  for (i = 0; i < recog_data.n_operands; i++)
    {
      machine_mode mode = recog_data.operand_mode[i];
      if (op_alt_regno[i][j] == -1)
        continue;

      validate_change (insn, recog_data.operand_loc[i],
                       gen_rtx_REG (mode, op_alt_regno[i][j]), 1);
    }

  for (i = recog_data.n_dups - 1; i >= 0; i--)
    {
      int op = recog_data.dup_num[i];
      machine_mode mode = recog_data.operand_mode[op];

      if (op_alt_regno[op][j] == -1)
        continue;

      validate_change (insn, recog_data.dup_loc[i],
                       gen_rtx_REG (mode, op_alt_regno[op][j]), 1);
    }

  return apply_change_group ();
}
/* If reload couldn't use reg+reg+offset addressing, try to use reg+reg
   addressing now.
   This code might also be useful when reload gave up on reg+reg addressing
   because of clashes between the return register and INDEX_REG_CLASS.  */
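
/* An illustration of the intended transformation, with hypothetical
   RTL and an arbitrary free index register REGZ:
       (set (reg:SI 1) (const_int 24))
       (set (reg:SI 1) (plus:SI (reg:SI 1) (reg:SI 2)))
       ... (mem:SI (reg:SI 1)) ...
   becomes
       (set (REGZ) (const_int 24))
       ... (mem:SI (plus:SI (REGZ) (reg:SI 2))) ...
   folding the addition into the address.  */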
/* The maximum number of uses of a register we can keep track of to
   replace them with reg+reg addressing.  */
#define RELOAD_COMBINE_MAX_USES 16

/* Describes a recorded use of a register.  */
struct reg_use
{
  /* The insn where a register has been used.  */
  rtx_insn *insn;
  /* Points to the memory reference enclosing the use, if any, NULL_RTX
     otherwise.  */
  rtx containing_mem;
  /* Location of the register within INSN.  */
  rtx *usep;
  /* The reverse uid of the insn.  */
  int ruid;
};

/* If the register is used in some unknown fashion, USE_INDEX is negative.
   If it is dead, USE_INDEX is RELOAD_COMBINE_MAX_USES, and STORE_RUID
   indicates where it is first set or clobbered.
   Otherwise, USE_INDEX is the index of the last encountered use of the
   register (which is first among these we have seen since we scan backwards).
   USE_RUID indicates the first encountered, i.e. last, of these uses.
   If ALL_OFFSETS_MATCH is true, all encountered uses were inside a PLUS
   with a constant offset; OFFSET contains this constant in that case.
   STORE_RUID is always meaningful if we only want to use a value in a
   register in a different place: it denotes the next insn in the insn
   stream (i.e. the last encountered) that sets or clobbers the register.
   REAL_STORE_RUID is similar, but clobbers are ignored when updating it.  */
static struct
{
  struct reg_use reg_use[RELOAD_COMBINE_MAX_USES];
  rtx offset;
  int use_index;
  int store_ruid;
  int real_store_ruid;
  int use_ruid;
  bool all_offsets_match;
} reg_state[FIRST_PSEUDO_REGISTER];

/* Reverse linear uid.  This is increased in reload_combine while scanning
   the instructions from last to first.  It is used to set last_label_ruid
   and the store_ruid / use_ruid fields in reg_state.  */
static int reload_combine_ruid;

/* The RUID of the last label we encountered in reload_combine.  */
static int last_label_ruid;

/* The RUID of the last jump we encountered in reload_combine.  */
static int last_jump_ruid;

/* The register numbers of the first and last index register.  A value of
   -1 in LAST_INDEX_REG indicates that we've previously computed these
   values and found no suitable index registers.  */
static int first_index_reg = -1;
static int last_index_reg;

#define LABEL_LIVE(LABEL) \
  (label_live[CODE_LABEL_NUMBER (LABEL) - min_labelno])
/* Subroutine of reload_combine_split_ruids, called to fix up a single
   ruid pointed to by *PRUID if it is higher than SPLIT_RUID.  */

static inline void
reload_combine_split_one_ruid (int *pruid, int split_ruid)
{
  if (*pruid > split_ruid)
    (*pruid)++;
}

/* Called when we insert a new insn in a position we've already passed in
   the scan.  Examine all our state, increasing all ruids that are higher
   than SPLIT_RUID by one in order to make room for a new insn.  */

static void
reload_combine_split_ruids (int split_ruid)
{
  unsigned i;

  reload_combine_split_one_ruid (&reload_combine_ruid, split_ruid);
  reload_combine_split_one_ruid (&last_label_ruid, split_ruid);
  reload_combine_split_one_ruid (&last_jump_ruid, split_ruid);

  for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
    {
      int j, idx = reg_state[i].use_index;
      reload_combine_split_one_ruid (&reg_state[i].use_ruid, split_ruid);
      reload_combine_split_one_ruid (&reg_state[i].store_ruid, split_ruid);
      reload_combine_split_one_ruid (&reg_state[i].real_store_ruid,
                                     split_ruid);
      if (idx < 0)
        continue;
      for (j = idx; j < RELOAD_COMBINE_MAX_USES; j++)
        {
          reload_combine_split_one_ruid (&reg_state[i].reg_use[j].ruid,
                                         split_ruid);
        }
    }
}
/* Called when we are about to rescan a previously encountered insn with
   reload_combine_note_use after modifying some part of it.  This clears all
   information about uses in that particular insn.  */

static void
reload_combine_purge_insn_uses (rtx_insn *insn)
{
  unsigned i;

  for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
    {
      int j, k, idx = reg_state[i].use_index;
      if (idx < 0)
        continue;
      j = k = RELOAD_COMBINE_MAX_USES;
      while (j-- > idx)
        {
          if (reg_state[i].reg_use[j].insn != insn)
            {
              k--;
              if (k != j)
                reg_state[i].reg_use[k] = reg_state[i].reg_use[j];
            }
        }
      reg_state[i].use_index = k;
    }
}

/* Called when we need to forget about all uses of REGNO after an insn
   which is identified by RUID.  */

static void
reload_combine_purge_reg_uses_after_ruid (unsigned regno, int ruid)
{
  int j, k, idx = reg_state[regno].use_index;
  if (idx < 0)
    return;
  j = k = RELOAD_COMBINE_MAX_USES;
  while (j-- > idx)
    {
      if (reg_state[regno].reg_use[j].ruid >= ruid)
        {
          k--;
          if (k != j)
            reg_state[regno].reg_use[k] = reg_state[regno].reg_use[j];
        }
    }
  reg_state[regno].use_index = k;
}
/* Find the use of REGNO with the ruid that is highest among those
   lower than RUID_LIMIT, and return it if it is the only use of this
   reg in the insn.  Return NULL otherwise.  */

static struct reg_use *
reload_combine_closest_single_use (unsigned regno, int ruid_limit)
{
  int i, best_ruid = 0;
  int use_idx = reg_state[regno].use_index;
  struct reg_use *retval;

  if (use_idx < 0)
    return NULL;
  retval = NULL;
  for (i = use_idx; i < RELOAD_COMBINE_MAX_USES; i++)
    {
      struct reg_use *use = reg_state[regno].reg_use + i;
      int this_ruid = use->ruid;
      if (this_ruid >= ruid_limit)
        continue;
      if (this_ruid > best_ruid)
        {
          best_ruid = this_ruid;
          retval = use;
        }
      else if (this_ruid == best_ruid)
        retval = NULL;
    }
  if (last_label_ruid >= best_ruid)
    return NULL;
  return retval;
}
/* After we've moved an add insn, fix up any debug insns that occur
   between the old location of the add and the new location.  REG is
   the destination register of the add insn; REPLACEMENT is the
   SET_SRC of the add.  FROM and TO specify the range in which we
   should make this change on debug insns.  */

static void
fixup_debug_insns (rtx reg, rtx replacement, rtx_insn *from, rtx_insn *to)
{
  rtx_insn *insn;
  for (insn = from; insn != to; insn = NEXT_INSN (insn))
    {
      rtx t;

      if (!DEBUG_INSN_P (insn))
        continue;

      t = INSN_VAR_LOCATION_LOC (insn);
      t = simplify_replace_rtx (t, reg, replacement);
      validate_change (insn, &INSN_VAR_LOCATION_LOC (insn), t, 0);
    }
}
/* Subroutine of reload_combine_recognize_const_pattern.  Try to replace REG
   with SRC in the insn described by USE, taking costs into account.  Return
   true if we made the replacement.  */

static bool
try_replace_in_use (struct reg_use *use, rtx reg, rtx src)
{
  rtx_insn *use_insn = use->insn;
  rtx mem = use->containing_mem;
  bool speed = optimize_bb_for_speed_p (BLOCK_FOR_INSN (use_insn));

  if (mem != NULL_RTX)
    {
      addr_space_t as = MEM_ADDR_SPACE (mem);
      rtx oldaddr = XEXP (mem, 0);
      rtx newaddr = NULL_RTX;
      int old_cost = address_cost (oldaddr, GET_MODE (mem), as, speed);
      int new_cost;

      newaddr = simplify_replace_rtx (oldaddr, reg, src);
      if (memory_address_addr_space_p (GET_MODE (mem), newaddr, as))
        {
          XEXP (mem, 0) = newaddr;
          new_cost = address_cost (newaddr, GET_MODE (mem), as, speed);
          XEXP (mem, 0) = oldaddr;
          if (new_cost <= old_cost
              && validate_change (use_insn,
                                  &XEXP (mem, 0), newaddr, 0))
            return true;
        }
    }
  else
    {
      rtx new_set = single_set (use_insn);
      if (new_set
          && REG_P (SET_DEST (new_set))
          && GET_CODE (SET_SRC (new_set)) == PLUS
          && REG_P (XEXP (SET_SRC (new_set), 0))
          && CONSTANT_P (XEXP (SET_SRC (new_set), 1)))
        {
          rtx new_src;
          machine_mode mode = GET_MODE (SET_DEST (new_set));
          int old_cost = set_src_cost (SET_SRC (new_set), mode, speed);

          gcc_assert (rtx_equal_p (XEXP (SET_SRC (new_set), 0), reg));
          new_src = simplify_replace_rtx (SET_SRC (new_set), reg, src);

          if (set_src_cost (new_src, mode, speed) <= old_cost
              && validate_change (use_insn, &SET_SRC (new_set),
                                  new_src, 0))
            return true;
        }
    }
  return false;
}
/* Called by reload_combine when scanning INSN.  This function tries to detect
   patterns where a constant is added to a register, and the result is used
   in an address.
   Return true if no further processing is needed on INSN; false if it wasn't
   recognized and should be handled normally.  */
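
/* For example (hypothetical RTL):
       (set (reg:SI 1) (plus:SI (reg:SI 2) (const_int 4)))
       ... (mem:SI (reg:SI 1)) ...
   can, if profitable, be rewritten so the use reads
       ... (mem:SI (plus:SI (reg:SI 2) (const_int 4))) ...
   after which the add insn may be deleted, or moved down past the
   uses when it sets the same register it reads.  */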
static bool
reload_combine_recognize_const_pattern (rtx_insn *insn)
{
  int from_ruid = reload_combine_ruid;
  rtx set, pat, reg, src, addreg;
  unsigned int regno;
  struct reg_use *use;
  bool must_move_add;
  rtx_insn *add_moved_after_insn = NULL;
  int add_moved_after_ruid = 0;
  int clobbered_regno = -1;

  set = single_set (insn);
  if (set == NULL_RTX)
    return false;

  reg = SET_DEST (set);
  src = SET_SRC (set);
  if (!REG_P (reg)
      || REG_NREGS (reg) != 1
      || GET_MODE (reg) != Pmode
      || reg == stack_pointer_rtx)
    return false;

  regno = REGNO (reg);

  /* We look for a REG1 = REG2 + CONSTANT insn, followed by either
     uses of REG1 inside an address, or inside another add insn.  If
     possible and profitable, merge the addition into subsequent
     uses.  */
  if (GET_CODE (src) != PLUS
      || !REG_P (XEXP (src, 0))
      || !CONSTANT_P (XEXP (src, 1)))
    return false;

  addreg = XEXP (src, 0);
  must_move_add = rtx_equal_p (reg, addreg);

  pat = PATTERN (insn);
  if (must_move_add && set != pat)
    {
      /* We have to be careful when moving the add; apart from the
         single_set there may also be clobbers.  Recognize one special
         case, that of one clobber alongside the set (likely a clobber
         of the CC register).  */
      gcc_assert (GET_CODE (PATTERN (insn)) == PARALLEL);
      if (XVECLEN (pat, 0) != 2 || XVECEXP (pat, 0, 0) != set
          || GET_CODE (XVECEXP (pat, 0, 1)) != CLOBBER
          || !REG_P (XEXP (XVECEXP (pat, 0, 1), 0)))
        return false;
      clobbered_regno = REGNO (XEXP (XVECEXP (pat, 0, 1), 0));
    }

  do
    {
      use = reload_combine_closest_single_use (regno, from_ruid);

      if (use)
        /* Start the search for the next use from here.  */
        from_ruid = use->ruid;

      if (use && GET_MODE (*use->usep) == Pmode)
        {
          bool delete_add = false;
          rtx_insn *use_insn = use->insn;
          int use_ruid = use->ruid;

          /* Avoid moving the add insn past a jump.  */
          if (must_move_add && use_ruid <= last_jump_ruid)
            break;

          /* If the add clobbers another hard reg in parallel, don't move
             it past a real set of this hard reg.  */
          if (must_move_add && clobbered_regno >= 0
              && reg_state[clobbered_regno].real_store_ruid >= use_ruid)
            break;

          /* Do not separate cc0 setter and cc0 user on HAVE_cc0 targets.  */
          if (HAVE_cc0 && must_move_add && sets_cc0_p (PATTERN (use_insn)))
            break;

          gcc_assert (reg_state[regno].store_ruid <= use_ruid);
          /* Avoid moving a use of ADDREG past a point where it is stored.  */
          if (reg_state[REGNO (addreg)].store_ruid > use_ruid)
            break;

          /* We also must not move the addition past an insn that sets
             the same register, unless we can combine two add insns.  */
          if (must_move_add && reg_state[regno].store_ruid == use_ruid)
            {
              if (use->containing_mem == NULL_RTX)
                delete_add = true;
              else
                break;
            }

          if (try_replace_in_use (use, reg, src))
            {
              reload_combine_purge_insn_uses (use_insn);
              reload_combine_note_use (&PATTERN (use_insn), use_insn,
                                       use_ruid, NULL_RTX);

              if (delete_add)
                {
                  fixup_debug_insns (reg, src, insn, use_insn);
                  delete_insn (insn);
                  return true;
                }
              if (must_move_add)
                {
                  add_moved_after_insn = use_insn;
                  add_moved_after_ruid = use_ruid;
                }
              continue;
            }
        }
      /* If we get here, we couldn't handle this use.  */
      if (must_move_add)
        break;
    }
  while (use);

  if (!must_move_add || add_moved_after_insn == NULL_RTX)
    /* Process the add normally.  */
    return false;

  fixup_debug_insns (reg, src, insn, add_moved_after_insn);

  reorder_insns (insn, insn, add_moved_after_insn);
  reload_combine_purge_reg_uses_after_ruid (regno, add_moved_after_ruid);
  reload_combine_split_ruids (add_moved_after_ruid - 1);
  reload_combine_note_use (&PATTERN (insn), insn,
                           add_moved_after_ruid, NULL_RTX);
  reg_state[regno].store_ruid = add_moved_after_ruid;

  return true;
}
/* Called by reload_combine when scanning INSN.  Try to detect a pattern we
   can handle and improve.  Return true if no further processing is needed on
   INSN; false if it wasn't recognized and should be handled normally.  */

static bool
reload_combine_recognize_pattern (rtx_insn *insn)
{
  rtx set, reg, src;

  set = single_set (insn);
  if (set == NULL_RTX)
    return false;

  reg = SET_DEST (set);
  src = SET_SRC (set);
  if (!REG_P (reg) || REG_NREGS (reg) != 1)
    return false;

  unsigned int regno = REGNO (reg);
  machine_mode mode = GET_MODE (reg);

  if (reg_state[regno].use_index < 0
      || reg_state[regno].use_index >= RELOAD_COMBINE_MAX_USES)
    return false;

  for (int i = reg_state[regno].use_index;
       i < RELOAD_COMBINE_MAX_USES; i++)
    {
      struct reg_use *use = reg_state[regno].reg_use + i;
      if (GET_MODE (*use->usep) != mode)
        return false;
    }

  /* Look for (set (REGX) (CONST_INT))
     (set (REGX) (PLUS (REGX) (REGY)))
     ...
     ... (MEM (REGX)) ...
     and convert it to
     (set (REGZ) (CONST_INT))
     ...
     ... (MEM (PLUS (REGZ) (REGY)))... .

     First, check that we have (set (REGX) (PLUS (REGX) (REGY)))
     and that we know all uses of REGX before it dies.
     Also, explicitly check that REGX != REGY; our life information
     does not yet show whether REGY changes in this insn.  */

  if (GET_CODE (src) == PLUS
      && reg_state[regno].all_offsets_match
      && last_index_reg != -1
      && REG_P (XEXP (src, 1))
      && rtx_equal_p (XEXP (src, 0), reg)
      && !rtx_equal_p (XEXP (src, 1), reg)
      && last_label_ruid < reg_state[regno].use_ruid)
    {
      rtx base = XEXP (src, 1);
      rtx_insn *prev = prev_nonnote_nondebug_insn (insn);
      rtx prev_set = prev ? single_set (prev) : NULL_RTX;
      rtx index_reg = NULL_RTX;
      rtx reg_sum = NULL_RTX;
      int i;

      /* Now we need to set INDEX_REG to an index register (denoted as
         REGZ in the illustration above) and REG_SUM to the expression
         register+register that we want to use to substitute uses of REG
         (typically in MEMs) with.  First check REG and BASE for being
         index registers; we can use them even if they are not dead.  */
      if (TEST_HARD_REG_BIT (reg_class_contents[INDEX_REG_CLASS], regno)
          || TEST_HARD_REG_BIT (reg_class_contents[INDEX_REG_CLASS],
                                REGNO (base)))
        {
          index_reg = reg;
          reg_sum = src;
        }
      else
        {
          /* Otherwise, look for a free index register.  Since we have
             checked above that neither REG nor BASE are index registers,
             if we find anything at all, it will be different from these
             two registers.  */
          for (i = first_index_reg; i <= last_index_reg; i++)
            {
              if (TEST_HARD_REG_BIT (reg_class_contents[INDEX_REG_CLASS], i)
                  && reg_state[i].use_index == RELOAD_COMBINE_MAX_USES
                  && reg_state[i].store_ruid <= reg_state[regno].use_ruid
                  && (call_used_regs[i] || df_regs_ever_live_p (i))
                  && (!frame_pointer_needed || i != HARD_FRAME_POINTER_REGNUM)
                  && !fixed_regs[i] && !global_regs[i]
                  && hard_regno_nregs[i][GET_MODE (reg)] == 1
                  && targetm.hard_regno_scratch_ok (i))
                {
                  index_reg = gen_rtx_REG (GET_MODE (reg), i);
                  reg_sum = gen_rtx_PLUS (GET_MODE (reg), index_reg, base);
                  break;
                }
            }
        }

      /* Check that PREV_SET is indeed (set (REGX) (CONST_INT)) and that
         (REGY), i.e. BASE, is not clobbered before the last use we'll
         create.  */
      if (reg_sum
          && prev_set
          && CONST_INT_P (SET_SRC (prev_set))
          && rtx_equal_p (SET_DEST (prev_set), reg)
          && (reg_state[REGNO (base)].store_ruid
              <= reg_state[regno].use_ruid))
        {
          /* Change destination register and, if necessary, the constant
             value in PREV, the constant loading instruction.  */
          validate_change (prev, &SET_DEST (prev_set), index_reg, 1);
          if (reg_state[regno].offset != const0_rtx)
            validate_change (prev,
                             &SET_SRC (prev_set),
                             GEN_INT (INTVAL (SET_SRC (prev_set))
                                      + INTVAL (reg_state[regno].offset)),
                             1);

          /* Now for every use of REG that we have recorded, replace REG
             with REG_SUM.  */
          for (i = reg_state[regno].use_index;
               i < RELOAD_COMBINE_MAX_USES; i++)
            validate_unshare_change (reg_state[regno].reg_use[i].insn,
                                     reg_state[regno].reg_use[i].usep,
                                     /* Each change must have its own
                                        replacement.  */
                                     reg_sum, 1);

          if (apply_change_group ())
            {
              struct reg_use *lowest_ruid = NULL;

              /* For every new use of REG_SUM, we have to record the use
                 of BASE therein, i.e. operand 1.  */
              for (i = reg_state[regno].use_index;
                   i < RELOAD_COMBINE_MAX_USES; i++)
                {
                  struct reg_use *use = reg_state[regno].reg_use + i;
                  reload_combine_note_use (&XEXP (*use->usep, 1), use->insn,
                                           use->ruid, use->containing_mem);
                  if (lowest_ruid == NULL || use->ruid < lowest_ruid->ruid)
                    lowest_ruid = use;
                }

              fixup_debug_insns (reg, reg_sum, insn, lowest_ruid->insn);

              /* Delete the reg-reg addition.  */
              delete_insn (insn);

              if (reg_state[regno].offset != const0_rtx)
                /* Previous REG_EQUIV / REG_EQUAL notes for PREV
                   are now invalid.  */
                remove_reg_equal_equiv_notes (prev);

              reg_state[regno].use_index = RELOAD_COMBINE_MAX_USES;
              return true;
            }
        }
    }
  return false;
}
static void
reload_combine (void)
{
  rtx_insn *insn, *prev;
  basic_block bb;
  unsigned int r;
  int min_labelno, n_labels;
  HARD_REG_SET ever_live_at_start, *label_live;

  /* To avoid wasting too much time later searching for an index register,
     determine the minimum and maximum index register numbers.  */
  if (INDEX_REG_CLASS == NO_REGS)
    last_index_reg = -1;
  else if (first_index_reg == -1 && last_index_reg == 0)
    {
      for (r = 0; r < FIRST_PSEUDO_REGISTER; r++)
        if (TEST_HARD_REG_BIT (reg_class_contents[INDEX_REG_CLASS], r))
          {
            if (first_index_reg == -1)
              first_index_reg = r;

            last_index_reg = r;
          }

      /* If no index register is available, we can quit now.  Set LAST_INDEX_REG
         to -1 so we'll know to quit early the next time we get here.  */
      if (first_index_reg == -1)
        {
          last_index_reg = -1;
          return;
        }
    }

  /* Set up LABEL_LIVE and EVER_LIVE_AT_START.  The register lifetime
     information is a bit fuzzy immediately after reload, but it's
     still good enough to determine which registers are live at a jump
     destination.  */
  min_labelno = get_first_label_num ();
  n_labels = max_label_num () - min_labelno;
  label_live = XNEWVEC (HARD_REG_SET, n_labels);
  CLEAR_HARD_REG_SET (ever_live_at_start);

  FOR_EACH_BB_REVERSE_FN (bb, cfun)
    {
      insn = BB_HEAD (bb);
      if (LABEL_P (insn))
        {
          HARD_REG_SET live;
          bitmap live_in = df_get_live_in (bb);

          REG_SET_TO_HARD_REG_SET (live, live_in);
          compute_use_by_pseudos (&live, live_in);
          COPY_HARD_REG_SET (LABEL_LIVE (insn), live);
          IOR_HARD_REG_SET (ever_live_at_start, live);
        }
    }

  /* Initialize last_label_ruid, reload_combine_ruid and reg_state.  */
  last_label_ruid = last_jump_ruid = reload_combine_ruid = 0;
  for (r = 0; r < FIRST_PSEUDO_REGISTER; r++)
    {
      reg_state[r].store_ruid = 0;
      reg_state[r].real_store_ruid = 0;
      if (fixed_regs[r])
        reg_state[r].use_index = -1;
      else
        reg_state[r].use_index = RELOAD_COMBINE_MAX_USES;
    }

  for (insn = get_last_insn (); insn; insn = prev)
    {
      bool control_flow_insn;
      rtx note;

      prev = PREV_INSN (insn);

      /* We cannot do our optimization across labels.  Invalidating all the use
         information we have would be costly, so we just note where the label
         is and then later disable any optimization that would cross it.  */
      if (LABEL_P (insn))
        last_label_ruid = reload_combine_ruid;
      else if (BARRIER_P (insn))
        {
          /* Crossing a barrier resets all the use information.  */
          for (r = 0; r < FIRST_PSEUDO_REGISTER; r++)
            if (! fixed_regs[r])
              reg_state[r].use_index = RELOAD_COMBINE_MAX_USES;
        }
      else if (INSN_P (insn) && volatile_insn_p (PATTERN (insn)))
        /* Optimizations across insns being marked as volatile must be
           prevented.  All the usage information is invalidated
           here.  */
        for (r = 0; r < FIRST_PSEUDO_REGISTER; r++)
          if (! fixed_regs[r]
              && reg_state[r].use_index != RELOAD_COMBINE_MAX_USES)
            reg_state[r].use_index = -1;

      if (! NONDEBUG_INSN_P (insn))
        continue;

      reload_combine_ruid++;

      control_flow_insn = control_flow_insn_p (insn);
      if (control_flow_insn)
        last_jump_ruid = reload_combine_ruid;

      if (reload_combine_recognize_const_pattern (insn)
          || reload_combine_recognize_pattern (insn))
        continue;

      note_stores (PATTERN (insn), reload_combine_note_store, NULL);

      if (CALL_P (insn))
        {
          rtx link;
          HARD_REG_SET used_regs;

          get_call_reg_set_usage (insn, &used_regs, call_used_reg_set);

          for (r = 0; r < FIRST_PSEUDO_REGISTER; r++)
            if (TEST_HARD_REG_BIT (used_regs, r))
              {
                reg_state[r].use_index = RELOAD_COMBINE_MAX_USES;
                reg_state[r].store_ruid = reload_combine_ruid;
              }

          for (link = CALL_INSN_FUNCTION_USAGE (insn); link;
               link = XEXP (link, 1))
            {
              rtx setuse = XEXP (link, 0);
              rtx usage_rtx = XEXP (setuse, 0);
              if ((GET_CODE (setuse) == USE || GET_CODE (setuse) == CLOBBER)
                  && REG_P (usage_rtx))
                {
                  unsigned int end_regno = END_REGNO (usage_rtx);
                  for (unsigned int i = REGNO (usage_rtx); i < end_regno; ++i)
                    if (GET_CODE (XEXP (link, 0)) == CLOBBER)
                      {
                        reg_state[i].use_index = RELOAD_COMBINE_MAX_USES;
                        reg_state[i].store_ruid = reload_combine_ruid;
                      }
                    else
                      reg_state[i].use_index = -1;
                }
            }
        }

      if (control_flow_insn && !ANY_RETURN_P (PATTERN (insn)))
        {
          /* Non-spill registers might be used at the call destination in
             some unknown fashion, so we have to mark the unknown use.  */
          HARD_REG_SET *live;

          if ((condjump_p (insn) || condjump_in_parallel_p (insn))
              && JUMP_LABEL (insn))
            {
              if (ANY_RETURN_P (JUMP_LABEL (insn)))
                live = NULL;
              else
                live = &LABEL_LIVE (JUMP_LABEL (insn));
            }
          else
            live = &ever_live_at_start;

          if (live)
            for (r = 0; r < FIRST_PSEUDO_REGISTER; r++)
              if (TEST_HARD_REG_BIT (*live, r))
                reg_state[r].use_index = -1;
        }

      reload_combine_note_use (&PATTERN (insn), insn, reload_combine_ruid,
                               NULL_RTX);

      for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
        {
          if (REG_NOTE_KIND (note) == REG_INC && REG_P (XEXP (note, 0)))
            {
              int regno = REGNO (XEXP (note, 0));
              reg_state[regno].store_ruid = reload_combine_ruid;
              reg_state[regno].real_store_ruid = reload_combine_ruid;
              reg_state[regno].use_index = -1;
            }
        }
    }

  free (label_live);
}
/* Check if DST is a register or a subreg of a register; if it is,
   update store_ruid, real_store_ruid and use_index in the reg_state
   structure accordingly.  Called via note_stores from reload_combine.  */

static void
reload_combine_note_store (rtx dst, const_rtx set, void *data ATTRIBUTE_UNUSED)
{
  int regno = 0;
  int i;
  machine_mode mode = GET_MODE (dst);

  if (GET_CODE (dst) == SUBREG)
    {
      regno = subreg_regno_offset (REGNO (SUBREG_REG (dst)),
                                   GET_MODE (SUBREG_REG (dst)),
                                   SUBREG_BYTE (dst),
                                   GET_MODE (dst));
      dst = SUBREG_REG (dst);
    }

  /* Some targets do argument pushes without adding REG_INC notes.  */

  if (MEM_P (dst))
    {
      dst = XEXP (dst, 0);
      if (GET_CODE (dst) == PRE_INC || GET_CODE (dst) == POST_INC
          || GET_CODE (dst) == PRE_DEC || GET_CODE (dst) == POST_DEC
          || GET_CODE (dst) == PRE_MODIFY || GET_CODE (dst) == POST_MODIFY)
        {
          unsigned int end_regno = END_REGNO (XEXP (dst, 0));
          for (unsigned int i = REGNO (XEXP (dst, 0)); i < end_regno; ++i)
            {
              /* We could probably do better, but for now mark the register
                 as used in an unknown fashion and set/clobbered at this
                 insn.  */
              reg_state[i].use_index = -1;
              reg_state[i].store_ruid = reload_combine_ruid;
              reg_state[i].real_store_ruid = reload_combine_ruid;
            }
        }
      else
        return;
    }

  if (!REG_P (dst))
    return;
  regno += REGNO (dst);

  /* note_stores might have stripped a STRICT_LOW_PART, so we have to be
     careful with registers / register parts that are not full words.
     Similarly for ZERO_EXTRACT.  */
  if (GET_CODE (SET_DEST (set)) == ZERO_EXTRACT
      || GET_CODE (SET_DEST (set)) == STRICT_LOW_PART)
    {
      for (i = hard_regno_nregs[regno][mode] - 1 + regno; i >= regno; i--)
        {
          reg_state[i].use_index = -1;
          reg_state[i].store_ruid = reload_combine_ruid;
          reg_state[i].real_store_ruid = reload_combine_ruid;
        }
    }
  else
    {
      for (i = hard_regno_nregs[regno][mode] - 1 + regno; i >= regno; i--)
        {
          reg_state[i].store_ruid = reload_combine_ruid;
          if (GET_CODE (set) == SET)
            reg_state[i].real_store_ruid = reload_combine_ruid;
          reg_state[i].use_index = RELOAD_COMBINE_MAX_USES;
        }
    }
}
/* XP points to a piece of rtl that has to be checked for any uses of
   registers.
   *XP is the pattern of INSN, or a part of it.
   Called from reload_combine, and recursively by itself.  */
static void
reload_combine_note_use (rtx *xp, rtx_insn *insn, int ruid, rtx containing_mem)
{
  rtx x = *xp;
  enum rtx_code code = x->code;
  const char *fmt;
  int i, j;
  rtx offset = const0_rtx; /* For the REG case below.  */

  switch (code)
    {
    case SET:
      if (REG_P (SET_DEST (x)))
        {
          reload_combine_note_use (&SET_SRC (x), insn, ruid, NULL_RTX);
          return;
        }
      break;

    case USE:
      /* If this is the USE of a return value, we can't change it.  */
      if (REG_P (XEXP (x, 0)) && REG_FUNCTION_VALUE_P (XEXP (x, 0)))
        {
          /* Mark the return register as used in an unknown fashion.  */
          rtx reg = XEXP (x, 0);
          unsigned int end_regno = END_REGNO (reg);
          for (unsigned int regno = REGNO (reg); regno < end_regno; ++regno)
            reg_state[regno].use_index = -1;
          return;
        }
      break;

    case CLOBBER:
      if (REG_P (SET_DEST (x)))
        {
          /* No spurious CLOBBERs of pseudo registers may remain.  */
          gcc_assert (REGNO (SET_DEST (x)) < FIRST_PSEUDO_REGISTER);
          return;
        }
      break;

    case PLUS:
      /* We are interested in (plus (reg) (const_int)) .  */
      if (!REG_P (XEXP (x, 0))
          || !CONST_INT_P (XEXP (x, 1)))
        break;
      offset = XEXP (x, 1);
      x = XEXP (x, 0);
      /* Fall through.  */
    case REG:
      {
        int regno = REGNO (x);
        int use_index;
        int nregs;

        /* No spurious USEs of pseudo registers may remain.  */
        gcc_assert (regno < FIRST_PSEUDO_REGISTER);

        nregs = REG_NREGS (x);

        /* We can't substitute into multi-hard-reg uses.  */
        if (nregs > 1)
          {
            while (--nregs >= 0)
              reg_state[regno + nregs].use_index = -1;
            return;
          }

        /* We may be called to update uses in previously seen insns.
           Don't add uses beyond the last store we saw.  */
        if (ruid < reg_state[regno].store_ruid)
          return;

        /* If this register is already used in some unknown fashion, we
           can't do anything.
           If we decrement the index from zero to -1, we can't store more
           uses, so this register becomes used in an unknown fashion.  */
        use_index = --reg_state[regno].use_index;
        if (use_index < 0)
          return;

        if (use_index == RELOAD_COMBINE_MAX_USES - 1)
          {
            /* This is the first use of this register we have seen since we
               marked it as dead.  */
            reg_state[regno].offset = offset;
            reg_state[regno].all_offsets_match = true;
            reg_state[regno].use_ruid = ruid;
          }
        else
          {
            if (reg_state[regno].use_ruid > ruid)
              reg_state[regno].use_ruid = ruid;

            if (! rtx_equal_p (offset, reg_state[regno].offset))
              reg_state[regno].all_offsets_match = false;
          }

        reg_state[regno].reg_use[use_index].insn = insn;
        reg_state[regno].reg_use[use_index].ruid = ruid;
        reg_state[regno].reg_use[use_index].containing_mem = containing_mem;
        reg_state[regno].reg_use[use_index].usep = xp;
        return;
      }

    case MEM:
      containing_mem = x;
      break;

    default:
      break;
    }

  /* Recursively process the components of X.  */
  fmt = GET_RTX_FORMAT (code);
  for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
    {
      if (fmt[i] == 'e')
        reload_combine_note_use (&XEXP (x, i), insn, ruid, containing_mem);
      else if (fmt[i] == 'E')
        {
          for (j = XVECLEN (x, i) - 1; j >= 0; j--)
            reload_combine_note_use (&XVECEXP (x, i, j), insn, ruid,
                                     containing_mem);
        }
    }
}
/* See if we can reduce the cost of a constant by replacing a move
   with an add.  We track situations in which a register is set to a
   constant or to a register plus a constant.  */
/* We cannot do our optimization across labels.  Invalidating all the
   information about register contents we have would be costly, so we
   use move2add_last_label_luid to note where the label is and then
   later disable any optimization that would cross it.
   reg_offset[n] / reg_base_reg[n] / reg_symbol_ref[n] / reg_mode[n]
   are only valid if reg_set_luid[n] is greater than
   move2add_last_label_luid.
   For a set that established a new (potential) base register with
   non-constant value, we use move2add_luid from the place where the
   setting insn is encountered; registers based off that base then
   get the same reg_set_luid.  Constants all get
   move2add_last_label_luid + 1 as their reg_set_luid.  */
static int reg_set_luid[FIRST_PSEUDO_REGISTER];

/* If reg_base_reg[n] is negative, register n has been set to
   reg_offset[n] or reg_symbol_ref[n] + reg_offset[n] in mode reg_mode[n].
   If reg_base_reg[n] is non-negative, register n has been set to the
   sum of reg_offset[n] and the value of register reg_base_reg[n]
   before reg_set_luid[n], calculated in mode reg_mode[n] .
   For multi-hard-register registers, all but the first one are
   recorded as BLKmode in reg_mode.  Setting reg_mode to VOIDmode
   marks it as invalid.  */
static HOST_WIDE_INT reg_offset[FIRST_PSEUDO_REGISTER];
static int reg_base_reg[FIRST_PSEUDO_REGISTER];
static rtx reg_symbol_ref[FIRST_PSEUDO_REGISTER];
static machine_mode reg_mode[FIRST_PSEUDO_REGISTER];

/* move2add_luid is linearly increased while scanning the instructions
   from first to last.  It is used to set reg_set_luid in
   reload_cse_move2add and move2add_note_store.  */
static int move2add_luid;

/* move2add_last_label_luid is set whenever a label is found.  Labels
   invalidate all previously collected reg_offset data.  */
static int move2add_last_label_luid;

/* ??? We don't know how zero / sign extension is handled, hence we
   can't go from a narrower to a wider mode.  */
#define MODES_OK_FOR_MOVE2ADD(OUTMODE, INMODE) \
  (GET_MODE_SIZE (OUTMODE) == GET_MODE_SIZE (INMODE) \
   || (GET_MODE_SIZE (OUTMODE) <= GET_MODE_SIZE (INMODE) \
       && TRULY_NOOP_TRUNCATION_MODES_P (OUTMODE, INMODE)))
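
/* For instance, a value recorded in SImode also validates a QImode use
   on a target where SImode-to-QImode truncation is a no-op, but an
   SImode record never validates a DImode use: the macro above never
   allows going from a narrower to a wider mode.  */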
/* Record that REG is being set to a value with the mode of REG.  */

static void
move2add_record_mode (rtx reg)
{
  int regno, nregs;
  machine_mode mode = GET_MODE (reg);

  if (GET_CODE (reg) == SUBREG)
    {
      regno = subreg_regno (reg);
      nregs = subreg_nregs (reg);
    }
  else if (REG_P (reg))
    {
      regno = REGNO (reg);
      nregs = REG_NREGS (reg);
    }
  else
    gcc_unreachable ();
  for (int i = nregs - 1; i > 0; i--)
    reg_mode[regno + i] = BLKmode;
  reg_mode[regno] = mode;
}
/* Record that REG is being set to the sum of SYM and OFF.  */

static void
move2add_record_sym_value (rtx reg, rtx sym, rtx off)
{
  int regno = REGNO (reg);

  move2add_record_mode (reg);
  reg_set_luid[regno] = move2add_luid;
  reg_base_reg[regno] = -1;
  reg_symbol_ref[regno] = sym;
  reg_offset[regno] = INTVAL (off);
}
/* Check if REGNO contains a valid value in MODE.  */

static bool
move2add_valid_value_p (int regno, machine_mode mode)
{
  if (reg_set_luid[regno] <= move2add_last_label_luid)
    return false;

  if (mode != reg_mode[regno])
    {
      if (!MODES_OK_FOR_MOVE2ADD (mode, reg_mode[regno]))
        return false;
      /* The value loaded into regno in reg_mode[regno] is also valid in
         mode after truncation only if (REG:mode regno) is the lowpart of
         (REG:reg_mode[regno] regno).  Now, for big endian, the starting
         regno of the lowpart might be different.  */
      int s_off = subreg_lowpart_offset (mode, reg_mode[regno]);
      s_off = subreg_regno_offset (regno, reg_mode[regno], s_off, mode);
      if (s_off != 0)
        /* We could in principle adjust regno, check reg_mode[regno] to be
           BLKmode, and return s_off to the caller (vs. -1 for failure),
           but we currently have no callers that could make use of this
           information.  */
        return false;
    }

  for (int i = hard_regno_nregs[regno][mode] - 1; i > 0; i--)
    if (reg_mode[regno + i] != BLKmode)
      return false;
  return true;
}
/* This function is called with INSN that sets REG to (SYM + OFF),
   while REG is known to already have value (SYM + offset).
   This function tries to change INSN into an add instruction
   (set (REG) (plus (REG) (OFF - offset))) using the known value.
   It also updates the information about REG's known value.
   Return true if we made a change.  */
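
/* Concretely (hypothetical RTL): if (reg:SI 0) is known to hold
   (const_int 100), then
       (set (reg:SI 0) (const_int 132))
   can be rewritten as
       (set (reg:SI 0) (plus:SI (reg:SI 0) (const_int 32)))
   when the add is cheaper than loading the wider constant.  */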
static bool
move2add_use_add2_insn (rtx reg, rtx sym, rtx off, rtx_insn *insn)
{
  rtx pat = PATTERN (insn);
  rtx src = SET_SRC (pat);
  int regno = REGNO (reg);
  rtx new_src = gen_int_mode (UINTVAL (off) - reg_offset[regno],
                              GET_MODE (reg));
  bool speed = optimize_bb_for_speed_p (BLOCK_FOR_INSN (insn));
  bool changed = false;

  /* (set (reg) (plus (reg) (const_int 0))) is not canonical;
     use (set (reg) (reg)) instead.
     We don't delete this insn, nor do we convert it into a
     note, to avoid losing register notes or the return
     value flag.  jump2 already knows how to get rid of
     no-op moves.  */
  if (new_src == const0_rtx)
    {
      /* If the constants are different, this is a
         truncation, that, if turned into (set (reg)
         (reg)), would be discarded.  Maybe we should
         try a truncMN pattern?  */
      if (INTVAL (off) == reg_offset [regno])
        changed = validate_change (insn, &SET_SRC (pat), reg, 0);
    }
  else
    {
      struct full_rtx_costs oldcst, newcst;
      rtx tem = gen_rtx_PLUS (GET_MODE (reg), reg, new_src);

      get_full_set_rtx_cost (pat, &oldcst);
      SET_SRC (pat) = tem;
      get_full_set_rtx_cost (pat, &newcst);
      SET_SRC (pat) = src;

      if (costs_lt_p (&newcst, &oldcst, speed)
          && have_add2_insn (reg, new_src))
        changed = validate_change (insn, &SET_SRC (pat), tem, 0);
      else if (sym == NULL_RTX && GET_MODE (reg) != BImode)
        {
          machine_mode narrow_mode;
          for (narrow_mode = GET_CLASS_NARROWEST_MODE (MODE_INT);
               narrow_mode != VOIDmode
                 && narrow_mode != GET_MODE (reg);
               narrow_mode = GET_MODE_WIDER_MODE (narrow_mode))
            {
              if (have_insn_for (STRICT_LOW_PART, narrow_mode)
                  && ((reg_offset[regno] & ~GET_MODE_MASK (narrow_mode))
                      == (INTVAL (off) & ~GET_MODE_MASK (narrow_mode))))
                {
                  rtx narrow_reg = gen_lowpart_common (narrow_mode, reg);
                  rtx narrow_src = gen_int_mode (INTVAL (off),
                                                 narrow_mode);
                  rtx new_set
                    = gen_rtx_SET (gen_rtx_STRICT_LOW_PART (VOIDmode,
                                                            narrow_reg),
                                   narrow_src);
                  get_full_set_rtx_cost (new_set, &newcst);
                  if (costs_lt_p (&newcst, &oldcst, speed))
                    {
                      changed = validate_change (insn, &PATTERN (insn),
                                                 new_set, 0);
                      if (changed)
                        break;
                    }
                }
            }
        }
    }
  move2add_record_sym_value (reg, sym, off);
  return changed;
}
/* This function is called with INSN that sets REG to (SYM + OFF),
   but REG doesn't have known value (SYM + offset).  This function
   tries to find another register which is known to already have
   value (SYM + offset) and change INSN into an add instruction
   (set (REG) (plus (the found register) (OFF - offset))) if such
   a register is found.  It also updates the information about
   REG's known value.
   Return true iff we made a change.  */
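
/* Sketch (hypothetical RTL): if (reg:SI 1) is known to hold
   (symbol_ref "x") plus 0, then
       (set (reg:SI 0) (const (plus (symbol_ref "x") (const_int 8))))
   can become
       (set (reg:SI 0) (plus:SI (reg:SI 1) (const_int 8)))
   choosing, among all registers known to hold "x" plus some offset,
   the one that yields the cheapest add.  */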
static bool
move2add_use_add3_insn (rtx reg, rtx sym, rtx off, rtx_insn *insn)
{
  rtx pat = PATTERN (insn);
  rtx src = SET_SRC (pat);
  int regno = REGNO (reg);
  int min_regno = 0;
  bool speed = optimize_bb_for_speed_p (BLOCK_FOR_INSN (insn));
  int i;
  bool changed = false;
  struct full_rtx_costs oldcst, newcst, mincst;
  rtx plus_expr;

  init_costs_to_max (&mincst);
  get_full_set_rtx_cost (pat, &oldcst);

  plus_expr = gen_rtx_PLUS (GET_MODE (reg), reg, const0_rtx);
  SET_SRC (pat) = plus_expr;

  for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
    if (move2add_valid_value_p (i, GET_MODE (reg))
        && reg_base_reg[i] < 0
        && reg_symbol_ref[i] != NULL_RTX
        && rtx_equal_p (sym, reg_symbol_ref[i]))
      {
        rtx new_src = gen_int_mode (UINTVAL (off) - reg_offset[i],
                                    GET_MODE (reg));
        /* (set (reg) (plus (reg) (const_int 0))) is not canonical;
           use (set (reg) (reg)) instead.
           We don't delete this insn, nor do we convert it into a
           note, to avoid losing register notes or the return
           value flag.  jump2 already knows how to get rid of
           no-op moves.  */
        if (new_src == const0_rtx)
          {
            init_costs_to_zero (&mincst);
            min_regno = i;
            break;
          }
        else
          {
            XEXP (plus_expr, 1) = new_src;
            get_full_set_rtx_cost (pat, &newcst);

            if (costs_lt_p (&newcst, &mincst, speed))
              {
                mincst = newcst;
                min_regno = i;
              }
          }
      }
  SET_SRC (pat) = src;

  if (costs_lt_p (&mincst, &oldcst, speed))
    {
      rtx tem;

      tem = gen_rtx_REG (GET_MODE (reg), min_regno);
      if (i != min_regno)
        {
          rtx new_src = gen_int_mode (UINTVAL (off) - reg_offset[min_regno],
                                      GET_MODE (reg));
          tem = gen_rtx_PLUS (GET_MODE (reg), tem, new_src);
        }
      if (validate_change (insn, &SET_SRC (pat), tem, 0))
        changed = true;
    }
  reg_set_luid[regno] = move2add_luid;
  move2add_record_sym_value (reg, sym, off);
  return changed;
}
1885 /* Convert move insns with constant inputs to additions if they are cheaper.
1886 Return true if any changes were made. */
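/* A minimal sketch of the basic idea (hypothetical register and
   constants): the second move in
     (set (reg:SI r1) (const_int 1000))
     ...
     (set (reg:SI r1) (const_int 1004))
   can become
     (set (reg:SI r1) (plus:SI (reg:SI r1) (const_int 4)))
   when the target's add is cheaper than materializing 1004 anew.  */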
1887 static bool
1888 reload_cse_move2add (rtx_insn *first)
1889 {
1890 int i;
1891 rtx_insn *insn;
1892 bool changed = false;
1894 for (i = FIRST_PSEUDO_REGISTER - 1; i >= 0; i--)
1895 {
1896 reg_set_luid[i] = 0;
1897 reg_offset[i] = 0;
1898 reg_base_reg[i] = 0;
1899 reg_symbol_ref[i] = NULL_RTX;
1900 reg_mode[i] = VOIDmode;
1901 }
1903 move2add_last_label_luid = 0;
1904 move2add_luid = 2;
1905 for (insn = first; insn; insn = NEXT_INSN (insn), move2add_luid++)
1906 {
1907 rtx pat, note;
1909 if (LABEL_P (insn))
1910 {
1911 move2add_last_label_luid = move2add_luid;
1912 /* We're going to increment move2add_luid twice after a
1913 label, so that we can use move2add_last_label_luid + 1 as
1914 the luid for constants.  */
1915 move2add_luid++;
1916 continue;
1917 }
1918 if (! INSN_P (insn))
1919 continue;
1920 pat = PATTERN (insn);
1921 /* For simplicity, we only perform this optimization on
1922 straightforward SETs.  */
1923 if (GET_CODE (pat) == SET
1924 && REG_P (SET_DEST (pat)))
1925 {
1926 rtx reg = SET_DEST (pat);
1927 int regno = REGNO (reg);
1928 rtx src = SET_SRC (pat);
1930 /* Check if we have valid information on the contents of this
1931 register in the mode of REG.  */
1932 if (move2add_valid_value_p (regno, GET_MODE (reg))
1933 && dbg_cnt (cse2_move2add))
1934 {
1935 /* Try to transform (set (REGX) (CONST_INT A))
1936 ...
1937 (set (REGX) (CONST_INT B))
1938 to
1939 (set (REGX) (CONST_INT A))
1940 ...
1941 (set (REGX) (plus (REGX) (CONST_INT B-A)))
1942 or
1943 (set (REGX) (CONST_INT A))
1944 ...
1945 (set (STRICT_LOW_PART (REGX)) (CONST_INT B))
1946 */
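/* Hypothetical illustration of the STRICT_LOW_PART variant: with r1
   known to hold 0x12345678, loading 0x12340042 changes only the low
   16 bits, so a target with a suitable strict_low_part insn can use
   roughly
     (set (strict_low_part (reg:HI r1)) (const_int 0x42))
   instead of materializing the full constant, when that is cheaper.  */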
1948 if (CONST_INT_P (src)
1949 && reg_base_reg[regno] < 0
1950 && reg_symbol_ref[regno] == NULL_RTX)
1951 {
1952 changed |= move2add_use_add2_insn (reg, NULL_RTX, src, insn);
1953 continue;
1954 }
1956 /* Try to transform (set (REGX) (REGY))
1957 (set (REGX) (PLUS (REGX) (CONST_INT A)))
1958 ...
1959 (set (REGX) (REGY))
1960 (set (REGX) (PLUS (REGX) (CONST_INT B)))
1961 to
1962 (set (REGX) (REGY))
1963 (set (REGX) (PLUS (REGX) (CONST_INT A)))
1964 ...
1965 (set (REGX) (plus (REGX) (CONST_INT B-A)))  */
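/* Worked example (hypothetical registers): if an earlier
     (set (reg:SI r2) (reg:SI r7))
     (set (reg:SI r2) (plus:SI (reg:SI r2) (const_int 8)))
   pair left r2 known as r7 + 8, then a later identical copy followed
   by an add of 20 can drop the copy and use
     (set (reg:SI r2) (plus:SI (reg:SI r2) (const_int 12)))
   since 20 - 8 = 12.  */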
1966 else if (REG_P (src)
1967 && reg_set_luid[regno] == reg_set_luid[REGNO (src)]
1968 && reg_base_reg[regno] == reg_base_reg[REGNO (src)]
1969 && move2add_valid_value_p (REGNO (src), GET_MODE (reg)))
1970 {
1971 rtx_insn *next = next_nonnote_nondebug_insn (insn);
1972 rtx set = NULL_RTX;
1973 if (next)
1974 set = single_set (next);
1975 if (set
1976 && SET_DEST (set) == reg
1977 && GET_CODE (SET_SRC (set)) == PLUS
1978 && XEXP (SET_SRC (set), 0) == reg
1979 && CONST_INT_P (XEXP (SET_SRC (set), 1)))
1980 {
1981 rtx src3 = XEXP (SET_SRC (set), 1);
1982 unsigned HOST_WIDE_INT added_offset = UINTVAL (src3);
1983 HOST_WIDE_INT base_offset = reg_offset[REGNO (src)];
1984 HOST_WIDE_INT regno_offset = reg_offset[regno];
1985 rtx new_src =
1986 gen_int_mode (added_offset
1987 + base_offset
1988 - regno_offset,
1989 GET_MODE (reg));
1990 bool success = false;
1991 bool speed = optimize_bb_for_speed_p (BLOCK_FOR_INSN (insn));
1993 if (new_src == const0_rtx)
1994 /* See above why we create (set (reg) (reg)) here.  */
1995 success
1996 = validate_change (next, &SET_SRC (set), reg, 0);
1997 else
1998 {
1999 rtx old_src = SET_SRC (set);
2000 struct full_rtx_costs oldcst, newcst;
2001 rtx tem = gen_rtx_PLUS (GET_MODE (reg), reg, new_src);
2003 get_full_set_rtx_cost (set, &oldcst);
2004 SET_SRC (set) = tem;
2005 get_full_set_src_cost (tem, GET_MODE (reg), &newcst);
2006 SET_SRC (set) = old_src;
2007 costs_add_n_insns (&oldcst, 1);
2009 if (costs_lt_p (&newcst, &oldcst, speed)
2010 && have_add2_insn (reg, new_src))
2011 {
2012 rtx newpat = gen_rtx_SET (reg, tem);
2013 success
2014 = validate_change (next, &PATTERN (next),
2015 newpat, 0);
2016 }
2017 }
2018 if (success)
2019 delete_insn (insn);
2020 changed |= success;
2021 insn = next;
2022 move2add_record_mode (reg);
2023 reg_offset[regno]
2024 = trunc_int_for_mode (added_offset + base_offset,
2025 GET_MODE (reg));
2026 continue;
2027 }
2028 }
2029 }
2031 /* Try to transform
2032 (set (REGX) (CONST (PLUS (SYMBOL_REF) (CONST_INT A))))
2033 ...
2034 (set (REGY) (CONST (PLUS (SYMBOL_REF) (CONST_INT B))))
2035 to
2036 (set (REGX) (CONST (PLUS (SYMBOL_REF) (CONST_INT A))))
2037 ...
2038 (set (REGY) (CONST (PLUS (REGX) (CONST_INT B-A))))  */
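/* Illustrative sketch (symbol and offsets hypothetical): once r4
   holds (const (plus (symbol_ref "arr") (const_int 4))), a later
     (set (reg:SI r6) (const:SI (plus:SI (symbol_ref:SI "arr") (const_int 24))))
   can become
     (set (reg:SI r6) (plus:SI (reg:SI r4) (const_int 20)))
   because 24 - 4 = 20, saving a second symbol load.  */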
2039 if ((GET_CODE (src) == SYMBOL_REF
2040 || (GET_CODE (src) == CONST
2041 && GET_CODE (XEXP (src, 0)) == PLUS
2042 && GET_CODE (XEXP (XEXP (src, 0), 0)) == SYMBOL_REF
2043 && CONST_INT_P (XEXP (XEXP (src, 0), 1))))
2044 && dbg_cnt (cse2_move2add))
2045 {
2046 rtx sym, off;
2048 if (GET_CODE (src) == SYMBOL_REF)
2049 {
2050 sym = src;
2051 off = const0_rtx;
2052 }
2053 else
2054 {
2055 sym = XEXP (XEXP (src, 0), 0);
2056 off = XEXP (XEXP (src, 0), 1);
2057 }
2059 /* If the reg already contains the value which is the sum of
2060 sym and some constant value, we can use an add2 insn.  */
2061 if (move2add_valid_value_p (regno, GET_MODE (reg))
2062 && reg_base_reg[regno] < 0
2063 && reg_symbol_ref[regno] != NULL_RTX
2064 && rtx_equal_p (sym, reg_symbol_ref[regno]))
2065 changed |= move2add_use_add2_insn (reg, sym, off, insn);
2067 /* Otherwise, we have to find a register whose value is the sum
2068 of sym and some constant value.  */
2069 else
2070 changed |= move2add_use_add3_insn (reg, sym, off, insn);
2072 continue;
2073 }
2074 }
2076 for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
2077 {
2078 if (REG_NOTE_KIND (note) == REG_INC
2079 && REG_P (XEXP (note, 0)))
2080 {
2081 /* Reset the information about this register.  */
2082 int regno = REGNO (XEXP (note, 0));
2083 if (regno < FIRST_PSEUDO_REGISTER)
2084 {
2085 move2add_record_mode (XEXP (note, 0));
2086 reg_mode[regno] = VOIDmode;
2087 }
2088 }
2089 }
2090 note_stores (PATTERN (insn), move2add_note_store, insn);
2092 /* If INSN is a conditional branch, we try to extract an
2093 implicit set out of it.  */
2094 if (any_condjump_p (insn))
2095 {
2096 rtx cnd = fis_get_condition (insn);
2098 if (cnd != NULL_RTX
2099 && GET_CODE (cnd) == NE
2100 && REG_P (XEXP (cnd, 0))
2101 && !reg_set_p (XEXP (cnd, 0), insn)
2102 /* The following two checks, which are also in
2103 move2add_note_store, are intended to reduce the
2104 number of calls to gen_rtx_SET to avoid memory
2105 allocation if possible.  */
2106 && SCALAR_INT_MODE_P (GET_MODE (XEXP (cnd, 0)))
2107 && REG_NREGS (XEXP (cnd, 0)) == 1
2108 && CONST_INT_P (XEXP (cnd, 1)))
2109 {
2110 rtx implicit_set =
2111 gen_rtx_SET (XEXP (cnd, 0), XEXP (cnd, 1));
2112 move2add_note_store (SET_DEST (implicit_set), implicit_set, insn);
2113 }
2114 }
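/* Rough illustration (hypothetical): for a branch on
   (ne (reg:SI r1) (const_int 0)), the fall-through path is reached
   only when r1 == 0, so the implicit (set (reg:SI r1) (const_int 0))
   is recorded as if it were a real store.  */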
2116 /* If this is a CALL_INSN, all call-used registers are assumed to
2117 hold unknown values afterwards.  */
2118 if (CALL_P (insn))
2119 {
2120 rtx link;
2122 for (i = FIRST_PSEUDO_REGISTER - 1; i >= 0; i--)
2123 {
2124 if (call_used_regs[i])
2125 /* Reset the information about this register.  */
2126 reg_mode[i] = VOIDmode;
2127 }
2129 for (link = CALL_INSN_FUNCTION_USAGE (insn); link;
2130 link = XEXP (link, 1))
2131 {
2132 rtx setuse = XEXP (link, 0);
2133 rtx usage_rtx = XEXP (setuse, 0);
2134 if (GET_CODE (setuse) == CLOBBER
2135 && REG_P (usage_rtx))
2136 {
2137 unsigned int end_regno = END_REGNO (usage_rtx);
2138 for (unsigned int r = REGNO (usage_rtx); r < end_regno; ++r)
2139 /* Reset the information about this register.  */
2140 reg_mode[r] = VOIDmode;
2141 }
2142 }
2143 }
2144 }
2145 return changed;
2146 }
2148 /* SET is a SET or CLOBBER that sets DST. DATA is the insn which
2149 contains SET.
2150 Update reg_set_luid, reg_offset and reg_base_reg accordingly.
2151 Called from reload_cse_move2add via note_stores. */
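/* For instance (hypothetical registers): after
     (set (reg:SI r1) (plus:SI (reg:SI r2) (const_int 4)))
   with r2 already tracked as (r2 + 0), r1 is recorded with base
   register r2 and offset 4, the sum of r2's offset and the constant.  */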
2153 static void
2154 move2add_note_store (rtx dst, const_rtx set, void *data)
2155 {
2156 rtx_insn *insn = (rtx_insn *) data;
2157 unsigned int regno = 0;
2158 machine_mode mode = GET_MODE (dst);
2160 /* Some targets do argument pushes without adding REG_INC notes.  */
2162 if (MEM_P (dst))
2163 {
2164 dst = XEXP (dst, 0);
2165 if (GET_CODE (dst) == PRE_INC || GET_CODE (dst) == POST_INC
2166 || GET_CODE (dst) == PRE_DEC || GET_CODE (dst) == POST_DEC)
2167 reg_mode[REGNO (XEXP (dst, 0))] = VOIDmode;
2168 return;
2169 }
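/* E.g. an argument push such as
     (set (mem:SI (pre_dec:SI (reg:SI sp))) (reg:SI r1))
   modifies sp with no REG_INC note (sp standing for the stack
   pointer's hard register), so sp's tracked value is dropped here.  */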
2171 if (GET_CODE (dst) == SUBREG)
2172 regno = subreg_regno (dst);
2173 else if (REG_P (dst))
2174 regno = REGNO (dst);
2175 else
2176 return;
2178 if (SCALAR_INT_MODE_P (mode)
2179 && GET_CODE (set) == SET)
2180 {
2181 rtx note, sym = NULL_RTX;
2182 rtx off;
2184 note = find_reg_equal_equiv_note (insn);
2185 if (note && GET_CODE (XEXP (note, 0)) == SYMBOL_REF)
2186 {
2187 sym = XEXP (note, 0);
2188 off = const0_rtx;
2189 }
2190 else if (note && GET_CODE (XEXP (note, 0)) == CONST
2191 && GET_CODE (XEXP (XEXP (note, 0), 0)) == PLUS
2192 && GET_CODE (XEXP (XEXP (XEXP (note, 0), 0), 0)) == SYMBOL_REF
2193 && CONST_INT_P (XEXP (XEXP (XEXP (note, 0), 0), 1)))
2194 {
2195 sym = XEXP (XEXP (XEXP (note, 0), 0), 0);
2196 off = XEXP (XEXP (XEXP (note, 0), 0), 1);
2197 }
2199 if (sym != NULL_RTX)
2200 {
2201 move2add_record_sym_value (dst, sym, off);
2202 return;
2203 }
2204 }
2206 if (SCALAR_INT_MODE_P (mode)
2207 && GET_CODE (set) == SET
2208 && GET_CODE (SET_DEST (set)) != ZERO_EXTRACT
2209 && GET_CODE (SET_DEST (set)) != STRICT_LOW_PART)
2210 {
2211 rtx src = SET_SRC (set);
2212 rtx base_reg;
2213 unsigned HOST_WIDE_INT offset;
2214 int base_regno;
2216 switch (GET_CODE (src))
2217 {
2218 case PLUS:
2219 if (REG_P (XEXP (src, 0)))
2220 {
2221 base_reg = XEXP (src, 0);
2223 if (CONST_INT_P (XEXP (src, 1)))
2224 offset = UINTVAL (XEXP (src, 1));
2225 else if (REG_P (XEXP (src, 1))
2226 && move2add_valid_value_p (REGNO (XEXP (src, 1)), mode))
2227 {
2228 if (reg_base_reg[REGNO (XEXP (src, 1))] < 0
2229 && reg_symbol_ref[REGNO (XEXP (src, 1))] == NULL_RTX)
2230 offset = reg_offset[REGNO (XEXP (src, 1))];
2231 /* Maybe the first register is known to be a
2232 constant.  */
2233 else if (move2add_valid_value_p (REGNO (base_reg), mode)
2234 && reg_base_reg[REGNO (base_reg)] < 0
2235 && reg_symbol_ref[REGNO (base_reg)] == NULL_RTX)
2236 {
2237 offset = reg_offset[REGNO (base_reg)];
2238 base_reg = XEXP (src, 1);
2239 }
2240 else
2241 goto invalidate;
2242 }
2243 else
2244 goto invalidate;
2246 break;
2247 }
2249 goto invalidate;
2251 case REG:
2252 base_reg = src;
2253 offset = 0;
2254 break;
2256 case CONST_INT:
2257 /* Start tracking the register as a constant.  */
2258 reg_base_reg[regno] = -1;
2259 reg_symbol_ref[regno] = NULL_RTX;
2260 reg_offset[regno] = INTVAL (SET_SRC (set));
2261 /* We assign the same luid to all registers set to constants.  */
2262 reg_set_luid[regno] = move2add_last_label_luid + 1;
2263 move2add_record_mode (dst);
2264 return;
2266 default:
2267 goto invalidate;
2268 }
2270 base_regno = REGNO (base_reg);
2271 /* If information about the base register is not valid, set it
2272 up as a new base register, pretending its value is known
2273 starting from the current insn.  */
2274 if (!move2add_valid_value_p (base_regno, mode))
2275 {
2276 reg_base_reg[base_regno] = base_regno;
2277 reg_symbol_ref[base_regno] = NULL_RTX;
2278 reg_offset[base_regno] = 0;
2279 reg_set_luid[base_regno] = move2add_luid;
2280 gcc_assert (GET_MODE (base_reg) == mode);
2281 move2add_record_mode (base_reg);
2282 }
2284 /* Copy base information from our base register.  */
2285 reg_set_luid[regno] = reg_set_luid[base_regno];
2286 reg_base_reg[regno] = reg_base_reg[base_regno];
2287 reg_symbol_ref[regno] = reg_symbol_ref[base_regno];
2289 /* Compute the sum of the offsets or constants.  */
2290 reg_offset[regno]
2291 = trunc_int_for_mode (offset + reg_offset[base_regno], mode);
2293 move2add_record_mode (dst);
2294 }
2295 else
2296 {
2297 invalidate:
2298 /* Invalidate the contents of the register.  */
2299 move2add_record_mode (dst);
2300 reg_mode[regno] = VOIDmode;
2301 }
2302 }
2304 namespace {
2306 const pass_data pass_data_postreload_cse =
2307 {
2308 RTL_PASS, /* type */
2309 "postreload", /* name */
2310 OPTGROUP_NONE, /* optinfo_flags */
2311 TV_RELOAD_CSE_REGS, /* tv_id */
2312 0, /* properties_required */
2313 0, /* properties_provided */
2314 0, /* properties_destroyed */
2315 0, /* todo_flags_start */
2316 TODO_df_finish, /* todo_flags_finish */
2317 };
2319 class pass_postreload_cse : public rtl_opt_pass
2320 {
2321 public:
2322 pass_postreload_cse (gcc::context *ctxt)
2323 : rtl_opt_pass (pass_data_postreload_cse, ctxt)
2324 {}
2326 /* opt_pass methods: */
2327 virtual bool gate (function *) { return (optimize > 0 && reload_completed); }
2329 virtual unsigned int execute (function *);
2331 }; // class pass_postreload_cse
2333 unsigned int
2334 pass_postreload_cse::execute (function *fun)
2335 {
2336 if (!dbg_cnt (postreload_cse))
2337 return 0;
2339 /* Do a very simple CSE pass over just the hard registers.  */
2340 reload_cse_regs (get_insns ());
2341 /* Reload_cse_regs can eliminate potentially-trapping MEMs.
2342 Remove any EH edges associated with them.  */
2343 if (fun->can_throw_non_call_exceptions
2344 && purge_all_dead_edges ())
2345 cleanup_cfg (0);
2347 return 0;
2348 }
2350 } // anon namespace
2352 rtl_opt_pass *
2353 make_pass_postreload_cse (gcc::context *ctxt)
2354 {
2355 return new pass_postreload_cse (ctxt);
2356 }
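/* This factory is what the pass manager calls when building the RTL
   pipeline; pass_postreload_cse itself is referenced from passes.def.  */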