Tighten up params of create_basic_block_structure
[official-gcc.git] / gcc / bt-load.c
blob41288fe66528b66a1147c3bc1a4148fd0893b0d0
2 /* Perform branch target register load optimizations.
3 Copyright (C) 2001-2014 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "rtl.h"
26 #include "hard-reg-set.h"
27 #include "regs.h"
28 #include "fibheap.h"
29 #include "target.h"
30 #include "expr.h"
31 #include "flags.h"
32 #include "insn-attr.h"
33 #include "function.h"
34 #include "except.h"
35 #include "tm_p.h"
36 #include "diagnostic-core.h"
37 #include "tree-pass.h"
38 #include "recog.h"
39 #include "df.h"
40 #include "cfgloop.h"
42 /* Target register optimizations - these are performed after reload. */
44 typedef struct btr_def_group_s
46 struct btr_def_group_s *next;
47 rtx src;
48 struct btr_def_s *members;
49 } *btr_def_group;
51 typedef struct btr_user_s
53 struct btr_user_s *next;
54 basic_block bb;
55 int luid;
56 rtx_insn *insn;
57 /* If INSN has a single use of a single branch register, then
58 USE points to it within INSN. If there is more than
59 one branch register use, or the use is in some way ambiguous,
60 then USE is NULL. */
61 rtx use;
62 int n_reaching_defs;
63 int first_reaching_def;
64 char other_use_this_block;
65 } *btr_user;
67 /* btr_def structs appear on three lists:
68 1. A list of all btr_def structures (head is
69 ALL_BTR_DEFS, linked by the NEXT field).
70 2. A list of branch reg definitions per basic block (head is
71 BB_BTR_DEFS[i], linked by the NEXT_THIS_BB field).
72 3. A list of all branch reg definitions belonging to the same
73 group (head is in a BTR_DEF_GROUP struct, linked by
74 NEXT_THIS_GROUP field). */
76 typedef struct btr_def_s
78 struct btr_def_s *next_this_bb;
79 struct btr_def_s *next_this_group;
80 basic_block bb;
81 int luid;
82 rtx_insn *insn;
83 int btr;
84 int cost;
85 /* For a branch register setting insn that has a constant
86 source (i.e. a label), group links together all the
87 insns with the same source. For other branch register
88 setting insns, group is NULL. */
89 btr_def_group group;
90 btr_user uses;
91 /* If this def has a reaching use which is not a simple use
92 in a branch instruction, then has_ambiguous_use will be true,
93 and we will not attempt to migrate this definition. */
94 char has_ambiguous_use;
95 /* live_range is an approximation to the true live range for this
96 def/use web, because it records the set of blocks that contain
97 the live range. There could be other live ranges for the same
98 branch register in that set of blocks, either in the block
99 containing the def (before the def), or in a block containing
100 a use (after the use). If there are such other live ranges, then
101 other_btr_uses_before_def or other_btr_uses_after_use must be set true
102 as appropriate. */
103 char other_btr_uses_before_def;
104 char other_btr_uses_after_use;
105 /* We set own_end when we have moved a definition into a dominator.
106 Thus, when a later combination removes this definition again, we know
107 to clear out trs_live_at_end again. */
108 char own_end;
109 bitmap live_range;
110 } *btr_def;
112 static int issue_rate;
114 static int basic_block_freq (const_basic_block);
115 static int insn_sets_btr_p (const rtx_insn *, int, int *);
116 static rtx *find_btr_use (rtx);
117 static int btr_referenced_p (rtx, rtx *);
118 static int find_btr_reference (rtx *, void *);
119 static void find_btr_def_group (btr_def_group *, btr_def);
120 static btr_def add_btr_def (fibheap_t, basic_block, int, rtx_insn *,
121 unsigned int, int, btr_def_group *);
122 static btr_user new_btr_user (basic_block, int, rtx_insn *);
123 static void dump_hard_reg_set (HARD_REG_SET);
124 static void dump_btrs_live (int);
125 static void note_other_use_this_block (unsigned int, btr_user);
126 static void compute_defs_uses_and_gen (fibheap_t, btr_def *,btr_user *,
127 sbitmap *, sbitmap *, HARD_REG_SET *);
128 static void compute_kill (sbitmap *, sbitmap *, HARD_REG_SET *);
129 static void compute_out (sbitmap *bb_out, sbitmap *, sbitmap *, int);
130 static void link_btr_uses (btr_def *, btr_user *, sbitmap *, sbitmap *, int);
131 static void build_btr_def_use_webs (fibheap_t);
132 static int block_at_edge_of_live_range_p (int, btr_def);
133 static void clear_btr_from_live_range (btr_def def);
134 static void add_btr_to_live_range (btr_def, int);
135 static void augment_live_range (bitmap, HARD_REG_SET *, basic_block,
136 basic_block, int);
137 static int choose_btr (HARD_REG_SET);
138 static void combine_btr_defs (btr_def, HARD_REG_SET *);
139 static void btr_def_live_range (btr_def, HARD_REG_SET *);
140 static void move_btr_def (basic_block, int, btr_def, bitmap, HARD_REG_SET *);
141 static int migrate_btr_def (btr_def, int);
142 static void migrate_btr_defs (enum reg_class, int);
143 static int can_move_up (const_basic_block, const rtx_insn *, int);
144 static void note_btr_set (rtx, const_rtx, void *);
146 /* The following code performs code motion of target load instructions
147 (instructions that set branch target registers), to move them
148 forward away from the branch instructions and out of loops (or,
149 more generally, from a more frequently executed place to a less
150 frequently executed place).
151 Moving target load instructions further in front of the branch
152 instruction that uses the target register value means that the hardware
153 has a better chance of preloading the instructions at the branch
154 target by the time the branch is reached. This avoids bubbles
155 when a taken branch needs to flush out the pipeline.
156 Moving target load instructions out of loops means they are executed
157 less frequently. */
159 /* An obstack to hold the def-use web data structures built up for
160 migrating branch target load instructions. */
161 static struct obstack migrate_btrl_obstack;
163 /* Array indexed by basic block number, giving the set of registers
164 live in that block. */
165 static HARD_REG_SET *btrs_live;
167 /* Array indexed by basic block number, giving the set of registers live at
168 the end of that block, including any uses by a final jump insn, if any. */
169 static HARD_REG_SET *btrs_live_at_end;
171 /* Set of all target registers that we are willing to allocate. */
172 static HARD_REG_SET all_btrs;
174 /* Provide lower and upper bounds for target register numbers, so that
175 we don't need to search through all the hard registers all the time. */
176 static int first_btr, last_btr;
180 /* Return an estimate of the frequency of execution of block bb. */
181 static int
182 basic_block_freq (const_basic_block bb)
184 return bb->frequency;
187 static rtx *btr_reference_found;
189 /* A subroutine of btr_referenced_p, called through for_each_rtx.
190 PREG is a pointer to an rtx that is to be excluded from the
191 traversal. If we find a reference to a target register anywhere
192 else, return 1, and put a pointer to it into btr_reference_found. */
193 static int
194 find_btr_reference (rtx *px, void *preg)
196 rtx x;
198 if (px == preg)
199 return -1;
200 x = *px;
201 if (!REG_P (x))
202 return 0;
203 if (overlaps_hard_reg_set_p (all_btrs, GET_MODE (x), REGNO (x)))
205 btr_reference_found = px;
206 return 1;
208 return -1;
211 /* Return nonzero if X references (sets or reads) any branch target register.
212 If EXCLUDEP is set, disregard any references within the rtx pointed to
213 by it. If returning nonzero, also set btr_reference_found as above. */
214 static int
215 btr_referenced_p (rtx x, rtx *excludep)
217 return for_each_rtx (&x, find_btr_reference, excludep);
220 /* Return true if insn is an instruction that sets a target register.
221 if CHECK_CONST is true, only return true if the source is constant.
222 If such a set is found and REGNO is nonzero, assign the register number
223 of the destination register to *REGNO. */
224 static int
225 insn_sets_btr_p (const rtx_insn *insn, int check_const, int *regno)
227 rtx set;
229 if (NONJUMP_INSN_P (insn)
230 && (set = single_set (insn)))
232 rtx dest = SET_DEST (set);
233 rtx src = SET_SRC (set);
235 if (GET_CODE (dest) == SUBREG)
236 dest = XEXP (dest, 0);
238 if (REG_P (dest)
239 && TEST_HARD_REG_BIT (all_btrs, REGNO (dest)))
241 gcc_assert (!btr_referenced_p (src, NULL));
243 if (!check_const || CONSTANT_P (src))
245 if (regno)
246 *regno = REGNO (dest);
247 return 1;
251 return 0;
254 /* Find and return a use of a target register within an instruction INSN. */
255 static rtx *
256 find_btr_use (rtx insn)
258 return btr_referenced_p (insn, NULL) ? btr_reference_found : NULL;
261 /* Find the group that the target register definition DEF belongs
262 to in the list starting with *ALL_BTR_DEF_GROUPS. If no such
263 group exists, create one. Add def to the group. */
264 static void
265 find_btr_def_group (btr_def_group *all_btr_def_groups, btr_def def)
267 if (insn_sets_btr_p (def->insn, 1, NULL))
269 btr_def_group this_group;
270 rtx def_src = SET_SRC (single_set (def->insn));
272 /* ?? This linear search is an efficiency concern, particularly
273 as the search will almost always fail to find a match. */
274 for (this_group = *all_btr_def_groups;
275 this_group != NULL;
276 this_group = this_group->next)
277 if (rtx_equal_p (def_src, this_group->src))
278 break;
280 if (!this_group)
282 this_group = XOBNEW (&migrate_btrl_obstack, struct btr_def_group_s);
283 this_group->src = def_src;
284 this_group->members = NULL;
285 this_group->next = *all_btr_def_groups;
286 *all_btr_def_groups = this_group;
288 def->group = this_group;
289 def->next_this_group = this_group->members;
290 this_group->members = def;
292 else
293 def->group = NULL;
296 /* Create a new target register definition structure, for a definition in
297 block BB, instruction INSN, and insert it into ALL_BTR_DEFS. Return
298 the new definition. */
299 static btr_def
300 add_btr_def (fibheap_t all_btr_defs, basic_block bb, int insn_luid,
301 rtx_insn *insn,
302 unsigned int dest_reg, int other_btr_uses_before_def,
303 btr_def_group *all_btr_def_groups)
305 btr_def this_def = XOBNEW (&migrate_btrl_obstack, struct btr_def_s);
306 this_def->bb = bb;
307 this_def->luid = insn_luid;
308 this_def->insn = insn;
309 this_def->btr = dest_reg;
310 this_def->cost = basic_block_freq (bb);
311 this_def->has_ambiguous_use = 0;
312 this_def->other_btr_uses_before_def = other_btr_uses_before_def;
313 this_def->other_btr_uses_after_use = 0;
314 this_def->next_this_bb = NULL;
315 this_def->next_this_group = NULL;
316 this_def->uses = NULL;
317 this_def->live_range = NULL;
318 find_btr_def_group (all_btr_def_groups, this_def);
320 fibheap_insert (all_btr_defs, -this_def->cost, this_def);
322 if (dump_file)
323 fprintf (dump_file,
324 "Found target reg definition: sets %u { bb %d, insn %d }%s priority %d\n",
325 dest_reg, bb->index, INSN_UID (insn),
326 (this_def->group ? "" : ":not const"), this_def->cost);
328 return this_def;
331 /* Create a new target register user structure, for a use in block BB,
332 instruction INSN. Return the new user. */
333 static btr_user
334 new_btr_user (basic_block bb, int insn_luid, rtx_insn *insn)
336 /* This instruction reads target registers. We need
337 to decide whether we can replace all target register
338 uses easily.
340 rtx *usep = find_btr_use (PATTERN (insn));
341 rtx use;
342 btr_user user = NULL;
344 if (usep)
346 int unambiguous_single_use;
348 /* We want to ensure that USE is the only use of a target
349 register in INSN, so that we know that to rewrite INSN to use
350 a different target register, all we have to do is replace USE. */
351 unambiguous_single_use = !btr_referenced_p (PATTERN (insn), usep);
352 if (!unambiguous_single_use)
353 usep = NULL;
355 use = usep ? *usep : NULL_RTX;
356 user = XOBNEW (&migrate_btrl_obstack, struct btr_user_s);
357 user->bb = bb;
358 user->luid = insn_luid;
359 user->insn = insn;
360 user->use = use;
361 user->other_use_this_block = 0;
362 user->next = NULL;
363 user->n_reaching_defs = 0;
364 user->first_reaching_def = -1;
366 if (dump_file)
368 fprintf (dump_file, "Uses target reg: { bb %d, insn %d }",
369 bb->index, INSN_UID (insn));
371 if (user->use)
372 fprintf (dump_file, ": unambiguous use of reg %d\n",
373 REGNO (user->use));
376 return user;
379 /* Write the contents of S to the dump file. */
380 static void
381 dump_hard_reg_set (HARD_REG_SET s)
383 int reg;
384 for (reg = 0; reg < FIRST_PSEUDO_REGISTER; reg++)
385 if (TEST_HARD_REG_BIT (s, reg))
386 fprintf (dump_file, " %d", reg);
389 /* Write the set of target regs live in block BB to the dump file. */
390 static void
391 dump_btrs_live (int bb)
393 fprintf (dump_file, "BB%d live:", bb);
394 dump_hard_reg_set (btrs_live[bb]);
395 fprintf (dump_file, "\n");
398 /* REGNO is the number of a branch target register that is being used or
399 set. USERS_THIS_BB is a list of preceding branch target register users;
400 If any of them use the same register, set their other_use_this_block
401 flag. */
402 static void
403 note_other_use_this_block (unsigned int regno, btr_user users_this_bb)
405 btr_user user;
407 for (user = users_this_bb; user != NULL; user = user->next)
408 if (user->use && REGNO (user->use) == regno)
409 user->other_use_this_block = 1;
412 typedef struct {
413 btr_user users_this_bb;
414 HARD_REG_SET btrs_written_in_block;
415 HARD_REG_SET btrs_live_in_block;
416 sbitmap bb_gen;
417 sbitmap *btr_defset;
418 } defs_uses_info;
420 /* Called via note_stores or directly to register stores into /
421 clobbers of a branch target register DEST that are not recognized as
422 straightforward definitions. DATA points to information about the
423 current basic block that needs updating. */
424 static void
425 note_btr_set (rtx dest, const_rtx set ATTRIBUTE_UNUSED, void *data)
427 defs_uses_info *info = (defs_uses_info *) data;
428 int regno, end_regno;
430 if (!REG_P (dest))
431 return;
432 regno = REGNO (dest);
433 end_regno = END_HARD_REGNO (dest);
434 for (; regno < end_regno; regno++)
435 if (TEST_HARD_REG_BIT (all_btrs, regno))
437 note_other_use_this_block (regno, info->users_this_bb);
438 SET_HARD_REG_BIT (info->btrs_written_in_block, regno);
439 SET_HARD_REG_BIT (info->btrs_live_in_block, regno);
440 bitmap_and_compl (info->bb_gen, info->bb_gen,
441 info->btr_defset[regno - first_btr]);
445 static void
446 compute_defs_uses_and_gen (fibheap_t all_btr_defs, btr_def *def_array,
447 btr_user *use_array, sbitmap *btr_defset,
448 sbitmap *bb_gen, HARD_REG_SET *btrs_written)
450 /* Scan the code building up the set of all defs and all uses.
451 For each target register, build the set of defs of that register.
452 For each block, calculate the set of target registers
453 written in that block.
454 Also calculate the set of btrs ever live in that block.
456 int i;
457 int insn_luid = 0;
458 btr_def_group all_btr_def_groups = NULL;
459 defs_uses_info info;
461 bitmap_vector_clear (bb_gen, last_basic_block_for_fn (cfun));
462 for (i = NUM_FIXED_BLOCKS; i < last_basic_block_for_fn (cfun); i++)
464 basic_block bb = BASIC_BLOCK_FOR_FN (cfun, i);
465 int reg;
466 btr_def defs_this_bb = NULL;
467 rtx_insn *insn;
468 rtx_insn *last;
469 int can_throw = 0;
471 info.users_this_bb = NULL;
472 info.bb_gen = bb_gen[i];
473 info.btr_defset = btr_defset;
475 CLEAR_HARD_REG_SET (info.btrs_live_in_block);
476 CLEAR_HARD_REG_SET (info.btrs_written_in_block);
477 for (reg = first_btr; reg <= last_btr; reg++)
478 if (TEST_HARD_REG_BIT (all_btrs, reg)
479 && REGNO_REG_SET_P (df_get_live_in (bb), reg))
480 SET_HARD_REG_BIT (info.btrs_live_in_block, reg);
482 for (insn = BB_HEAD (bb), last = NEXT_INSN (BB_END (bb));
483 insn != last;
484 insn = NEXT_INSN (insn), insn_luid++)
486 if (INSN_P (insn))
488 int regno;
489 int insn_uid = INSN_UID (insn);
491 if (insn_sets_btr_p (insn, 0, &regno))
493 btr_def def = add_btr_def (
494 all_btr_defs, bb, insn_luid, insn, regno,
495 TEST_HARD_REG_BIT (info.btrs_live_in_block, regno),
496 &all_btr_def_groups);
498 def_array[insn_uid] = def;
499 SET_HARD_REG_BIT (info.btrs_written_in_block, regno);
500 SET_HARD_REG_BIT (info.btrs_live_in_block, regno);
501 bitmap_and_compl (bb_gen[i], bb_gen[i],
502 btr_defset[regno - first_btr]);
503 bitmap_set_bit (bb_gen[i], insn_uid);
504 def->next_this_bb = defs_this_bb;
505 defs_this_bb = def;
506 bitmap_set_bit (btr_defset[regno - first_btr], insn_uid);
507 note_other_use_this_block (regno, info.users_this_bb);
509 /* Check for the blockage emitted by expand_nl_goto_receiver. */
510 else if (cfun->has_nonlocal_label
511 && GET_CODE (PATTERN (insn)) == UNSPEC_VOLATILE)
513 btr_user user;
515 /* Do the equivalent of calling note_other_use_this_block
516 for every target register. */
517 for (user = info.users_this_bb; user != NULL;
518 user = user->next)
519 if (user->use)
520 user->other_use_this_block = 1;
521 IOR_HARD_REG_SET (info.btrs_written_in_block, all_btrs);
522 IOR_HARD_REG_SET (info.btrs_live_in_block, all_btrs);
523 bitmap_clear (info.bb_gen);
525 else
527 if (btr_referenced_p (PATTERN (insn), NULL))
529 btr_user user = new_btr_user (bb, insn_luid, insn);
531 use_array[insn_uid] = user;
532 if (user->use)
533 SET_HARD_REG_BIT (info.btrs_live_in_block,
534 REGNO (user->use));
535 else
537 int reg;
538 for (reg = first_btr; reg <= last_btr; reg++)
539 if (TEST_HARD_REG_BIT (all_btrs, reg)
540 && refers_to_regno_p (reg, reg + 1, user->insn,
541 NULL))
543 note_other_use_this_block (reg,
544 info.users_this_bb);
545 SET_HARD_REG_BIT (info.btrs_live_in_block, reg);
547 note_stores (PATTERN (insn), note_btr_set, &info);
549 user->next = info.users_this_bb;
550 info.users_this_bb = user;
552 if (CALL_P (insn))
554 HARD_REG_SET *clobbered = &call_used_reg_set;
555 HARD_REG_SET call_saved;
556 rtx pat = PATTERN (insn);
557 int i;
559 /* Check for sibcall. */
560 if (GET_CODE (pat) == PARALLEL)
561 for (i = XVECLEN (pat, 0) - 1; i >= 0; i--)
562 if (ANY_RETURN_P (XVECEXP (pat, 0, i)))
564 COMPL_HARD_REG_SET (call_saved,
565 call_used_reg_set);
566 clobbered = &call_saved;
569 for (regno = first_btr; regno <= last_btr; regno++)
570 if (TEST_HARD_REG_BIT (*clobbered, regno))
571 note_btr_set (regno_reg_rtx[regno], NULL_RTX, &info);
577 COPY_HARD_REG_SET (btrs_live[i], info.btrs_live_in_block);
578 COPY_HARD_REG_SET (btrs_written[i], info.btrs_written_in_block);
580 REG_SET_TO_HARD_REG_SET (btrs_live_at_end[i], df_get_live_out (bb));
581 /* If this block ends in a jump insn, add any uses or even clobbers
582 of branch target registers that it might have. */
583 for (insn = BB_END (bb); insn != BB_HEAD (bb) && ! INSN_P (insn); )
584 insn = PREV_INSN (insn);
585 /* ??? for the fall-through edge, it would make sense to insert the
586 btr set on the edge, but that would require to split the block
587 early on so that we can distinguish between dominance from the fall
588 through edge - which can use the call-clobbered registers - from
589 dominance by the throw edge. */
590 if (can_throw_internal (insn))
592 HARD_REG_SET tmp;
594 COPY_HARD_REG_SET (tmp, call_used_reg_set);
595 AND_HARD_REG_SET (tmp, all_btrs);
596 IOR_HARD_REG_SET (btrs_live_at_end[i], tmp);
597 can_throw = 1;
599 if (can_throw || JUMP_P (insn))
601 int regno;
603 for (regno = first_btr; regno <= last_btr; regno++)
604 if (refers_to_regno_p (regno, regno+1, insn, NULL))
605 SET_HARD_REG_BIT (btrs_live_at_end[i], regno);
608 if (dump_file)
609 dump_btrs_live (i);
613 static void
614 compute_kill (sbitmap *bb_kill, sbitmap *btr_defset,
615 HARD_REG_SET *btrs_written)
617 int i;
618 int regno;
620 /* For each basic block, form the set BB_KILL - the set
621 of definitions that the block kills. */
622 bitmap_vector_clear (bb_kill, last_basic_block_for_fn (cfun));
623 for (i = NUM_FIXED_BLOCKS; i < last_basic_block_for_fn (cfun); i++)
625 for (regno = first_btr; regno <= last_btr; regno++)
626 if (TEST_HARD_REG_BIT (all_btrs, regno)
627 && TEST_HARD_REG_BIT (btrs_written[i], regno))
628 bitmap_ior (bb_kill[i], bb_kill[i],
629 btr_defset[regno - first_btr]);
633 static void
634 compute_out (sbitmap *bb_out, sbitmap *bb_gen, sbitmap *bb_kill, int max_uid)
636 /* Perform iterative dataflow:
637 Initially, for all blocks, BB_OUT = BB_GEN.
638 For each block,
639 BB_IN = union over predecessors of BB_OUT(pred)
640 BB_OUT = (BB_IN - BB_KILL) + BB_GEN
641 Iterate until the bb_out sets stop growing. */
642 int i;
643 int changed;
644 sbitmap bb_in = sbitmap_alloc (max_uid);
646 for (i = NUM_FIXED_BLOCKS; i < last_basic_block_for_fn (cfun); i++)
647 bitmap_copy (bb_out[i], bb_gen[i]);
649 changed = 1;
650 while (changed)
652 changed = 0;
653 for (i = NUM_FIXED_BLOCKS; i < last_basic_block_for_fn (cfun); i++)
655 bitmap_union_of_preds (bb_in, bb_out, BASIC_BLOCK_FOR_FN (cfun, i));
656 changed |= bitmap_ior_and_compl (bb_out[i], bb_gen[i],
657 bb_in, bb_kill[i]);
660 sbitmap_free (bb_in);
663 static void
664 link_btr_uses (btr_def *def_array, btr_user *use_array, sbitmap *bb_out,
665 sbitmap *btr_defset, int max_uid)
667 int i;
668 sbitmap reaching_defs = sbitmap_alloc (max_uid);
670 /* Link uses to the uses lists of all of their reaching defs.
671 Count up the number of reaching defs of each use. */
672 for (i = NUM_FIXED_BLOCKS; i < last_basic_block_for_fn (cfun); i++)
674 basic_block bb = BASIC_BLOCK_FOR_FN (cfun, i);
675 rtx_insn *insn;
676 rtx_insn *last;
678 bitmap_union_of_preds (reaching_defs, bb_out, BASIC_BLOCK_FOR_FN (cfun, i));
679 for (insn = BB_HEAD (bb), last = NEXT_INSN (BB_END (bb));
680 insn != last;
681 insn = NEXT_INSN (insn))
683 if (INSN_P (insn))
685 int insn_uid = INSN_UID (insn);
687 btr_def def = def_array[insn_uid];
688 btr_user user = use_array[insn_uid];
689 if (def != NULL)
691 /* Remove all reaching defs of regno except
692 for this one. */
693 bitmap_and_compl (reaching_defs, reaching_defs,
694 btr_defset[def->btr - first_btr]);
695 bitmap_set_bit (reaching_defs, insn_uid);
698 if (user != NULL)
700 /* Find all the reaching defs for this use. */
701 sbitmap reaching_defs_of_reg = sbitmap_alloc (max_uid);
702 unsigned int uid = 0;
703 sbitmap_iterator sbi;
705 if (user->use)
706 bitmap_and (
707 reaching_defs_of_reg,
708 reaching_defs,
709 btr_defset[REGNO (user->use) - first_btr]);
710 else
712 int reg;
714 bitmap_clear (reaching_defs_of_reg);
715 for (reg = first_btr; reg <= last_btr; reg++)
716 if (TEST_HARD_REG_BIT (all_btrs, reg)
717 && refers_to_regno_p (reg, reg + 1, user->insn,
718 NULL))
719 bitmap_or_and (reaching_defs_of_reg,
720 reaching_defs_of_reg,
721 reaching_defs,
722 btr_defset[reg - first_btr]);
724 EXECUTE_IF_SET_IN_BITMAP (reaching_defs_of_reg, 0, uid, sbi)
726 btr_def def = def_array[uid];
728 /* We now know that def reaches user. */
730 if (dump_file)
731 fprintf (dump_file,
732 "Def in insn %d reaches use in insn %d\n",
733 uid, insn_uid);
735 user->n_reaching_defs++;
736 if (!user->use)
737 def->has_ambiguous_use = 1;
738 if (user->first_reaching_def != -1)
739 { /* There is more than one reaching def. This is
740 a rare case, so just give up on this def/use
741 web when it occurs. */
742 def->has_ambiguous_use = 1;
743 def_array[user->first_reaching_def]
744 ->has_ambiguous_use = 1;
745 if (dump_file)
746 fprintf (dump_file,
747 "(use %d has multiple reaching defs)\n",
748 insn_uid);
750 else
751 user->first_reaching_def = uid;
752 if (user->other_use_this_block)
753 def->other_btr_uses_after_use = 1;
754 user->next = def->uses;
755 def->uses = user;
757 sbitmap_free (reaching_defs_of_reg);
760 if (CALL_P (insn))
762 int regno;
764 for (regno = first_btr; regno <= last_btr; regno++)
765 if (TEST_HARD_REG_BIT (all_btrs, regno)
766 && TEST_HARD_REG_BIT (call_used_reg_set, regno))
767 bitmap_and_compl (reaching_defs, reaching_defs,
768 btr_defset[regno - first_btr]);
773 sbitmap_free (reaching_defs);
776 static void
777 build_btr_def_use_webs (fibheap_t all_btr_defs)
779 const int max_uid = get_max_uid ();
780 btr_def *def_array = XCNEWVEC (btr_def, max_uid);
781 btr_user *use_array = XCNEWVEC (btr_user, max_uid);
782 sbitmap *btr_defset = sbitmap_vector_alloc (
783 (last_btr - first_btr) + 1, max_uid);
784 sbitmap *bb_gen = sbitmap_vector_alloc (last_basic_block_for_fn (cfun),
785 max_uid);
786 HARD_REG_SET *btrs_written = XCNEWVEC (HARD_REG_SET,
787 last_basic_block_for_fn (cfun));
788 sbitmap *bb_kill;
789 sbitmap *bb_out;
791 bitmap_vector_clear (btr_defset, (last_btr - first_btr) + 1);
793 compute_defs_uses_and_gen (all_btr_defs, def_array, use_array, btr_defset,
794 bb_gen, btrs_written);
796 bb_kill = sbitmap_vector_alloc (last_basic_block_for_fn (cfun), max_uid);
797 compute_kill (bb_kill, btr_defset, btrs_written);
798 free (btrs_written);
800 bb_out = sbitmap_vector_alloc (last_basic_block_for_fn (cfun), max_uid);
801 compute_out (bb_out, bb_gen, bb_kill, max_uid);
803 sbitmap_vector_free (bb_gen);
804 sbitmap_vector_free (bb_kill);
806 link_btr_uses (def_array, use_array, bb_out, btr_defset, max_uid);
808 sbitmap_vector_free (bb_out);
809 sbitmap_vector_free (btr_defset);
810 free (use_array);
811 free (def_array);
814 /* Return true if basic block BB contains the start or end of the
815 live range of the definition DEF, AND there are other live
816 ranges of the same target register that include BB. */
817 static int
818 block_at_edge_of_live_range_p (int bb, btr_def def)
820 if (def->other_btr_uses_before_def
821 && BASIC_BLOCK_FOR_FN (cfun, bb) == def->bb)
822 return 1;
823 else if (def->other_btr_uses_after_use)
825 btr_user user;
826 for (user = def->uses; user != NULL; user = user->next)
827 if (BASIC_BLOCK_FOR_FN (cfun, bb) == user->bb)
828 return 1;
830 return 0;
833 /* We are removing the def/use web DEF. The target register
834 used in this web is therefore no longer live in the live range
835 of this web, so remove it from the live set of all basic blocks
836 in the live range of the web.
837 Blocks at the boundary of the live range may contain other live
838 ranges for the same target register, so we have to be careful
839 to remove the target register from the live set of these blocks
840 only if they do not contain other live ranges for the same register. */
841 static void
842 clear_btr_from_live_range (btr_def def)
844 unsigned bb;
845 bitmap_iterator bi;
847 EXECUTE_IF_SET_IN_BITMAP (def->live_range, 0, bb, bi)
849 if ((!def->other_btr_uses_before_def
850 && !def->other_btr_uses_after_use)
851 || !block_at_edge_of_live_range_p (bb, def))
853 CLEAR_HARD_REG_BIT (btrs_live[bb], def->btr);
854 CLEAR_HARD_REG_BIT (btrs_live_at_end[bb], def->btr);
855 if (dump_file)
856 dump_btrs_live (bb);
859 if (def->own_end)
860 CLEAR_HARD_REG_BIT (btrs_live_at_end[def->bb->index], def->btr);
864 /* We are adding the def/use web DEF. Add the target register used
865 in this web to the live set of all of the basic blocks that contain
866 the live range of the web.
867 If OWN_END is set, also show that the register is live from our
868 definitions at the end of the basic block where it is defined. */
869 static void
870 add_btr_to_live_range (btr_def def, int own_end)
872 unsigned bb;
873 bitmap_iterator bi;
875 EXECUTE_IF_SET_IN_BITMAP (def->live_range, 0, bb, bi)
877 SET_HARD_REG_BIT (btrs_live[bb], def->btr);
878 SET_HARD_REG_BIT (btrs_live_at_end[bb], def->btr);
879 if (dump_file)
880 dump_btrs_live (bb);
882 if (own_end)
884 SET_HARD_REG_BIT (btrs_live_at_end[def->bb->index], def->btr);
885 def->own_end = 1;
889 /* Update a live range to contain the basic block NEW_BLOCK, and all
890 blocks on paths between the existing live range and NEW_BLOCK.
891 HEAD is a block contained in the existing live range that dominates
892 all other blocks in the existing live range.
893 Also add to the set BTRS_LIVE_IN_RANGE all target registers that
894 are live in the blocks that we add to the live range.
895 If FULL_RANGE is set, include the full live range of NEW_BB;
896 otherwise, if NEW_BB dominates HEAD_BB, only add registers that
897 are life at the end of NEW_BB for NEW_BB itself.
898 It is a precondition that either NEW_BLOCK dominates HEAD,or
899 HEAD dom NEW_BLOCK. This is used to speed up the
900 implementation of this function. */
901 static void
902 augment_live_range (bitmap live_range, HARD_REG_SET *btrs_live_in_range,
903 basic_block head_bb, basic_block new_bb, int full_range)
905 basic_block *worklist, *tos;
907 tos = worklist = XNEWVEC (basic_block, n_basic_blocks_for_fn (cfun) + 1);
909 if (dominated_by_p (CDI_DOMINATORS, new_bb, head_bb))
911 if (new_bb == head_bb)
913 if (full_range)
914 IOR_HARD_REG_SET (*btrs_live_in_range, btrs_live[new_bb->index]);
915 free (tos);
916 return;
918 *tos++ = new_bb;
920 else
922 edge e;
923 edge_iterator ei;
924 int new_block = new_bb->index;
926 gcc_assert (dominated_by_p (CDI_DOMINATORS, head_bb, new_bb));
928 IOR_HARD_REG_SET (*btrs_live_in_range, btrs_live[head_bb->index]);
929 bitmap_set_bit (live_range, new_block);
930 /* A previous btr migration could have caused a register to be
931 live just at the end of new_block which we need in full, so
932 use trs_live_at_end even if full_range is set. */
933 IOR_HARD_REG_SET (*btrs_live_in_range, btrs_live_at_end[new_block]);
934 if (full_range)
935 IOR_HARD_REG_SET (*btrs_live_in_range, btrs_live[new_block]);
936 if (dump_file)
938 fprintf (dump_file,
939 "Adding end of block %d and rest of %d to live range\n",
940 new_block, head_bb->index);
941 fprintf (dump_file,"Now live btrs are ");
942 dump_hard_reg_set (*btrs_live_in_range);
943 fprintf (dump_file, "\n");
945 FOR_EACH_EDGE (e, ei, head_bb->preds)
946 *tos++ = e->src;
949 while (tos != worklist)
951 basic_block bb = *--tos;
952 if (!bitmap_bit_p (live_range, bb->index))
954 edge e;
955 edge_iterator ei;
957 bitmap_set_bit (live_range, bb->index);
958 IOR_HARD_REG_SET (*btrs_live_in_range,
959 btrs_live[bb->index]);
960 /* A previous btr migration could have caused a register to be
961 live just at the end of a block which we need in full. */
962 IOR_HARD_REG_SET (*btrs_live_in_range,
963 btrs_live_at_end[bb->index]);
964 if (dump_file)
966 fprintf (dump_file,
967 "Adding block %d to live range\n", bb->index);
968 fprintf (dump_file,"Now live btrs are ");
969 dump_hard_reg_set (*btrs_live_in_range);
970 fprintf (dump_file, "\n");
973 FOR_EACH_EDGE (e, ei, bb->preds)
975 basic_block pred = e->src;
976 if (!bitmap_bit_p (live_range, pred->index))
977 *tos++ = pred;
982 free (worklist);
985 /* Return the most desirable target register that is not in
986 the set USED_BTRS. */
987 static int
988 choose_btr (HARD_REG_SET used_btrs)
990 int i;
992 if (!hard_reg_set_subset_p (all_btrs, used_btrs))
993 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
995 #ifdef REG_ALLOC_ORDER
996 int regno = reg_alloc_order[i];
997 #else
998 int regno = i;
999 #endif
1000 if (TEST_HARD_REG_BIT (all_btrs, regno)
1001 && !TEST_HARD_REG_BIT (used_btrs, regno))
1002 return regno;
1004 return -1;
1007 /* Calculate the set of basic blocks that contain the live range of
1008 the def/use web DEF.
1009 Also calculate the set of target registers that are live at time
1010 in this live range, but ignore the live range represented by DEF
1011 when calculating this set. */
1012 static void
1013 btr_def_live_range (btr_def def, HARD_REG_SET *btrs_live_in_range)
1015 if (!def->live_range)
1017 btr_user user;
1019 def->live_range = BITMAP_ALLOC (NULL);
1021 bitmap_set_bit (def->live_range, def->bb->index);
1022 COPY_HARD_REG_SET (*btrs_live_in_range,
1023 (flag_btr_bb_exclusive
1024 ? btrs_live : btrs_live_at_end)[def->bb->index]);
1026 for (user = def->uses; user != NULL; user = user->next)
1027 augment_live_range (def->live_range, btrs_live_in_range,
1028 def->bb, user->bb,
1029 (flag_btr_bb_exclusive
1030 || user->insn != BB_END (def->bb)
1031 || !JUMP_P (user->insn)));
1033 else
1035 /* def->live_range is accurate, but we need to recompute
1036 the set of target registers live over it, because migration
1037 of other PT instructions may have affected it.
1039 unsigned bb;
1040 unsigned def_bb = flag_btr_bb_exclusive ? -1 : def->bb->index;
1041 bitmap_iterator bi;
1043 CLEAR_HARD_REG_SET (*btrs_live_in_range);
1044 EXECUTE_IF_SET_IN_BITMAP (def->live_range, 0, bb, bi)
1046 IOR_HARD_REG_SET (*btrs_live_in_range,
1047 (def_bb == bb
1048 ? btrs_live_at_end : btrs_live) [bb]);
1051 if (!def->other_btr_uses_before_def &&
1052 !def->other_btr_uses_after_use)
1053 CLEAR_HARD_REG_BIT (*btrs_live_in_range, def->btr);
1056 /* Merge into the def/use web DEF any other def/use webs in the same
1057 group that are dominated by DEF, provided that there is a target
1058 register available to allocate to the merged web. */
1059 static void
1060 combine_btr_defs (btr_def def, HARD_REG_SET *btrs_live_in_range)
1062 btr_def other_def;
1064 for (other_def = def->group->members;
1065 other_def != NULL;
1066 other_def = other_def->next_this_group)
1068 if (other_def != def
1069 && other_def->uses != NULL
1070 && ! other_def->has_ambiguous_use
1071 && dominated_by_p (CDI_DOMINATORS, other_def->bb, def->bb))
1073 /* def->bb dominates the other def, so def and other_def could
1074 be combined. */
1075 /* Merge their live ranges, and get the set of
1076 target registers live over the merged range. */
1077 int btr;
1078 HARD_REG_SET combined_btrs_live;
1079 bitmap combined_live_range = BITMAP_ALLOC (NULL);
1080 btr_user user;
1082 if (other_def->live_range == NULL)
1084 HARD_REG_SET dummy_btrs_live_in_range;
1085 btr_def_live_range (other_def, &dummy_btrs_live_in_range);
1087 COPY_HARD_REG_SET (combined_btrs_live, *btrs_live_in_range);
1088 bitmap_copy (combined_live_range, def->live_range);
1090 for (user = other_def->uses; user != NULL; user = user->next)
1091 augment_live_range (combined_live_range, &combined_btrs_live,
1092 def->bb, user->bb,
1093 (flag_btr_bb_exclusive
1094 || user->insn != BB_END (def->bb)
1095 || !JUMP_P (user->insn)));
1097 btr = choose_btr (combined_btrs_live);
1098 if (btr != -1)
1100 /* We can combine them. */
1101 if (dump_file)
1102 fprintf (dump_file,
1103 "Combining def in insn %d with def in insn %d\n",
1104 INSN_UID (other_def->insn), INSN_UID (def->insn));
1106 def->btr = btr;
1107 user = other_def->uses;
1108 while (user != NULL)
1110 btr_user next = user->next;
1112 user->next = def->uses;
1113 def->uses = user;
1114 user = next;
1116 /* Combining def/use webs can make target registers live
1117 after uses where they previously were not. This means
1118 some REG_DEAD notes may no longer be correct. We could
1119 be more precise about this if we looked at the combined
1120 live range, but here I just delete any REG_DEAD notes
1121 in case they are no longer correct. */
1122 for (user = def->uses; user != NULL; user = user->next)
1123 remove_note (user->insn,
1124 find_regno_note (user->insn, REG_DEAD,
1125 REGNO (user->use)));
1126 clear_btr_from_live_range (other_def);
1127 other_def->uses = NULL;
1128 bitmap_copy (def->live_range, combined_live_range);
1129 if (other_def->btr == btr && other_def->other_btr_uses_after_use)
1130 def->other_btr_uses_after_use = 1;
1131 COPY_HARD_REG_SET (*btrs_live_in_range, combined_btrs_live);
1133 /* Delete the old target register initialization. */
1134 delete_insn (other_def->insn);
1137 BITMAP_FREE (combined_live_range);
1142 /* Move the definition DEF from its current position to basic
1143 block NEW_DEF_BB, and modify it to use branch target register BTR.
1144 Delete the old defining insn, and insert a new one in NEW_DEF_BB.
1145 Update all reaching uses of DEF in the RTL to use BTR.
1146 If this new position means that other defs in the
1147 same group can be combined with DEF then combine them. */
1148 static void
1149 move_btr_def (basic_block new_def_bb, int btr, btr_def def, bitmap live_range,
1150 HARD_REG_SET *btrs_live_in_range)
1152 /* We can move the instruction.
1153 Set a target register in block NEW_DEF_BB to the value
1154 needed for this target register definition.
1155 Replace all uses of the old target register definition by
1156 uses of the new definition. Delete the old definition. */
1157 basic_block b = new_def_bb;
1158 rtx_insn *insp = BB_HEAD (b);
1159 rtx_insn *old_insn = def->insn;
1160 rtx src;
1161 rtx btr_rtx;
1162 rtx_insn *new_insn;
1163 enum machine_mode btr_mode;
1164 btr_user user;
1165 rtx set;
1167 if (dump_file)
1168 fprintf(dump_file, "migrating to basic block %d, using reg %d\n",
1169 new_def_bb->index, btr);
1171 clear_btr_from_live_range (def);
1172 def->btr = btr;
1173 def->bb = new_def_bb;
1174 def->luid = 0;
1175 def->cost = basic_block_freq (new_def_bb);
1176 bitmap_copy (def->live_range, live_range);
1177 combine_btr_defs (def, btrs_live_in_range);
1178 btr = def->btr;
1179 def->other_btr_uses_before_def
1180 = TEST_HARD_REG_BIT (btrs_live[b->index], btr) ? 1 : 0;
1181 add_btr_to_live_range (def, 1);
1182 if (LABEL_P (insp))
1183 insp = NEXT_INSN (insp);
1184 /* N.B.: insp is expected to be NOTE_INSN_BASIC_BLOCK now. Some
1185 optimizations can result in insp being both first and last insn of
1186 its basic block. */
1187 /* ?? some assertions to check that insp is sensible? */
1189 if (def->other_btr_uses_before_def)
1191 insp = BB_END (b);
1192 for (insp = BB_END (b); ! INSN_P (insp); insp = PREV_INSN (insp))
1193 gcc_assert (insp != BB_HEAD (b));
1195 if (JUMP_P (insp) || can_throw_internal (insp))
1196 insp = PREV_INSN (insp);
1199 set = single_set (old_insn);
1200 src = SET_SRC (set);
1201 btr_mode = GET_MODE (SET_DEST (set));
1202 btr_rtx = gen_rtx_REG (btr_mode, btr);
1204 new_insn = as_a <rtx_insn *> (gen_move_insn (btr_rtx, src));
1206 /* Insert target register initialization at head of basic block. */
1207 def->insn = emit_insn_after (new_insn, insp);
1209 df_set_regs_ever_live (btr, true);
1211 if (dump_file)
1212 fprintf (dump_file, "New pt is insn %d, inserted after insn %d\n",
1213 INSN_UID (def->insn), INSN_UID (insp));
1215 /* Delete the old target register initialization. */
1216 delete_insn (old_insn);
1218 /* Replace each use of the old target register by a use of the new target
1219 register. */
1220 for (user = def->uses; user != NULL; user = user->next)
1222 /* Some extra work here to ensure consistent modes, because
1223 it seems that a target register REG rtx can be given a different
1224 mode depending on the context (surely that should not be
1225 the case?). */
1226 rtx replacement_rtx;
1227 if (GET_MODE (user->use) == GET_MODE (btr_rtx)
1228 || GET_MODE (user->use) == VOIDmode)
1229 replacement_rtx = btr_rtx;
1230 else
1231 replacement_rtx = gen_rtx_REG (GET_MODE (user->use), btr);
1232 validate_replace_rtx (user->use, replacement_rtx, user->insn);
1233 user->use = replacement_rtx;
1237 /* We anticipate intra-block scheduling to be done. See if INSN could move
1238 up within BB by N_INSNS. */
1239 static int
1240 can_move_up (const_basic_block bb, const rtx_insn *insn, int n_insns)
1242 while (insn != BB_HEAD (bb) && n_insns > 0)
1244 insn = PREV_INSN (insn);
1245 /* ??? What if we have an anti-dependency that actually prevents the
1246 scheduler from doing the move? We'd like to re-allocate the register,
1247 but not necessarily put the load into another basic block. */
1248 if (INSN_P (insn))
1249 n_insns--;
1251 return n_insns <= 0;
1254 /* Attempt to migrate the target register definition DEF to an
1255 earlier point in the flowgraph.
1257 It is a precondition of this function that DEF is migratable:
1258 i.e. it has a constant source, and all uses are unambiguous.
1260 Only migrations that reduce the cost of DEF will be made.
1261 MIN_COST is the lower bound on the cost of the DEF after migration.
1262 If we migrate DEF so that its cost falls below MIN_COST,
1263 then we do not attempt to migrate further. The idea is that
1264 we migrate definitions in a priority order based on their cost,
1265 when the cost of this definition falls below MIN_COST, then
1266 there is another definition with cost == MIN_COST which now
1267 has a higher priority than this definition.
1269 Return nonzero if there may be benefit from attempting to
1270 migrate this DEF further (i.e. we have reduced the cost below
1271 MIN_COST, but we may be able to reduce it further).
1272 Return zero if no further migration is possible. */
1273 static int
1274 migrate_btr_def (btr_def def, int min_cost)
1276 bitmap live_range;
1277 HARD_REG_SET btrs_live_in_range;
1278 int btr_used_near_def = 0;
1279 int def_basic_block_freq;
1280 basic_block attempt;
1281 int give_up = 0;
1282 int def_moved = 0;
1283 btr_user user;
1284 int def_latency;
1286 if (dump_file)
1287 fprintf (dump_file,
1288 "Attempting to migrate pt from insn %d (cost = %d, min_cost = %d) ... ",
1289 INSN_UID (def->insn), def->cost, min_cost);
1291 if (!def->group || def->has_ambiguous_use)
1292 /* These defs are not migratable. */
1294 if (dump_file)
1295 fprintf (dump_file, "it's not migratable\n");
1296 return 0;
1299 if (!def->uses)
1300 /* We have combined this def with another in the same group, so
1301 no need to consider it further.
1304 if (dump_file)
1305 fprintf (dump_file, "it's already combined with another pt\n");
1306 return 0;
1309 btr_def_live_range (def, &btrs_live_in_range);
1310 live_range = BITMAP_ALLOC (NULL);
1311 bitmap_copy (live_range, def->live_range);
1313 #ifdef INSN_SCHEDULING
1314 def_latency = insn_default_latency (def->insn) * issue_rate;
1315 #else
1316 def_latency = issue_rate;
1317 #endif
1319 for (user = def->uses; user != NULL; user = user->next)
1321 if (user->bb == def->bb
1322 && user->luid > def->luid
1323 && (def->luid + def_latency) > user->luid
1324 && ! can_move_up (def->bb, def->insn,
1325 (def->luid + def_latency) - user->luid))
1327 btr_used_near_def = 1;
1328 break;
1332 def_basic_block_freq = basic_block_freq (def->bb);
1334 for (attempt = get_immediate_dominator (CDI_DOMINATORS, def->bb);
1335 !give_up && attempt && attempt != ENTRY_BLOCK_PTR_FOR_FN (cfun)
1336 && def->cost >= min_cost;
1337 attempt = get_immediate_dominator (CDI_DOMINATORS, attempt))
1339 /* Try to move the instruction that sets the target register into
1340 basic block ATTEMPT. */
1341 int try_freq = basic_block_freq (attempt);
1342 edge_iterator ei;
1343 edge e;
1345 /* If ATTEMPT has abnormal edges, skip it. */
1346 FOR_EACH_EDGE (e, ei, attempt->succs)
1347 if (e->flags & EDGE_COMPLEX)
1348 break;
1349 if (e)
1350 continue;
1352 if (dump_file)
1353 fprintf (dump_file, "trying block %d ...", attempt->index);
1355 if (try_freq < def_basic_block_freq
1356 || (try_freq == def_basic_block_freq && btr_used_near_def))
1358 int btr;
1359 augment_live_range (live_range, &btrs_live_in_range, def->bb, attempt,
1360 flag_btr_bb_exclusive);
1361 if (dump_file)
1363 fprintf (dump_file, "Now btrs live in range are: ");
1364 dump_hard_reg_set (btrs_live_in_range);
1365 fprintf (dump_file, "\n");
1367 btr = choose_btr (btrs_live_in_range);
1368 if (btr != -1)
1370 move_btr_def (attempt, btr, def, live_range, &btrs_live_in_range);
1371 bitmap_copy (live_range, def->live_range);
1372 btr_used_near_def = 0;
1373 def_moved = 1;
1374 def_basic_block_freq = basic_block_freq (def->bb);
1376 else
1378 /* There are no free target registers available to move
1379 this far forward, so give up */
1380 give_up = 1;
1381 if (dump_file)
1382 fprintf (dump_file,
1383 "giving up because there are no free target registers\n");
1388 if (!def_moved)
1390 give_up = 1;
1391 if (dump_file)
1392 fprintf (dump_file, "failed to move\n");
1394 BITMAP_FREE (live_range);
1395 return !give_up;
1398 /* Attempt to move instructions that set target registers earlier
1399 in the flowgraph, away from their corresponding uses. */
1400 static void
1401 migrate_btr_defs (enum reg_class btr_class, int allow_callee_save)
1403 fibheap_t all_btr_defs = fibheap_new ();
1404 int reg;
1406 gcc_obstack_init (&migrate_btrl_obstack);
1407 if (dump_file)
1409 int i;
1411 for (i = NUM_FIXED_BLOCKS; i < last_basic_block_for_fn (cfun); i++)
1413 basic_block bb = BASIC_BLOCK_FOR_FN (cfun, i);
1414 fprintf (dump_file,
1415 "Basic block %d: count = %" PRId64
1416 " loop-depth = %d idom = %d\n",
1417 i, (int64_t) bb->count, bb_loop_depth (bb),
1418 get_immediate_dominator (CDI_DOMINATORS, bb)->index);
1422 CLEAR_HARD_REG_SET (all_btrs);
1423 for (first_btr = -1, reg = 0; reg < FIRST_PSEUDO_REGISTER; reg++)
1424 if (TEST_HARD_REG_BIT (reg_class_contents[(int) btr_class], reg)
1425 && (allow_callee_save || call_used_regs[reg]
1426 || df_regs_ever_live_p (reg)))
1428 SET_HARD_REG_BIT (all_btrs, reg);
1429 last_btr = reg;
1430 if (first_btr < 0)
1431 first_btr = reg;
1434 btrs_live = XCNEWVEC (HARD_REG_SET, last_basic_block_for_fn (cfun));
1435 btrs_live_at_end = XCNEWVEC (HARD_REG_SET, last_basic_block_for_fn (cfun));
1437 build_btr_def_use_webs (all_btr_defs);
1439 while (!fibheap_empty (all_btr_defs))
1441 btr_def def = (btr_def) fibheap_extract_min (all_btr_defs);
1442 int min_cost = -fibheap_min_key (all_btr_defs);
1443 if (migrate_btr_def (def, min_cost))
1445 fibheap_insert (all_btr_defs, -def->cost, (void *) def);
1446 if (dump_file)
1448 fprintf (dump_file,
1449 "Putting insn %d back on queue with priority %d\n",
1450 INSN_UID (def->insn), def->cost);
1453 else
1454 BITMAP_FREE (def->live_range);
1457 free (btrs_live);
1458 free (btrs_live_at_end);
1459 obstack_free (&migrate_btrl_obstack, NULL);
1460 fibheap_delete (all_btr_defs);
1463 static void
1464 branch_target_load_optimize (bool after_prologue_epilogue_gen)
1466 enum reg_class klass
1467 = (enum reg_class) targetm.branch_target_register_class ();
1468 if (klass != NO_REGS)
1470 /* Initialize issue_rate. */
1471 if (targetm.sched.issue_rate)
1472 issue_rate = targetm.sched.issue_rate ();
1473 else
1474 issue_rate = 1;
1476 if (!after_prologue_epilogue_gen)
1478 /* Build the CFG for migrate_btr_defs. */
1479 #if 1
1480 /* This may or may not be needed, depending on where we
1481 run this phase. */
1482 cleanup_cfg (optimize ? CLEANUP_EXPENSIVE : 0);
1483 #endif
1485 df_analyze ();
1488 /* Dominator info is also needed for migrate_btr_def. */
1489 calculate_dominance_info (CDI_DOMINATORS);
1490 migrate_btr_defs (klass,
1491 (targetm.branch_target_register_callee_saved
1492 (after_prologue_epilogue_gen)));
1494 free_dominance_info (CDI_DOMINATORS);
1498 namespace {
1500 const pass_data pass_data_branch_target_load_optimize1 =
1502 RTL_PASS, /* type */
1503 "btl1", /* name */
1504 OPTGROUP_NONE, /* optinfo_flags */
1505 TV_NONE, /* tv_id */
1506 0, /* properties_required */
1507 0, /* properties_provided */
1508 0, /* properties_destroyed */
1509 0, /* todo_flags_start */
1510 0, /* todo_flags_finish */
1513 class pass_branch_target_load_optimize1 : public rtl_opt_pass
1515 public:
1516 pass_branch_target_load_optimize1 (gcc::context *ctxt)
1517 : rtl_opt_pass (pass_data_branch_target_load_optimize1, ctxt)
1520 /* opt_pass methods: */
1521 virtual bool gate (function *) { return flag_branch_target_load_optimize; }
1522 virtual unsigned int execute (function *)
1524 branch_target_load_optimize (epilogue_completed);
1525 return 0;
1528 }; // class pass_branch_target_load_optimize1
1530 } // anon namespace
1532 rtl_opt_pass *
1533 make_pass_branch_target_load_optimize1 (gcc::context *ctxt)
1535 return new pass_branch_target_load_optimize1 (ctxt);
1539 namespace {
1541 const pass_data pass_data_branch_target_load_optimize2 =
1543 RTL_PASS, /* type */
1544 "btl2", /* name */
1545 OPTGROUP_NONE, /* optinfo_flags */
1546 TV_NONE, /* tv_id */
1547 0, /* properties_required */
1548 0, /* properties_provided */
1549 0, /* properties_destroyed */
1550 0, /* todo_flags_start */
1551 0, /* todo_flags_finish */
1554 class pass_branch_target_load_optimize2 : public rtl_opt_pass
1556 public:
1557 pass_branch_target_load_optimize2 (gcc::context *ctxt)
1558 : rtl_opt_pass (pass_data_branch_target_load_optimize2, ctxt)
1561 /* opt_pass methods: */
1562 virtual bool gate (function *)
1564 return (optimize > 0 && flag_branch_target_load_optimize2);
1567 virtual unsigned int execute (function *);
1569 }; // class pass_branch_target_load_optimize2
1571 unsigned int
1572 pass_branch_target_load_optimize2::execute (function *)
1574 static int warned = 0;
1576 /* Leave this a warning for now so that it is possible to experiment
1577 with running this pass twice. In 3.6, we should either make this
1578 an error, or use separate dump files. */
1579 if (flag_branch_target_load_optimize
1580 && flag_branch_target_load_optimize2
1581 && !warned)
1583 warning (0, "branch target register load optimization is not intended "
1584 "to be run twice");
1586 warned = 1;
1589 branch_target_load_optimize (epilogue_completed);
1590 return 0;
1593 } // anon namespace
1595 rtl_opt_pass *
1596 make_pass_branch_target_load_optimize2 (gcc::context *ctxt)
1598 return new pass_branch_target_load_optimize2 (ctxt);