1 /* Integrated Register Allocator. Changing code and generating moves.
2 Copyright (C) 2006-2018 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 /* When we have more one region, we need to change the original RTL
22 code after coloring. Let us consider two allocnos representing the
23 same pseudo-register outside and inside a region respectively.
24 They can get different hard-registers. The reload pass works on
25 pseudo registers basis and there is no way to say the reload that
26 pseudo could be in different registers and it is even more
27 difficult to say in what places of the code the pseudo should have
28 particular hard-registers. So in this case IRA has to create and
29 use a new pseudo-register inside the region and adds code to move
30 allocno values on the region's borders. This is done by the code
33 The code makes top-down traversal of the regions and generate new
34 pseudos and the move code on the region borders. In some
35 complicated cases IRA can create a new pseudo used temporarily to
36 move allocno values when a swap of values stored in two
37 hard-registers is needed (e.g. two allocnos representing different
38 pseudos outside region got respectively hard registers 1 and 2 and
39 the corresponding allocnos inside the region got respectively hard
40 registers 2 and 1). At this stage, the new pseudo is marked as
43 IRA still creates the pseudo-register and the moves on the region
44 borders even when the both corresponding allocnos were assigned to
45 the same hard-register. It is done because, if the reload pass for
46 some reason spills a pseudo-register representing the original
47 pseudo outside or inside the region, the effect will be smaller
48 because another pseudo will still be in the hard-register. In most
49 cases, this is better then spilling the original pseudo in its
50 whole live-range. If reload does not change the allocation for the
51 two pseudo-registers, the trivial move will be removed by
52 post-reload optimizations.
54 IRA does not generate a new pseudo and moves for the allocno values
55 if the both allocnos representing an original pseudo inside and
56 outside region assigned to the same hard register when the register
57 pressure in the region for the corresponding pressure class is less
58 than number of available hard registers for given pressure class.
60 IRA also does some optimizations to remove redundant moves which is
61 transformed into stores by the reload pass on CFG edges
62 representing exits from the region.
64 IRA tries to reduce duplication of code generated on CFG edges
65 which are enters and exits to/from regions by moving some code to
66 the edge sources or destinations when it is possible. */
70 #include "coretypes.h"
76 #include "insn-config.h"
88 /* Data used to emit live range split insns and to flattening IR. */
89 ira_emit_data_t ira_allocno_emit_data
;
91 /* Definitions for vectors of pointers. */
94 /* Pointers to data allocated for allocnos being created during
95 emitting. Usually there are quite few such allocnos because they
96 are created only for resolving loop in register shuffling. */
97 static vec
<void_p
> new_allocno_emit_data_vec
;
99 /* Allocate and initiate the emit data. */
101 ira_initiate_emit_data (void)
104 ira_allocno_iterator ai
;
106 ira_allocno_emit_data
107 = (ira_emit_data_t
) ira_allocate (ira_allocnos_num
108 * sizeof (struct ira_emit_data
));
109 memset (ira_allocno_emit_data
, 0,
110 ira_allocnos_num
* sizeof (struct ira_emit_data
));
111 FOR_EACH_ALLOCNO (a
, ai
)
112 ALLOCNO_ADD_DATA (a
) = ira_allocno_emit_data
+ ALLOCNO_NUM (a
);
113 new_allocno_emit_data_vec
.create (50);
117 /* Free the emit data. */
119 ira_finish_emit_data (void)
123 ira_allocno_iterator ai
;
125 ira_free (ira_allocno_emit_data
);
126 FOR_EACH_ALLOCNO (a
, ai
)
127 ALLOCNO_ADD_DATA (a
) = NULL
;
128 for (;new_allocno_emit_data_vec
.length () != 0;)
130 p
= new_allocno_emit_data_vec
.pop ();
133 new_allocno_emit_data_vec
.release ();
136 /* Create and return a new allocno with given REGNO and
137 LOOP_TREE_NODE. Allocate emit data for it. */
139 create_new_allocno (int regno
, ira_loop_tree_node_t loop_tree_node
)
143 a
= ira_create_allocno (regno
, false, loop_tree_node
);
144 ALLOCNO_ADD_DATA (a
) = ira_allocate (sizeof (struct ira_emit_data
));
145 memset (ALLOCNO_ADD_DATA (a
), 0, sizeof (struct ira_emit_data
));
146 new_allocno_emit_data_vec
.safe_push (ALLOCNO_ADD_DATA (a
));
152 /* See comments below. */
153 typedef struct move
*move_t
;
155 /* The structure represents an allocno move. Both allocnos have the
156 same original regno but different allocation. */
159 /* The allocnos involved in the move. */
160 ira_allocno_t from
, to
;
161 /* The next move in the move sequence. */
163 /* Used for finding dependencies. */
165 /* The size of the following array. */
167 /* Moves on which given move depends on. Dependency can be cyclic.
168 It means we need a temporary to generates the moves. Sequence
169 A1->A2, B1->B2 where A1 and B2 are assigned to reg R1 and A2 and
170 B1 are assigned to reg R2 is an example of the cyclic
173 /* First insn generated for the move. */
177 /* Array of moves (indexed by BB index) which should be put at the
178 start/end of the corresponding basic blocks. */
179 static move_t
*at_bb_start
, *at_bb_end
;
181 /* Max regno before renaming some pseudo-registers. For example, the
182 same pseudo-register can be renamed in a loop if its allocation is
183 different outside the loop. */
184 static int max_regno_before_changing
;
186 /* Return new move of allocnos TO and FROM. */
188 create_move (ira_allocno_t to
, ira_allocno_t from
)
192 move
= (move_t
) ira_allocate (sizeof (struct move
));
199 move
->visited_p
= false;
203 /* Free memory for MOVE and its dependencies. */
205 free_move (move_t move
)
207 if (move
->deps
!= NULL
)
208 ira_free (move
->deps
);
212 /* Free memory for list of the moves given by its HEAD. */
214 free_move_list (move_t head
)
218 for (; head
!= NULL
; head
= next
)
225 /* Return TRUE if the move list LIST1 and LIST2 are equal (two
226 moves are equal if they involve the same allocnos). */
228 eq_move_lists_p (move_t list1
, move_t list2
)
230 for (; list1
!= NULL
&& list2
!= NULL
;
231 list1
= list1
->next
, list2
= list2
->next
)
232 if (list1
->from
!= list2
->from
|| list1
->to
!= list2
->to
)
234 return list1
== list2
;
237 /* Print move list LIST into file F. */
239 print_move_list (FILE *f
, move_t list
)
241 for (; list
!= NULL
; list
= list
->next
)
242 fprintf (f
, " a%dr%d->a%dr%d",
243 ALLOCNO_NUM (list
->from
), ALLOCNO_REGNO (list
->from
),
244 ALLOCNO_NUM (list
->to
), ALLOCNO_REGNO (list
->to
));
248 extern void ira_debug_move_list (move_t list
);
250 /* Print move list LIST into stderr. */
252 ira_debug_move_list (move_t list
)
254 print_move_list (stderr
, list
);
257 /* This recursive function changes pseudo-registers in *LOC if it is
258 necessary. The function returns TRUE if a change was done. */
260 change_regs (rtx
*loc
)
262 int i
, regno
, result
= false;
267 if (*loc
== NULL_RTX
)
269 code
= GET_CODE (*loc
);
272 regno
= REGNO (*loc
);
273 if (regno
< FIRST_PSEUDO_REGISTER
)
275 if (regno
>= max_regno_before_changing
)
276 /* It is a shared register which was changed already. */
278 if (ira_curr_regno_allocno_map
[regno
] == NULL
)
280 reg
= allocno_emit_reg (ira_curr_regno_allocno_map
[regno
]);
287 fmt
= GET_RTX_FORMAT (code
);
288 for (i
= GET_RTX_LENGTH (code
) - 1; i
>= 0; i
--)
291 result
= change_regs (&XEXP (*loc
, i
)) || result
;
292 else if (fmt
[i
] == 'E')
296 for (j
= XVECLEN (*loc
, i
) - 1; j
>= 0; j
--)
297 result
= change_regs (&XVECEXP (*loc
, i
, j
)) || result
;
304 change_regs_in_insn (rtx_insn
**insn_ptr
)
307 bool result
= change_regs (&rtx
);
308 *insn_ptr
= as_a
<rtx_insn
*> (rtx
);
312 /* Attach MOVE to the edge E. The move is attached to the head of the
313 list if HEAD_P is TRUE. */
315 add_to_edge_list (edge e
, move_t move
, bool head_p
)
319 if (head_p
|| e
->aux
== NULL
)
321 move
->next
= (move_t
) e
->aux
;
326 for (last
= (move_t
) e
->aux
; last
->next
!= NULL
; last
= last
->next
)
333 /* Create and return new pseudo-register with the same attributes as
336 ira_create_new_reg (rtx original_reg
)
340 new_reg
= gen_reg_rtx (GET_MODE (original_reg
));
341 ORIGINAL_REGNO (new_reg
) = ORIGINAL_REGNO (original_reg
);
342 REG_USERVAR_P (new_reg
) = REG_USERVAR_P (original_reg
);
343 REG_POINTER (new_reg
) = REG_POINTER (original_reg
);
344 REG_ATTRS (new_reg
) = REG_ATTRS (original_reg
);
345 if (internal_flag_ira_verbose
> 3 && ira_dump_file
!= NULL
)
346 fprintf (ira_dump_file
, " Creating newreg=%i from oldreg=%i\n",
347 REGNO (new_reg
), REGNO (original_reg
));
348 ira_expand_reg_equiv ();
352 /* Return TRUE if loop given by SUBNODE inside the loop given by
355 subloop_tree_node_p (ira_loop_tree_node_t subnode
, ira_loop_tree_node_t node
)
357 for (; subnode
!= NULL
; subnode
= subnode
->parent
)
363 /* Set up member `reg' to REG for allocnos which has the same regno as
364 ALLOCNO and which are inside the loop corresponding to ALLOCNO. */
366 set_allocno_reg (ira_allocno_t allocno
, rtx reg
)
370 ira_loop_tree_node_t node
;
372 node
= ALLOCNO_LOOP_TREE_NODE (allocno
);
373 for (a
= ira_regno_allocno_map
[ALLOCNO_REGNO (allocno
)];
375 a
= ALLOCNO_NEXT_REGNO_ALLOCNO (a
))
376 if (subloop_tree_node_p (ALLOCNO_LOOP_TREE_NODE (a
), node
))
377 ALLOCNO_EMIT_DATA (a
)->reg
= reg
;
378 for (a
= ALLOCNO_CAP (allocno
); a
!= NULL
; a
= ALLOCNO_CAP (a
))
379 ALLOCNO_EMIT_DATA (a
)->reg
= reg
;
380 regno
= ALLOCNO_REGNO (allocno
);
383 if (a
== NULL
|| (a
= ALLOCNO_CAP (a
)) == NULL
)
388 a
= node
->regno_allocno_map
[regno
];
392 if (ALLOCNO_EMIT_DATA (a
)->child_renamed_p
)
394 ALLOCNO_EMIT_DATA (a
)->child_renamed_p
= true;
398 /* Return true if there is an entry to given loop not from its parent
399 (or grandparent) block. For example, it is possible for two
400 adjacent loops inside another loop. */
402 entered_from_non_parent_p (ira_loop_tree_node_t loop_node
)
404 ira_loop_tree_node_t bb_node
, src_loop_node
, parent
;
408 for (bb_node
= loop_node
->children
;
410 bb_node
= bb_node
->next
)
411 if (bb_node
->bb
!= NULL
)
413 FOR_EACH_EDGE (e
, ei
, bb_node
->bb
->preds
)
414 if (e
->src
!= ENTRY_BLOCK_PTR_FOR_FN (cfun
)
415 && (src_loop_node
= IRA_BB_NODE (e
->src
)->parent
) != loop_node
)
417 for (parent
= src_loop_node
->parent
;
419 parent
= parent
->parent
)
420 if (parent
== loop_node
)
423 /* That is an exit from a nested loop -- skip it. */
425 for (parent
= loop_node
->parent
;
427 parent
= parent
->parent
)
428 if (src_loop_node
== parent
)
437 /* Set up ENTERED_FROM_NON_PARENT_P for each loop region. */
439 setup_entered_from_non_parent_p (void)
444 ira_assert (current_loops
!= NULL
);
445 FOR_EACH_VEC_SAFE_ELT (get_loops (cfun
), i
, loop
)
446 if (ira_loop_nodes
[i
].regno_allocno_map
!= NULL
)
447 ira_loop_nodes
[i
].entered_from_non_parent_p
448 = entered_from_non_parent_p (&ira_loop_nodes
[i
]);
451 /* Return TRUE if move of SRC_ALLOCNO (assigned to hard register) to
452 DEST_ALLOCNO (assigned to memory) can be removed because it does
453 not change value of the destination. One possible reason for this
454 is the situation when SRC_ALLOCNO is not modified in the
455 corresponding loop. */
457 store_can_be_removed_p (ira_allocno_t src_allocno
, ira_allocno_t dest_allocno
)
459 int regno
, orig_regno
;
461 ira_loop_tree_node_t node
;
463 ira_assert (ALLOCNO_CAP_MEMBER (src_allocno
) == NULL
464 && ALLOCNO_CAP_MEMBER (dest_allocno
) == NULL
);
465 orig_regno
= ALLOCNO_REGNO (src_allocno
);
466 regno
= REGNO (allocno_emit_reg (dest_allocno
));
467 for (node
= ALLOCNO_LOOP_TREE_NODE (src_allocno
);
471 a
= node
->regno_allocno_map
[orig_regno
];
472 ira_assert (a
!= NULL
);
473 if (REGNO (allocno_emit_reg (a
)) == (unsigned) regno
)
474 /* We achieved the destination and everything is ok. */
476 else if (bitmap_bit_p (node
->modified_regnos
, orig_regno
))
478 else if (node
->entered_from_non_parent_p
)
479 /* If there is a path from a destination loop block to the
480 source loop header containing basic blocks of non-parents
481 (grandparents) of the source loop, we should have checked
482 modifications of the pseudo on this path too to decide
483 about possibility to remove the store. It could be done by
484 solving a data-flow problem. Unfortunately such global
485 solution would complicate IR flattening. Therefore we just
486 prohibit removal of the store in such complicated case. */
489 /* It is actually a loop entry -- do not remove the store. */
493 /* Generate and attach moves to the edge E. This looks at the final
494 regnos of allocnos living on the edge with the same original regno
495 to figure out when moves should be generated. */
497 generate_edge_moves (edge e
)
499 ira_loop_tree_node_t src_loop_node
, dest_loop_node
;
502 ira_allocno_t src_allocno
, dest_allocno
, *src_map
, *dest_map
;
504 bitmap regs_live_in_dest
, regs_live_out_src
;
506 src_loop_node
= IRA_BB_NODE (e
->src
)->parent
;
507 dest_loop_node
= IRA_BB_NODE (e
->dest
)->parent
;
509 if (src_loop_node
== dest_loop_node
)
511 src_map
= src_loop_node
->regno_allocno_map
;
512 dest_map
= dest_loop_node
->regno_allocno_map
;
513 regs_live_in_dest
= df_get_live_in (e
->dest
);
514 regs_live_out_src
= df_get_live_out (e
->src
);
515 EXECUTE_IF_SET_IN_REG_SET (regs_live_in_dest
,
516 FIRST_PSEUDO_REGISTER
, regno
, bi
)
517 if (bitmap_bit_p (regs_live_out_src
, regno
))
519 src_allocno
= src_map
[regno
];
520 dest_allocno
= dest_map
[regno
];
521 if (REGNO (allocno_emit_reg (src_allocno
))
522 == REGNO (allocno_emit_reg (dest_allocno
)))
524 /* Remove unnecessary stores at the region exit. We should do
525 this for readonly memory for sure and this is guaranteed by
526 that we never generate moves on region borders (see
527 checking in function change_loop). */
528 if (ALLOCNO_HARD_REGNO (dest_allocno
) < 0
529 && ALLOCNO_HARD_REGNO (src_allocno
) >= 0
530 && store_can_be_removed_p (src_allocno
, dest_allocno
))
532 ALLOCNO_EMIT_DATA (src_allocno
)->mem_optimized_dest
= dest_allocno
;
533 ALLOCNO_EMIT_DATA (dest_allocno
)->mem_optimized_dest_p
= true;
534 if (internal_flag_ira_verbose
> 3 && ira_dump_file
!= NULL
)
535 fprintf (ira_dump_file
, " Remove r%d:a%d->a%d(mem)\n",
536 regno
, ALLOCNO_NUM (src_allocno
),
537 ALLOCNO_NUM (dest_allocno
));
540 move
= create_move (dest_allocno
, src_allocno
);
541 add_to_edge_list (e
, move
, true);
545 /* Bitmap of allocnos local for the current loop. */
546 static bitmap local_allocno_bitmap
;
548 /* This bitmap is used to find that we need to generate and to use a
549 new pseudo-register when processing allocnos with the same original
551 static bitmap used_regno_bitmap
;
553 /* This bitmap contains regnos of allocnos which were renamed locally
554 because the allocnos correspond to disjoint live ranges in loops
555 with a common parent. */
556 static bitmap renamed_regno_bitmap
;
558 /* Change (if necessary) pseudo-registers inside loop given by loop
561 change_loop (ira_loop_tree_node_t node
)
567 ira_allocno_t allocno
, parent_allocno
, *map
;
570 enum reg_class aclass
, pclass
;
571 ira_loop_tree_node_t parent
;
573 if (node
!= ira_loop_tree_root
)
575 ira_assert (current_loops
!= NULL
);
577 if (node
->bb
!= NULL
)
579 FOR_BB_INSNS (node
->bb
, insn
)
580 if (INSN_P (insn
) && change_regs_in_insn (&insn
))
582 df_insn_rescan (insn
);
583 df_notes_rescan (insn
);
588 if (internal_flag_ira_verbose
> 3 && ira_dump_file
!= NULL
)
589 fprintf (ira_dump_file
,
590 " Changing RTL for loop %d (header bb%d)\n",
591 node
->loop_num
, node
->loop
->header
->index
);
593 parent
= ira_curr_loop_tree_node
->parent
;
594 map
= parent
->regno_allocno_map
;
595 EXECUTE_IF_SET_IN_REG_SET (ira_curr_loop_tree_node
->border_allocnos
,
598 allocno
= ira_allocnos
[i
];
599 regno
= ALLOCNO_REGNO (allocno
);
600 aclass
= ALLOCNO_CLASS (allocno
);
601 pclass
= ira_pressure_class_translate
[aclass
];
602 parent_allocno
= map
[regno
];
603 ira_assert (regno
< ira_reg_equiv_len
);
604 /* We generate the same hard register move because the
605 reload pass can put an allocno into memory in this case
606 we will have live range splitting. If it does not happen
607 such the same hard register moves will be removed. The
608 worst case when the both allocnos are put into memory by
609 the reload is very rare. */
610 if (parent_allocno
!= NULL
611 && (ALLOCNO_HARD_REGNO (allocno
)
612 == ALLOCNO_HARD_REGNO (parent_allocno
))
613 && (ALLOCNO_HARD_REGNO (allocno
) < 0
614 || (parent
->reg_pressure
[pclass
] + 1
615 <= ira_class_hard_regs_num
[pclass
])
616 || TEST_HARD_REG_BIT (ira_prohibited_mode_move_regs
617 [ALLOCNO_MODE (allocno
)],
618 ALLOCNO_HARD_REGNO (allocno
))
619 /* don't create copies because reload can spill an
620 allocno set by copy although the allocno will not
622 || ira_equiv_no_lvalue_p (regno
)
623 || (pic_offset_table_rtx
!= NULL
624 && (ALLOCNO_REGNO (allocno
)
625 == (int) REGNO (pic_offset_table_rtx
)))))
627 original_reg
= allocno_emit_reg (allocno
);
628 if (parent_allocno
== NULL
629 || (REGNO (allocno_emit_reg (parent_allocno
))
630 == REGNO (original_reg
)))
632 if (internal_flag_ira_verbose
> 3 && ira_dump_file
)
633 fprintf (ira_dump_file
, " %i vs parent %i:",
634 ALLOCNO_HARD_REGNO (allocno
),
635 ALLOCNO_HARD_REGNO (parent_allocno
));
636 set_allocno_reg (allocno
, ira_create_new_reg (original_reg
));
640 /* Rename locals: Local allocnos with same regno in different loops
641 might get the different hard register. So we need to change
643 bitmap_and_compl (local_allocno_bitmap
,
644 ira_curr_loop_tree_node
->all_allocnos
,
645 ira_curr_loop_tree_node
->border_allocnos
);
646 EXECUTE_IF_SET_IN_REG_SET (local_allocno_bitmap
, 0, i
, bi
)
648 allocno
= ira_allocnos
[i
];
649 regno
= ALLOCNO_REGNO (allocno
);
650 if (ALLOCNO_CAP_MEMBER (allocno
) != NULL
)
652 used_p
= !bitmap_set_bit (used_regno_bitmap
, regno
);
653 ALLOCNO_EMIT_DATA (allocno
)->somewhere_renamed_p
= true;
656 bitmap_set_bit (renamed_regno_bitmap
, regno
);
657 set_allocno_reg (allocno
, ira_create_new_reg (allocno_emit_reg (allocno
)));
661 /* Process to set up flag somewhere_renamed_p. */
663 set_allocno_somewhere_renamed_p (void)
666 ira_allocno_t allocno
;
667 ira_allocno_iterator ai
;
669 FOR_EACH_ALLOCNO (allocno
, ai
)
671 regno
= ALLOCNO_REGNO (allocno
);
672 if (bitmap_bit_p (renamed_regno_bitmap
, regno
)
673 && REGNO (allocno_emit_reg (allocno
)) == regno
)
674 ALLOCNO_EMIT_DATA (allocno
)->somewhere_renamed_p
= true;
678 /* Return TRUE if move lists on all edges given in vector VEC are
681 eq_edge_move_lists_p (vec
<edge
, va_gc
> *vec
)
686 list
= (move_t
) EDGE_I (vec
, 0)->aux
;
687 for (i
= EDGE_COUNT (vec
) - 1; i
> 0; i
--)
688 if (! eq_move_lists_p (list
, (move_t
) EDGE_I (vec
, i
)->aux
))
693 /* Look at all entry edges (if START_P) or exit edges of basic block
694 BB and put move lists at the BB start or end if it is possible. In
695 other words, this decreases code duplication of allocno moves. */
697 unify_moves (basic_block bb
, bool start_p
)
702 vec
<edge
, va_gc
> *vec
;
704 vec
= (start_p
? bb
->preds
: bb
->succs
);
705 if (EDGE_COUNT (vec
) == 0 || ! eq_edge_move_lists_p (vec
))
708 list
= (move_t
) e
->aux
;
709 if (! start_p
&& control_flow_insn_p (BB_END (bb
)))
712 for (i
= EDGE_COUNT (vec
) - 1; i
> 0; i
--)
715 free_move_list ((move_t
) e
->aux
);
719 at_bb_start
[bb
->index
] = list
;
721 at_bb_end
[bb
->index
] = list
;
724 /* Last move (in move sequence being processed) setting up the
725 corresponding hard register. */
726 static move_t hard_regno_last_set
[FIRST_PSEUDO_REGISTER
];
728 /* If the element value is equal to CURR_TICK then the corresponding
729 element in `hard_regno_last_set' is defined and correct. */
730 static int hard_regno_last_set_check
[FIRST_PSEUDO_REGISTER
];
732 /* Last move (in move sequence being processed) setting up the
733 corresponding allocno. */
734 static move_t
*allocno_last_set
;
736 /* If the element value is equal to CURR_TICK then the corresponding
737 element in . `allocno_last_set' is defined and correct. */
738 static int *allocno_last_set_check
;
740 /* Definition of vector of moves. */
742 /* This vec contains moves sorted topologically (depth-first) on their
744 static vec
<move_t
> move_vec
;
746 /* The variable value is used to check correctness of values of
747 elements of arrays `hard_regno_last_set' and
748 `allocno_last_set_check'. */
749 static int curr_tick
;
751 /* This recursive function traverses dependencies of MOVE and produces
752 topological sorting (in depth-first order). */
754 traverse_moves (move_t move
)
760 move
->visited_p
= true;
761 for (i
= move
->deps_num
- 1; i
>= 0; i
--)
762 traverse_moves (move
->deps
[i
]);
763 move_vec
.safe_push (move
);
766 /* Remove unnecessary moves in the LIST, makes topological sorting,
767 and removes cycles on hard reg dependencies by introducing new
768 allocnos assigned to memory and additional moves. It returns the
771 modify_move_list (move_t list
)
773 int i
, n
, nregs
, hard_regno
;
774 ira_allocno_t to
, from
;
775 move_t move
, new_move
, set_move
, first
, last
;
779 /* Create move deps. */
781 for (move
= list
; move
!= NULL
; move
= move
->next
)
784 if ((hard_regno
= ALLOCNO_HARD_REGNO (to
)) < 0)
786 nregs
= hard_regno_nregs (hard_regno
, ALLOCNO_MODE (to
));
787 for (i
= 0; i
< nregs
; i
++)
789 hard_regno_last_set
[hard_regno
+ i
] = move
;
790 hard_regno_last_set_check
[hard_regno
+ i
] = curr_tick
;
793 for (move
= list
; move
!= NULL
; move
= move
->next
)
797 if ((hard_regno
= ALLOCNO_HARD_REGNO (from
)) >= 0)
799 nregs
= hard_regno_nregs (hard_regno
, ALLOCNO_MODE (from
));
800 for (n
= i
= 0; i
< nregs
; i
++)
801 if (hard_regno_last_set_check
[hard_regno
+ i
] == curr_tick
802 && (ALLOCNO_REGNO (hard_regno_last_set
[hard_regno
+ i
]->to
)
803 != ALLOCNO_REGNO (from
)))
805 move
->deps
= (move_t
*) ira_allocate (n
* sizeof (move_t
));
806 for (n
= i
= 0; i
< nregs
; i
++)
807 if (hard_regno_last_set_check
[hard_regno
+ i
] == curr_tick
808 && (ALLOCNO_REGNO (hard_regno_last_set
[hard_regno
+ i
]->to
)
809 != ALLOCNO_REGNO (from
)))
810 move
->deps
[n
++] = hard_regno_last_set
[hard_regno
+ i
];
814 /* Topological sorting: */
815 move_vec
.truncate (0);
816 for (move
= list
; move
!= NULL
; move
= move
->next
)
817 traverse_moves (move
);
819 for (i
= (int) move_vec
.length () - 1; i
>= 0; i
--)
827 first
= move_vec
.last ();
828 /* Removing cycles: */
830 move_vec
.truncate (0);
831 for (move
= first
; move
!= NULL
; move
= move
->next
)
835 if ((hard_regno
= ALLOCNO_HARD_REGNO (from
)) >= 0)
837 nregs
= hard_regno_nregs (hard_regno
, ALLOCNO_MODE (from
));
838 for (i
= 0; i
< nregs
; i
++)
839 if (hard_regno_last_set_check
[hard_regno
+ i
] == curr_tick
840 && ALLOCNO_HARD_REGNO
841 (hard_regno_last_set
[hard_regno
+ i
]->to
) >= 0)
844 ira_allocno_t new_allocno
;
846 set_move
= hard_regno_last_set
[hard_regno
+ i
];
847 /* It does not matter what loop_tree_node (of TO or
848 FROM) to use for the new allocno because of
849 subsequent IRA internal representation
852 = create_new_allocno (ALLOCNO_REGNO (set_move
->to
),
853 ALLOCNO_LOOP_TREE_NODE (set_move
->to
));
854 ALLOCNO_MODE (new_allocno
) = ALLOCNO_MODE (set_move
->to
);
855 ira_set_allocno_class (new_allocno
,
856 ALLOCNO_CLASS (set_move
->to
));
857 ira_create_allocno_objects (new_allocno
);
858 ALLOCNO_ASSIGNED_P (new_allocno
) = true;
859 ALLOCNO_HARD_REGNO (new_allocno
) = -1;
860 ALLOCNO_EMIT_DATA (new_allocno
)->reg
861 = ira_create_new_reg (allocno_emit_reg (set_move
->to
));
863 /* Make it possibly conflicting with all earlier
864 created allocnos. Cases where temporary allocnos
865 created to remove the cycles are quite rare. */
866 n
= ALLOCNO_NUM_OBJECTS (new_allocno
);
867 gcc_assert (n
== ALLOCNO_NUM_OBJECTS (set_move
->to
));
868 for (j
= 0; j
< n
; j
++)
870 ira_object_t new_obj
= ALLOCNO_OBJECT (new_allocno
, j
);
872 OBJECT_MIN (new_obj
) = 0;
873 OBJECT_MAX (new_obj
) = ira_objects_num
- 1;
876 new_move
= create_move (set_move
->to
, new_allocno
);
877 set_move
->to
= new_allocno
;
878 move_vec
.safe_push (new_move
);
879 ira_move_loops_num
++;
880 if (internal_flag_ira_verbose
> 2 && ira_dump_file
!= NULL
)
881 fprintf (ira_dump_file
,
882 " Creating temporary allocno a%dr%d\n",
883 ALLOCNO_NUM (new_allocno
),
884 REGNO (allocno_emit_reg (new_allocno
)));
887 if ((hard_regno
= ALLOCNO_HARD_REGNO (to
)) < 0)
889 nregs
= hard_regno_nregs (hard_regno
, ALLOCNO_MODE (to
));
890 for (i
= 0; i
< nregs
; i
++)
892 hard_regno_last_set
[hard_regno
+ i
] = move
;
893 hard_regno_last_set_check
[hard_regno
+ i
] = curr_tick
;
896 for (i
= (int) move_vec
.length () - 1; i
>= 0; i
--)
906 /* Generate RTX move insns from the move list LIST. This updates
907 allocation cost using move execution frequency FREQ. */
909 emit_move_list (move_t list
, int freq
)
912 int to_regno
, from_regno
, cost
, regno
;
913 rtx_insn
*result
, *insn
;
916 enum reg_class aclass
;
920 for (; list
!= NULL
; list
= list
->next
)
923 to
= allocno_emit_reg (list
->to
);
924 to_regno
= REGNO (to
);
925 from
= allocno_emit_reg (list
->from
);
926 from_regno
= REGNO (from
);
927 emit_move_insn (to
, from
);
928 list
->insn
= get_insns ();
930 for (insn
= list
->insn
; insn
!= NULL_RTX
; insn
= NEXT_INSN (insn
))
932 /* The reload needs to have set up insn codes. If the
933 reload sets up insn codes by itself, it may fail because
934 insns will have hard registers instead of pseudos and
935 there may be no machine insn with given hard
937 recog_memoized (insn
);
938 /* Add insn to equiv init insn list if it is necessary.
939 Otherwise reload will not remove this insn if it decides
940 to use the equivalence. */
941 if ((set
= single_set (insn
)) != NULL_RTX
)
943 dest
= SET_DEST (set
);
944 if (GET_CODE (dest
) == SUBREG
)
945 dest
= SUBREG_REG (dest
);
946 ira_assert (REG_P (dest
));
947 regno
= REGNO (dest
);
948 if (regno
>= ira_reg_equiv_len
949 || (ira_reg_equiv
[regno
].invariant
== NULL_RTX
950 && ira_reg_equiv
[regno
].constant
== NULL_RTX
))
951 continue; /* regno has no equivalence. */
952 ira_assert ((int) reg_equivs
->length () > regno
);
953 reg_equiv_init (regno
)
954 = gen_rtx_INSN_LIST (VOIDmode
, insn
, reg_equiv_init (regno
));
958 ira_update_equiv_info_by_shuffle_insn (to_regno
, from_regno
, list
->insn
);
959 emit_insn (list
->insn
);
960 mode
= ALLOCNO_MODE (list
->to
);
961 aclass
= ALLOCNO_CLASS (list
->to
);
963 if (ALLOCNO_HARD_REGNO (list
->to
) < 0)
965 if (ALLOCNO_HARD_REGNO (list
->from
) >= 0)
967 cost
= ira_memory_move_cost
[mode
][aclass
][0] * freq
;
968 ira_store_cost
+= cost
;
971 else if (ALLOCNO_HARD_REGNO (list
->from
) < 0)
973 if (ALLOCNO_HARD_REGNO (list
->to
) >= 0)
975 cost
= ira_memory_move_cost
[mode
][aclass
][0] * freq
;
976 ira_load_cost
+= cost
;
981 ira_init_register_move_cost_if_necessary (mode
);
982 cost
= ira_register_move_cost
[mode
][aclass
][aclass
] * freq
;
983 ira_shuffle_cost
+= cost
;
985 ira_overall_cost
+= cost
;
987 result
= get_insns ();
992 /* Generate RTX move insns from move lists attached to basic blocks
1000 rtx_insn
*insns
, *tmp
;
1002 FOR_EACH_BB_FN (bb
, cfun
)
1004 if (at_bb_start
[bb
->index
] != NULL
)
1006 at_bb_start
[bb
->index
] = modify_move_list (at_bb_start
[bb
->index
]);
1007 insns
= emit_move_list (at_bb_start
[bb
->index
],
1008 REG_FREQ_FROM_BB (bb
));
1011 tmp
= NEXT_INSN (tmp
);
1012 if (NOTE_INSN_BASIC_BLOCK_P (tmp
))
1013 tmp
= NEXT_INSN (tmp
);
1014 if (tmp
== BB_HEAD (bb
))
1015 emit_insn_before (insns
, tmp
);
1016 else if (tmp
!= NULL_RTX
)
1017 emit_insn_after (insns
, PREV_INSN (tmp
));
1019 emit_insn_after (insns
, get_last_insn ());
1022 if (at_bb_end
[bb
->index
] != NULL
)
1024 at_bb_end
[bb
->index
] = modify_move_list (at_bb_end
[bb
->index
]);
1025 insns
= emit_move_list (at_bb_end
[bb
->index
], REG_FREQ_FROM_BB (bb
));
1026 ira_assert (! control_flow_insn_p (BB_END (bb
)));
1027 emit_insn_after (insns
, BB_END (bb
));
1030 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
1034 ira_assert ((e
->flags
& EDGE_ABNORMAL
) == 0
1035 || ! EDGE_CRITICAL_P (e
));
1036 e
->aux
= modify_move_list ((move_t
) e
->aux
);
1038 (emit_move_list ((move_t
) e
->aux
,
1039 REG_FREQ_FROM_EDGE_FREQ (EDGE_FREQUENCY (e
))),
1041 if (e
->src
->next_bb
!= e
->dest
)
1042 ira_additional_jumps_num
++;
1047 /* Update costs of A and corresponding allocnos on upper levels on the
1048 loop tree from reading (if READ_P) or writing A on an execution
1051 update_costs (ira_allocno_t a
, bool read_p
, int freq
)
1053 ira_loop_tree_node_t parent
;
1057 ALLOCNO_NREFS (a
)++;
1058 ALLOCNO_FREQ (a
) += freq
;
1059 ALLOCNO_MEMORY_COST (a
)
1060 += (ira_memory_move_cost
[ALLOCNO_MODE (a
)][ALLOCNO_CLASS (a
)]
1061 [read_p
? 1 : 0] * freq
);
1062 if (ALLOCNO_CAP (a
) != NULL
)
1063 a
= ALLOCNO_CAP (a
);
1064 else if ((parent
= ALLOCNO_LOOP_TREE_NODE (a
)->parent
) == NULL
1065 || (a
= parent
->regno_allocno_map
[ALLOCNO_REGNO (a
)]) == NULL
)
1070 /* Process moves from LIST with execution FREQ to add ranges, copies,
1071 and modify costs for allocnos involved in the moves. All regnos
1072 living through the list is in LIVE_THROUGH, and the loop tree node
1073 used to find corresponding allocnos is NODE. */
1075 add_range_and_copies_from_move_list (move_t list
, ira_loop_tree_node_t node
,
1076 bitmap live_through
, int freq
)
1085 HARD_REG_SET hard_regs_live
;
1090 EXECUTE_IF_SET_IN_BITMAP (live_through
, FIRST_PSEUDO_REGISTER
, regno
, bi
)
1092 REG_SET_TO_HARD_REG_SET (hard_regs_live
, live_through
);
1093 /* This is a trick to guarantee that new ranges is not merged with
1096 start
= ira_max_point
;
1097 for (move
= list
; move
!= NULL
; move
= move
->next
)
1099 ira_allocno_t from
= move
->from
;
1100 ira_allocno_t to
= move
->to
;
1103 bitmap_clear_bit (live_through
, ALLOCNO_REGNO (from
));
1104 bitmap_clear_bit (live_through
, ALLOCNO_REGNO (to
));
1106 nr
= ALLOCNO_NUM_OBJECTS (to
);
1107 for (i
= 0; i
< nr
; i
++)
1109 ira_object_t to_obj
= ALLOCNO_OBJECT (to
, i
);
1110 if (OBJECT_CONFLICT_ARRAY (to_obj
) == NULL
)
1112 if (internal_flag_ira_verbose
> 2 && ira_dump_file
!= NULL
)
1113 fprintf (ira_dump_file
, " Allocate conflicts for a%dr%d\n",
1114 ALLOCNO_NUM (to
), REGNO (allocno_emit_reg (to
)));
1115 ira_allocate_object_conflicts (to_obj
, n
);
1118 ior_hard_reg_conflicts (from
, &hard_regs_live
);
1119 ior_hard_reg_conflicts (to
, &hard_regs_live
);
1121 update_costs (from
, true, freq
);
1122 update_costs (to
, false, freq
);
1123 cp
= ira_add_allocno_copy (from
, to
, freq
, false, move
->insn
, NULL
);
1124 if (internal_flag_ira_verbose
> 2 && ira_dump_file
!= NULL
)
1125 fprintf (ira_dump_file
, " Adding cp%d:a%dr%d-a%dr%d\n",
1126 cp
->num
, ALLOCNO_NUM (cp
->first
),
1127 REGNO (allocno_emit_reg (cp
->first
)),
1128 ALLOCNO_NUM (cp
->second
),
1129 REGNO (allocno_emit_reg (cp
->second
)));
1131 nr
= ALLOCNO_NUM_OBJECTS (from
);
1132 for (i
= 0; i
< nr
; i
++)
1134 ira_object_t from_obj
= ALLOCNO_OBJECT (from
, i
);
1135 r
= OBJECT_LIVE_RANGES (from_obj
);
1136 if (r
== NULL
|| r
->finish
>= 0)
1138 ira_add_live_range_to_object (from_obj
, start
, ira_max_point
);
1139 if (internal_flag_ira_verbose
> 2 && ira_dump_file
!= NULL
)
1140 fprintf (ira_dump_file
,
1141 " Adding range [%d..%d] to allocno a%dr%d\n",
1142 start
, ira_max_point
, ALLOCNO_NUM (from
),
1143 REGNO (allocno_emit_reg (from
)));
1147 r
->finish
= ira_max_point
;
1148 if (internal_flag_ira_verbose
> 2 && ira_dump_file
!= NULL
)
1149 fprintf (ira_dump_file
,
1150 " Adding range [%d..%d] to allocno a%dr%d\n",
1151 r
->start
, ira_max_point
, ALLOCNO_NUM (from
),
1152 REGNO (allocno_emit_reg (from
)));
1156 nr
= ALLOCNO_NUM_OBJECTS (to
);
1157 for (i
= 0; i
< nr
; i
++)
1159 ira_object_t to_obj
= ALLOCNO_OBJECT (to
, i
);
1160 ira_add_live_range_to_object (to_obj
, ira_max_point
, -1);
1164 for (move
= list
; move
!= NULL
; move
= move
->next
)
1167 nr
= ALLOCNO_NUM_OBJECTS (move
->to
);
1168 for (i
= 0; i
< nr
; i
++)
1170 ira_object_t to_obj
= ALLOCNO_OBJECT (move
->to
, i
);
1171 r
= OBJECT_LIVE_RANGES (to_obj
);
1174 r
->finish
= ira_max_point
- 1;
1175 if (internal_flag_ira_verbose
> 2 && ira_dump_file
!= NULL
)
1176 fprintf (ira_dump_file
,
1177 " Adding range [%d..%d] to allocno a%dr%d\n",
1178 r
->start
, r
->finish
, ALLOCNO_NUM (move
->to
),
1179 REGNO (allocno_emit_reg (move
->to
)));
1183 EXECUTE_IF_SET_IN_BITMAP (live_through
, FIRST_PSEUDO_REGISTER
, regno
, bi
)
1188 a
= node
->regno_allocno_map
[regno
];
1189 if ((to
= ALLOCNO_EMIT_DATA (a
)->mem_optimized_dest
) != NULL
)
1191 nr
= ALLOCNO_NUM_OBJECTS (a
);
1192 for (i
= 0; i
< nr
; i
++)
1194 ira_object_t obj
= ALLOCNO_OBJECT (a
, i
);
1195 ira_add_live_range_to_object (obj
, start
, ira_max_point
- 1);
1197 if (internal_flag_ira_verbose
> 2 && ira_dump_file
!= NULL
)
1200 " Adding range [%d..%d] to live through %s allocno a%dr%d\n",
1201 start
, ira_max_point
- 1,
1202 to
!= NULL
? "upper level" : "",
1203 ALLOCNO_NUM (a
), REGNO (allocno_emit_reg (a
)));
1207 /* Process all move list to add ranges, conflicts, copies, and modify
1208 costs for allocnos involved in the moves. */
1210 add_ranges_and_copies (void)
1215 ira_loop_tree_node_t node
;
1216 bitmap live_through
;
1218 live_through
= ira_allocate_bitmap ();
1219 FOR_EACH_BB_FN (bb
, cfun
)
1221 /* It does not matter what loop_tree_node (of source or
1222 destination block) to use for searching allocnos by their
1223 regnos because of subsequent IR flattening. */
1224 node
= IRA_BB_NODE (bb
)->parent
;
1225 bitmap_copy (live_through
, df_get_live_in (bb
));
1226 add_range_and_copies_from_move_list
1227 (at_bb_start
[bb
->index
], node
, live_through
, REG_FREQ_FROM_BB (bb
));
1228 bitmap_copy (live_through
, df_get_live_out (bb
));
1229 add_range_and_copies_from_move_list
1230 (at_bb_end
[bb
->index
], node
, live_through
, REG_FREQ_FROM_BB (bb
));
1231 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
1233 bitmap_and (live_through
,
1234 df_get_live_in (e
->dest
), df_get_live_out (bb
));
1235 add_range_and_copies_from_move_list
1236 ((move_t
) e
->aux
, node
, live_through
,
1237 REG_FREQ_FROM_EDGE_FREQ (EDGE_FREQUENCY (e
)));
1240 ira_free_bitmap (live_through
);
1243 /* The entry function changes code and generates shuffling allocnos on
1244 region borders for the regional (LOOPS_P is TRUE in this case)
1245 register allocation. */
1247 ira_emit (bool loops_p
)
1254 ira_allocno_iterator ai
;
1257 FOR_EACH_ALLOCNO (a
, ai
)
1258 ALLOCNO_EMIT_DATA (a
)->reg
= regno_reg_rtx
[ALLOCNO_REGNO (a
)];
1261 sz
= sizeof (move_t
) * last_basic_block_for_fn (cfun
);
1262 at_bb_start
= (move_t
*) ira_allocate (sz
);
1263 memset (at_bb_start
, 0, sz
);
1264 at_bb_end
= (move_t
*) ira_allocate (sz
);
1265 memset (at_bb_end
, 0, sz
);
1266 local_allocno_bitmap
= ira_allocate_bitmap ();
1267 used_regno_bitmap
= ira_allocate_bitmap ();
1268 renamed_regno_bitmap
= ira_allocate_bitmap ();
1269 max_regno_before_changing
= max_reg_num ();
1270 ira_traverse_loop_tree (true, ira_loop_tree_root
, change_loop
, NULL
);
1271 set_allocno_somewhere_renamed_p ();
1272 ira_free_bitmap (used_regno_bitmap
);
1273 ira_free_bitmap (renamed_regno_bitmap
);
1274 ira_free_bitmap (local_allocno_bitmap
);
1275 setup_entered_from_non_parent_p ();
1276 FOR_EACH_BB_FN (bb
, cfun
)
1278 at_bb_start
[bb
->index
] = NULL
;
1279 at_bb_end
[bb
->index
] = NULL
;
1280 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
1281 if (e
->dest
!= EXIT_BLOCK_PTR_FOR_FN (cfun
))
1282 generate_edge_moves (e
);
1285 = (move_t
*) ira_allocate (sizeof (move_t
) * max_reg_num ());
1286 allocno_last_set_check
1287 = (int *) ira_allocate (sizeof (int) * max_reg_num ());
1288 memset (allocno_last_set_check
, 0, sizeof (int) * max_reg_num ());
1289 memset (hard_regno_last_set_check
, 0, sizeof (hard_regno_last_set_check
));
1291 FOR_EACH_BB_FN (bb
, cfun
)
1292 unify_moves (bb
, true);
1293 FOR_EACH_BB_FN (bb
, cfun
)
1294 unify_moves (bb
, false);
1295 move_vec
.create (ira_allocnos_num
);
1297 add_ranges_and_copies ();
1299 FOR_EACH_BB_FN (bb
, cfun
)
1301 free_move_list (at_bb_start
[bb
->index
]);
1302 free_move_list (at_bb_end
[bb
->index
]);
1303 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
1305 free_move_list ((move_t
) e
->aux
);
1309 move_vec
.release ();
1310 ira_free (allocno_last_set_check
);
1311 ira_free (allocno_last_set
);
1312 commit_edge_insertions ();
1313 /* Fix insn codes. It is necessary to do it before reload because
1314 reload assumes initial insn codes defined. The insn codes can be
1315 invalidated by CFG infrastructure for example in jump
1317 FOR_EACH_BB_FN (bb
, cfun
)
1318 FOR_BB_INSNS_REVERSE (bb
, insn
)
1320 recog_memoized (insn
);
1321 ira_free (at_bb_end
);
1322 ira_free (at_bb_start
);