1 /* Assign reload pseudos.
2 Copyright (C) 2010-2017 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
22 /* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
64 Only insns with changed allocation pseudos are processed on the
67 The pseudo live-ranges are used to find conflicting pseudos.
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
79 #include "coretypes.h"
88 #include "insn-config.h"
92 #include "rtl-error.h"
93 #include "sparseset.h"
98 /* Current iteration number of the pass and current iteration number
99 of the pass after the latest spill pass when any former reload
100 pseudo was spilled. */
101 int lra_assignment_iter
;
102 int lra_assignment_iter_after_spill
;
104 /* Flag of spilling former reload pseudos on this pass. */
105 static bool former_reload_pseudo_spill_p
;
107 /* Array containing corresponding values of function
108 lra_get_allocno_class. It is used to speed up the code. */
109 static enum reg_class
*regno_allocno_class_array
;
111 /* Array containing lengths of pseudo live ranges. It is used to
112 speed up the code. */
113 static int *regno_live_length
;
115 /* Information about the thread to which a pseudo belongs. Threads are
116 a set of connected reload and inheritance pseudos with the same set of
117 available hard registers. Lone registers belong to their own threads. */
118 struct regno_assign_info
120 /* First/next pseudo of the same thread. */
122 /* Frequency of the thread (execution frequency of only reload
123 pseudos in the thread when the thread contains a reload pseudo).
124 Defined only for the first thread pseudo. */
128 /* Map regno to the corresponding regno assignment info. */
129 static struct regno_assign_info
*regno_assign_info
;
131 /* All inherited, subreg or optional pseudos created before last spill
132 sub-pass. Such pseudos are permitted to get memory instead of hard
134 static bitmap_head non_reload_pseudos
;
136 /* Process a pseudo copy with execution frequency COPY_FREQ connecting
137 REGNO1 and REGNO2 to form threads. */
139 process_copy_to_form_thread (int regno1
, int regno2
, int copy_freq
)
141 int last
, regno1_first
, regno2_first
;
143 lra_assert (regno1
>= lra_constraint_new_regno_start
144 && regno2
>= lra_constraint_new_regno_start
);
145 regno1_first
= regno_assign_info
[regno1
].first
;
146 regno2_first
= regno_assign_info
[regno2
].first
;
147 if (regno1_first
!= regno2_first
)
149 for (last
= regno2_first
;
150 regno_assign_info
[last
].next
>= 0;
151 last
= regno_assign_info
[last
].next
)
152 regno_assign_info
[last
].first
= regno1_first
;
153 regno_assign_info
[last
].first
= regno1_first
;
154 regno_assign_info
[last
].next
= regno_assign_info
[regno1_first
].next
;
155 regno_assign_info
[regno1_first
].next
= regno2_first
;
156 regno_assign_info
[regno1_first
].freq
157 += regno_assign_info
[regno2_first
].freq
;
159 regno_assign_info
[regno1_first
].freq
-= 2 * copy_freq
;
160 lra_assert (regno_assign_info
[regno1_first
].freq
>= 0);
163 /* Initialize REGNO_ASSIGN_INFO and form threads. */
165 init_regno_assign_info (void)
167 int i
, regno1
, regno2
, max_regno
= max_reg_num ();
170 regno_assign_info
= XNEWVEC (struct regno_assign_info
, max_regno
);
171 for (i
= FIRST_PSEUDO_REGISTER
; i
< max_regno
; i
++)
173 regno_assign_info
[i
].first
= i
;
174 regno_assign_info
[i
].next
= -1;
175 regno_assign_info
[i
].freq
= lra_reg_info
[i
].freq
;
177 /* Form the threads. */
178 for (i
= 0; (cp
= lra_get_copy (i
)) != NULL
; i
++)
179 if ((regno1
= cp
->regno1
) >= lra_constraint_new_regno_start
180 && (regno2
= cp
->regno2
) >= lra_constraint_new_regno_start
181 && reg_renumber
[regno1
] < 0 && lra_reg_info
[regno1
].nrefs
!= 0
182 && reg_renumber
[regno2
] < 0 && lra_reg_info
[regno2
].nrefs
!= 0
183 && (ira_class_hard_regs_num
[regno_allocno_class_array
[regno1
]]
184 == ira_class_hard_regs_num
[regno_allocno_class_array
[regno2
]]))
185 process_copy_to_form_thread (regno1
, regno2
, cp
->freq
);
188 /* Free REGNO_ASSIGN_INFO. */
190 finish_regno_assign_info (void)
192 free (regno_assign_info
);
195 /* The function is used to sort *reload* and *inheritance* pseudos to
196 try to assign them hard registers. We put pseudos from the same
197 thread always nearby. */
199 reload_pseudo_compare_func (const void *v1p
, const void *v2p
)
201 int r1
= *(const int *) v1p
, r2
= *(const int *) v2p
;
202 enum reg_class cl1
= regno_allocno_class_array
[r1
];
203 enum reg_class cl2
= regno_allocno_class_array
[r2
];
206 lra_assert (r1
>= lra_constraint_new_regno_start
207 && r2
>= lra_constraint_new_regno_start
);
209 /* Prefer to assign reload registers with smaller classes first to
210 guarantee assignment to all reload registers. */
211 if ((diff
= (ira_class_hard_regs_num
[cl1
]
212 - ira_class_hard_regs_num
[cl2
])) != 0)
215 = (ira_reg_class_max_nregs
[cl2
][lra_reg_info
[r2
].biggest_mode
]
216 - ira_reg_class_max_nregs
[cl1
][lra_reg_info
[r1
].biggest_mode
])) != 0
217 /* The code below executes rarely as nregs == 1 in most cases.
218 So we should not worry about using faster data structures to
219 check reload pseudos. */
220 && ! bitmap_bit_p (&non_reload_pseudos
, r1
)
221 && ! bitmap_bit_p (&non_reload_pseudos
, r2
))
223 if ((diff
= (regno_assign_info
[regno_assign_info
[r2
].first
].freq
224 - regno_assign_info
[regno_assign_info
[r1
].first
].freq
)) != 0)
226 /* Allocate bigger pseudos first to avoid register file
229 = (ira_reg_class_max_nregs
[cl2
][lra_reg_info
[r2
].biggest_mode
]
230 - ira_reg_class_max_nregs
[cl1
][lra_reg_info
[r1
].biggest_mode
])) != 0)
232 /* Put pseudos from the thread nearby. */
233 if ((diff
= regno_assign_info
[r1
].first
- regno_assign_info
[r2
].first
) != 0)
235 /* Prefer pseudos with longer live ranges. It sets up better
236 prefered hard registers for the thread pseudos and decreases
237 register-register moves between the thread pseudos. */
238 if ((diff
= regno_live_length
[r2
] - regno_live_length
[r1
]) != 0)
240 /* If regs are equally good, sort by their numbers, so that the
241 results of qsort leave nothing to chance. */
245 /* The function is used to sort *non-reload* pseudos to try to assign
246 them hard registers. The order calculation is simpler than in the
247 previous function and based on the pseudo frequency usage. */
249 pseudo_compare_func (const void *v1p
, const void *v2p
)
251 int r1
= *(const int *) v1p
, r2
= *(const int *) v2p
;
254 /* Assign hard reg to static chain pointer first pseudo when
255 non-local goto is used. */
256 if (non_spilled_static_chain_regno_p (r1
))
258 else if (non_spilled_static_chain_regno_p (r2
))
261 /* Prefer to assign more frequently used registers first. */
262 if ((diff
= lra_reg_info
[r2
].freq
- lra_reg_info
[r1
].freq
) != 0)
265 /* If regs are equally good, sort by their numbers, so that the
266 results of qsort leave nothing to chance. */
270 /* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
271 pseudo live ranges with given start point. We insert only live
272 ranges of pseudos interesting for assignment purposes. They are
273 reload pseudos and pseudos assigned to hard registers. */
274 static lra_live_range_t
*start_point_ranges
;
276 /* Used as a flag that a live range is not inserted in the start point
278 static struct lra_live_range not_in_chain_mark
;
280 /* Create and set up START_POINT_RANGES. */
282 create_live_range_start_chains (void)
287 start_point_ranges
= XCNEWVEC (lra_live_range_t
, lra_live_max_point
);
288 max_regno
= max_reg_num ();
289 for (i
= FIRST_PSEUDO_REGISTER
; i
< max_regno
; i
++)
290 if (i
>= lra_constraint_new_regno_start
|| reg_renumber
[i
] >= 0)
292 for (r
= lra_reg_info
[i
].live_ranges
; r
!= NULL
; r
= r
->next
)
294 r
->start_next
= start_point_ranges
[r
->start
];
295 start_point_ranges
[r
->start
] = r
;
300 for (r
= lra_reg_info
[i
].live_ranges
; r
!= NULL
; r
= r
->next
)
301 r
->start_next
= ¬_in_chain_mark
;
305 /* Insert live ranges of pseudo REGNO into start chains if they are
308 insert_in_live_range_start_chain (int regno
)
310 lra_live_range_t r
= lra_reg_info
[regno
].live_ranges
;
312 if (r
->start_next
!= ¬_in_chain_mark
)
314 for (; r
!= NULL
; r
= r
->next
)
316 r
->start_next
= start_point_ranges
[r
->start
];
317 start_point_ranges
[r
->start
] = r
;
321 /* Free START_POINT_RANGES. */
323 finish_live_range_start_chains (void)
325 gcc_assert (start_point_ranges
!= NULL
);
326 free (start_point_ranges
);
327 start_point_ranges
= NULL
;
330 /* Map: program point -> bitmap of all pseudos living at the point and
331 assigned to hard registers. */
332 static bitmap_head
*live_hard_reg_pseudos
;
333 static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack
;
335 /* reg_renumber corresponding to pseudos marked in
336 live_hard_reg_pseudos. reg_renumber might be not matched to
337 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
338 live_hard_reg_pseudos. */
339 static int *live_pseudos_reg_renumber
;
341 /* Sparseset used to calculate living hard reg pseudos for some program
343 static sparseset live_range_hard_reg_pseudos
;
345 /* Sparseset used to calculate living reload/inheritance pseudos for
346 some program point range. */
347 static sparseset live_range_reload_inheritance_pseudos
;
349 /* Allocate and initialize the data about living pseudos at program
354 int i
, max_regno
= max_reg_num ();
356 live_range_hard_reg_pseudos
= sparseset_alloc (max_regno
);
357 live_range_reload_inheritance_pseudos
= sparseset_alloc (max_regno
);
358 live_hard_reg_pseudos
= XNEWVEC (bitmap_head
, lra_live_max_point
);
359 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack
);
360 for (i
= 0; i
< lra_live_max_point
; i
++)
361 bitmap_initialize (&live_hard_reg_pseudos
[i
],
362 &live_hard_reg_pseudos_bitmap_obstack
);
363 live_pseudos_reg_renumber
= XNEWVEC (int, max_regno
);
364 for (i
= 0; i
< max_regno
; i
++)
365 live_pseudos_reg_renumber
[i
] = -1;
368 /* Free the data about living pseudos at program points. */
372 sparseset_free (live_range_hard_reg_pseudos
);
373 sparseset_free (live_range_reload_inheritance_pseudos
);
374 free (live_hard_reg_pseudos
);
375 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack
);
376 free (live_pseudos_reg_renumber
);
379 /* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
380 entries for pseudo REGNO. Assume that the register has been
381 spilled if FREE_P, otherwise assume that it has been assigned
382 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
383 ranges in the start chains when it is assumed to be assigned to a
384 hard register because we use the chains of pseudos assigned to hard
385 registers during allocation. */
387 update_lives (int regno
, bool free_p
)
392 if (reg_renumber
[regno
] < 0)
394 live_pseudos_reg_renumber
[regno
] = free_p
? -1 : reg_renumber
[regno
];
395 for (r
= lra_reg_info
[regno
].live_ranges
; r
!= NULL
; r
= r
->next
)
397 for (p
= r
->start
; p
<= r
->finish
; p
++)
399 bitmap_clear_bit (&live_hard_reg_pseudos
[p
], regno
);
402 bitmap_set_bit (&live_hard_reg_pseudos
[p
], regno
);
403 insert_in_live_range_start_chain (regno
);
408 /* Sparseset used to calculate reload pseudos conflicting with a given
409 pseudo when we are trying to find a hard register for the given
411 static sparseset conflict_reload_and_inheritance_pseudos
;
413 /* Map: program point -> bitmap of all reload and inheritance pseudos
414 living at the point. */
415 static bitmap_head
*live_reload_and_inheritance_pseudos
;
416 static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack
;
418 /* Allocate and initialize data about living reload pseudos at any
419 given program point. */
421 init_live_reload_and_inheritance_pseudos (void)
423 int i
, p
, max_regno
= max_reg_num ();
426 conflict_reload_and_inheritance_pseudos
= sparseset_alloc (max_regno
);
427 live_reload_and_inheritance_pseudos
= XNEWVEC (bitmap_head
, lra_live_max_point
);
428 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack
);
429 for (p
= 0; p
< lra_live_max_point
; p
++)
430 bitmap_initialize (&live_reload_and_inheritance_pseudos
[p
],
431 &live_reload_and_inheritance_pseudos_bitmap_obstack
);
432 for (i
= lra_constraint_new_regno_start
; i
< max_regno
; i
++)
434 for (r
= lra_reg_info
[i
].live_ranges
; r
!= NULL
; r
= r
->next
)
435 for (p
= r
->start
; p
<= r
->finish
; p
++)
436 bitmap_set_bit (&live_reload_and_inheritance_pseudos
[p
], i
);
440 /* Finalize data about living reload pseudos at any given program
443 finish_live_reload_and_inheritance_pseudos (void)
445 sparseset_free (conflict_reload_and_inheritance_pseudos
);
446 free (live_reload_and_inheritance_pseudos
);
447 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack
);
450 /* The value used to check that cost of given hard reg is really
451 defined currently. */
452 static int curr_hard_regno_costs_check
= 0;
453 /* Array used to check that cost of the corresponding hard reg (the
454 array element index) is really defined currently. */
455 static int hard_regno_costs_check
[FIRST_PSEUDO_REGISTER
];
456 /* The current costs of allocation of hard regs. Defined only if the
457 value of the corresponding element of the previous array is equal to
458 CURR_HARD_REGNO_COSTS_CHECK. */
459 static int hard_regno_costs
[FIRST_PSEUDO_REGISTER
];
461 /* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
464 adjust_hard_regno_cost (int hard_regno
, int incr
)
466 if (hard_regno_costs_check
[hard_regno
] != curr_hard_regno_costs_check
)
467 hard_regno_costs
[hard_regno
] = 0;
468 hard_regno_costs_check
[hard_regno
] = curr_hard_regno_costs_check
;
469 hard_regno_costs
[hard_regno
] += incr
;
472 /* Try to find a free hard register for pseudo REGNO. Return the
473 hard register on success and set *COST to the cost of using
474 that register. (If several registers have equal cost, the one with
475 the highest priority wins.) Return -1 on failure.
477 If FIRST_P, return the first available hard reg ignoring other
478 criteria, e.g. allocation cost. This approach results in less hard
479 reg pool fragmentation and permit to allocate hard regs to reload
480 pseudos in complicated situations where pseudo sizes are different.
482 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
483 otherwise consider all hard registers in REGNO's class.
485 If REGNO_SET is not empty, only hard registers from the set are
488 find_hard_regno_for_1 (int regno
, int *cost
, int try_only_hard_regno
,
489 bool first_p
, HARD_REG_SET regno_set
)
491 HARD_REG_SET conflict_set
;
492 int best_cost
= INT_MAX
, best_priority
= INT_MIN
, best_usage
= INT_MAX
;
494 int p
, i
, j
, rclass_size
, best_hard_regno
, priority
, hard_regno
;
495 int hr
, conflict_hr
, nregs
;
496 machine_mode biggest_mode
;
497 unsigned int k
, conflict_regno
;
498 int offset
, val
, biggest_nregs
, nregs_diff
;
499 enum reg_class rclass
;
501 bool *rclass_intersect_p
;
502 HARD_REG_SET impossible_start_hard_regs
, available_regs
;
504 if (hard_reg_set_empty_p (regno_set
))
505 COPY_HARD_REG_SET (conflict_set
, lra_no_alloc_regs
);
508 COMPL_HARD_REG_SET (conflict_set
, regno_set
);
509 IOR_HARD_REG_SET (conflict_set
, lra_no_alloc_regs
);
511 rclass
= regno_allocno_class_array
[regno
];
512 rclass_intersect_p
= ira_reg_classes_intersect_p
[rclass
];
513 curr_hard_regno_costs_check
++;
514 sparseset_clear (conflict_reload_and_inheritance_pseudos
);
515 sparseset_clear (live_range_hard_reg_pseudos
);
516 IOR_HARD_REG_SET (conflict_set
, lra_reg_info
[regno
].conflict_hard_regs
);
517 biggest_mode
= lra_reg_info
[regno
].biggest_mode
;
518 for (r
= lra_reg_info
[regno
].live_ranges
; r
!= NULL
; r
= r
->next
)
520 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos
[r
->start
], 0, k
, bi
)
521 if (rclass_intersect_p
[regno_allocno_class_array
[k
]])
522 sparseset_set_bit (live_range_hard_reg_pseudos
, k
);
523 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos
[r
->start
],
525 if (lra_reg_info
[k
].preferred_hard_regno1
>= 0
526 && live_pseudos_reg_renumber
[k
] < 0
527 && rclass_intersect_p
[regno_allocno_class_array
[k
]])
528 sparseset_set_bit (conflict_reload_and_inheritance_pseudos
, k
);
529 for (p
= r
->start
+ 1; p
<= r
->finish
; p
++)
533 for (r2
= start_point_ranges
[p
];
537 if (r2
->regno
>= lra_constraint_new_regno_start
538 && lra_reg_info
[r2
->regno
].preferred_hard_regno1
>= 0
539 && live_pseudos_reg_renumber
[r2
->regno
] < 0
540 && rclass_intersect_p
[regno_allocno_class_array
[r2
->regno
]])
541 sparseset_set_bit (conflict_reload_and_inheritance_pseudos
,
543 if (live_pseudos_reg_renumber
[r2
->regno
] >= 0
544 && rclass_intersect_p
[regno_allocno_class_array
[r2
->regno
]])
545 sparseset_set_bit (live_range_hard_reg_pseudos
, r2
->regno
);
549 if ((hard_regno
= lra_reg_info
[regno
].preferred_hard_regno1
) >= 0)
551 adjust_hard_regno_cost
552 (hard_regno
, -lra_reg_info
[regno
].preferred_hard_regno_profit1
);
553 if ((hard_regno
= lra_reg_info
[regno
].preferred_hard_regno2
) >= 0)
554 adjust_hard_regno_cost
555 (hard_regno
, -lra_reg_info
[regno
].preferred_hard_regno_profit2
);
558 if (lra_reg_info
[regno
].no_stack_p
)
559 for (i
= FIRST_STACK_REG
; i
<= LAST_STACK_REG
; i
++)
560 SET_HARD_REG_BIT (conflict_set
, i
);
562 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos
, regno
);
563 val
= lra_reg_info
[regno
].val
;
564 offset
= lra_reg_info
[regno
].offset
;
565 CLEAR_HARD_REG_SET (impossible_start_hard_regs
);
566 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos
, conflict_regno
)
568 conflict_hr
= live_pseudos_reg_renumber
[conflict_regno
];
569 if (lra_reg_val_equal_p (conflict_regno
, val
, offset
))
571 conflict_hr
= live_pseudos_reg_renumber
[conflict_regno
];
572 nregs
= (hard_regno_nregs
[conflict_hr
]
573 [lra_reg_info
[conflict_regno
].biggest_mode
]);
574 /* Remember about multi-register pseudos. For example, 2
575 hard register pseudos can start on the same hard register
576 but can not start on HR and HR+1/HR-1. */
577 for (hr
= conflict_hr
+ 1;
578 hr
< FIRST_PSEUDO_REGISTER
&& hr
< conflict_hr
+ nregs
;
580 SET_HARD_REG_BIT (impossible_start_hard_regs
, hr
);
581 for (hr
= conflict_hr
- 1;
582 hr
>= 0 && hr
+ hard_regno_nregs
[hr
][biggest_mode
] > conflict_hr
;
584 SET_HARD_REG_BIT (impossible_start_hard_regs
, hr
);
588 enum machine_mode biggest_conflict_mode
589 = lra_reg_info
[conflict_regno
].biggest_mode
;
590 int biggest_conflict_nregs
591 = hard_regno_nregs
[conflict_hr
][biggest_conflict_mode
];
593 nregs_diff
= (biggest_conflict_nregs
596 [PSEUDO_REGNO_MODE (conflict_regno
)]));
597 add_to_hard_reg_set (&conflict_set
,
598 biggest_conflict_mode
,
600 - (WORDS_BIG_ENDIAN
? nregs_diff
: 0));
601 if (hard_reg_set_subset_p (reg_class_contents
[rclass
],
606 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos
,
608 if (!lra_reg_val_equal_p (conflict_regno
, val
, offset
))
610 lra_assert (live_pseudos_reg_renumber
[conflict_regno
] < 0);
612 = lra_reg_info
[conflict_regno
].preferred_hard_regno1
) >= 0)
614 adjust_hard_regno_cost
616 lra_reg_info
[conflict_regno
].preferred_hard_regno_profit1
);
618 = lra_reg_info
[conflict_regno
].preferred_hard_regno2
) >= 0)
619 adjust_hard_regno_cost
621 lra_reg_info
[conflict_regno
].preferred_hard_regno_profit2
);
624 /* Make sure that all registers in a multi-word pseudo belong to the
626 IOR_COMPL_HARD_REG_SET (conflict_set
, reg_class_contents
[rclass
]);
627 lra_assert (rclass
!= NO_REGS
);
628 rclass_size
= ira_class_hard_regs_num
[rclass
];
629 best_hard_regno
= -1;
630 hard_regno
= ira_class_hard_regs
[rclass
][0];
631 biggest_nregs
= hard_regno_nregs
[hard_regno
][biggest_mode
];
632 nregs_diff
= (biggest_nregs
633 - hard_regno_nregs
[hard_regno
][PSEUDO_REGNO_MODE (regno
)]);
634 COPY_HARD_REG_SET (available_regs
, reg_class_contents
[rclass
]);
635 AND_COMPL_HARD_REG_SET (available_regs
, lra_no_alloc_regs
);
636 for (i
= 0; i
< rclass_size
; i
++)
638 if (try_only_hard_regno
>= 0)
639 hard_regno
= try_only_hard_regno
;
641 hard_regno
= ira_class_hard_regs
[rclass
][i
];
642 if (! overlaps_hard_reg_set_p (conflict_set
,
643 PSEUDO_REGNO_MODE (regno
), hard_regno
)
644 && HARD_REGNO_MODE_OK (hard_regno
, PSEUDO_REGNO_MODE (regno
))
645 /* We can not use prohibited_class_mode_regs for all classes
646 because it is not defined for all classes. */
647 && (ira_allocno_class_translate
[rclass
] != rclass
648 || ! TEST_HARD_REG_BIT (ira_prohibited_class_mode_regs
649 [rclass
][PSEUDO_REGNO_MODE (regno
)],
651 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs
, hard_regno
)
654 ? (hard_regno
- nregs_diff
>= 0
655 && TEST_HARD_REG_BIT (available_regs
,
656 hard_regno
- nregs_diff
))
657 : TEST_HARD_REG_BIT (available_regs
,
658 hard_regno
+ nregs_diff
))))
660 if (hard_regno_costs_check
[hard_regno
]
661 != curr_hard_regno_costs_check
)
663 hard_regno_costs_check
[hard_regno
] = curr_hard_regno_costs_check
;
664 hard_regno_costs
[hard_regno
] = 0;
667 j
< hard_regno_nregs
[hard_regno
][PSEUDO_REGNO_MODE (regno
)];
669 if (! TEST_HARD_REG_BIT (call_used_reg_set
, hard_regno
+ j
)
670 && ! df_regs_ever_live_p (hard_regno
+ j
))
671 /* It needs save restore. */
672 hard_regno_costs
[hard_regno
]
674 * REG_FREQ_FROM_BB (ENTRY_BLOCK_PTR_FOR_FN (cfun
)->next_bb
)
676 priority
= targetm
.register_priority (hard_regno
);
677 if (best_hard_regno
< 0 || hard_regno_costs
[hard_regno
] < best_cost
678 || (hard_regno_costs
[hard_regno
] == best_cost
679 && (priority
> best_priority
680 || (targetm
.register_usage_leveling_p ()
681 && priority
== best_priority
682 && best_usage
> lra_hard_reg_usage
[hard_regno
]))))
684 best_hard_regno
= hard_regno
;
685 best_cost
= hard_regno_costs
[hard_regno
];
686 best_priority
= priority
;
687 best_usage
= lra_hard_reg_usage
[hard_regno
];
690 if (try_only_hard_regno
>= 0 || (first_p
&& best_hard_regno
>= 0))
693 if (best_hard_regno
>= 0)
694 *cost
= best_cost
- lra_reg_info
[regno
].freq
;
695 return best_hard_regno
;
698 /* A wrapper for find_hard_regno_for_1 (see comments for that function
699 description). This function tries to find a hard register for
700 preferred class first if it is worth. */
702 find_hard_regno_for (int regno
, int *cost
, int try_only_hard_regno
, bool first_p
)
705 HARD_REG_SET regno_set
;
707 /* Only original pseudos can have a different preferred class. */
708 if (try_only_hard_regno
< 0 && regno
< lra_new_regno_start
)
710 enum reg_class pref_class
= reg_preferred_class (regno
);
712 if (regno_allocno_class_array
[regno
] != pref_class
)
714 hard_regno
= find_hard_regno_for_1 (regno
, cost
, -1, first_p
,
715 reg_class_contents
[pref_class
]);
720 CLEAR_HARD_REG_SET (regno_set
);
721 return find_hard_regno_for_1 (regno
, cost
, try_only_hard_regno
, first_p
,
725 /* Current value used for checking elements in
726 update_hard_regno_preference_check. */
727 static int curr_update_hard_regno_preference_check
;
728 /* If an element value is equal to the above variable value, then the
729 corresponding regno has been processed for preference
731 static int *update_hard_regno_preference_check
;
733 /* Update the preference for using HARD_REGNO for pseudos that are
734 connected directly or indirectly with REGNO. Apply divisor DIV
735 to any preference adjustments.
737 The more indirectly a pseudo is connected, the smaller its effect
738 should be. We therefore increase DIV on each "hop". */
740 update_hard_regno_preference (int regno
, int hard_regno
, int div
)
742 int another_regno
, cost
;
743 lra_copy_t cp
, next_cp
;
745 /* Search depth 5 seems to be enough. */
748 for (cp
= lra_reg_info
[regno
].copies
; cp
!= NULL
; cp
= next_cp
)
750 if (cp
->regno1
== regno
)
752 next_cp
= cp
->regno1_next
;
753 another_regno
= cp
->regno2
;
755 else if (cp
->regno2
== regno
)
757 next_cp
= cp
->regno2_next
;
758 another_regno
= cp
->regno1
;
762 if (reg_renumber
[another_regno
] < 0
763 && (update_hard_regno_preference_check
[another_regno
]
764 != curr_update_hard_regno_preference_check
))
766 update_hard_regno_preference_check
[another_regno
]
767 = curr_update_hard_regno_preference_check
;
768 cost
= cp
->freq
< div
? 1 : cp
->freq
/ div
;
769 lra_setup_reload_pseudo_preferenced_hard_reg
770 (another_regno
, hard_regno
, cost
);
771 update_hard_regno_preference (another_regno
, hard_regno
, div
* 2);
776 /* Return prefix title for pseudo REGNO. */
778 pseudo_prefix_title (int regno
)
781 (regno
< lra_constraint_new_regno_start
? ""
782 : bitmap_bit_p (&lra_inheritance_pseudos
, regno
) ? "inheritance "
783 : bitmap_bit_p (&lra_split_regs
, regno
) ? "split "
784 : bitmap_bit_p (&lra_optional_reload_pseudos
, regno
) ? "optional reload "
785 : bitmap_bit_p (&lra_subreg_reload_pseudos
, regno
) ? "subreg reload "
789 /* Update REG_RENUMBER and other pseudo preferences by assignment of
790 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
792 lra_setup_reg_renumber (int regno
, int hard_regno
, bool print_p
)
796 /* We can not just reassign hard register. */
797 lra_assert (hard_regno
< 0 || reg_renumber
[regno
] < 0);
798 if ((hr
= hard_regno
) < 0)
799 hr
= reg_renumber
[regno
];
800 reg_renumber
[regno
] = hard_regno
;
801 lra_assert (hr
>= 0);
802 for (i
= 0; i
< hard_regno_nregs
[hr
][PSEUDO_REGNO_MODE (regno
)]; i
++)
804 lra_hard_reg_usage
[hr
+ i
] -= lra_reg_info
[regno
].freq
;
806 lra_hard_reg_usage
[hr
+ i
] += lra_reg_info
[regno
].freq
;
807 if (print_p
&& lra_dump_file
!= NULL
)
808 fprintf (lra_dump_file
, " Assign %d to %sr%d (freq=%d)\n",
809 reg_renumber
[regno
], pseudo_prefix_title (regno
),
810 regno
, lra_reg_info
[regno
].freq
);
813 curr_update_hard_regno_preference_check
++;
814 update_hard_regno_preference (regno
, hard_regno
, 1);
818 /* Pseudos which occur in insns containing a particular pseudo. */
819 static bitmap_head insn_conflict_pseudos
;
821 /* Bitmaps used to contain spill pseudos for given pseudo hard regno
822 and best spill pseudos for given pseudo (and best hard regno). */
823 static bitmap_head spill_pseudos_bitmap
, best_spill_pseudos_bitmap
;
825 /* Current pseudo check for validity of elements in
826 TRY_HARD_REG_PSEUDOS. */
827 static int curr_pseudo_check
;
828 /* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
829 static int try_hard_reg_pseudos_check
[FIRST_PSEUDO_REGISTER
];
830 /* Pseudos who hold given hard register at the considered points. */
831 static bitmap_head try_hard_reg_pseudos
[FIRST_PSEUDO_REGISTER
];
833 /* Set up try_hard_reg_pseudos for given program point P and class
834 RCLASS. Those are pseudos living at P and assigned to a hard
835 register of RCLASS. In other words, those are pseudos which can be
836 spilled to assign a hard register of RCLASS to a pseudo living at
839 setup_try_hard_regno_pseudos (int p
, enum reg_class rclass
)
843 unsigned int spill_regno
;
846 /* Find what pseudos could be spilled. */
847 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos
[p
], 0, spill_regno
, bi
)
849 mode
= PSEUDO_REGNO_MODE (spill_regno
);
850 hard_regno
= live_pseudos_reg_renumber
[spill_regno
];
851 if (overlaps_hard_reg_set_p (reg_class_contents
[rclass
],
854 for (i
= hard_regno_nregs
[hard_regno
][mode
] - 1; i
>= 0; i
--)
856 if (try_hard_reg_pseudos_check
[hard_regno
+ i
]
857 != curr_pseudo_check
)
859 try_hard_reg_pseudos_check
[hard_regno
+ i
]
861 bitmap_clear (&try_hard_reg_pseudos
[hard_regno
+ i
]);
863 bitmap_set_bit (&try_hard_reg_pseudos
[hard_regno
+ i
],
870 /* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
871 assignment means that we might undo the data change. */
873 assign_temporarily (int regno
, int hard_regno
)
878 for (r
= lra_reg_info
[regno
].live_ranges
; r
!= NULL
; r
= r
->next
)
880 for (p
= r
->start
; p
<= r
->finish
; p
++)
882 bitmap_clear_bit (&live_hard_reg_pseudos
[p
], regno
);
885 bitmap_set_bit (&live_hard_reg_pseudos
[p
], regno
);
886 insert_in_live_range_start_chain (regno
);
889 live_pseudos_reg_renumber
[regno
] = hard_regno
;
892 /* Return true iff there is a reason why pseudo SPILL_REGNO should not
895 must_not_spill_p (unsigned spill_regno
)
897 if ((pic_offset_table_rtx
!= NULL
898 && spill_regno
== REGNO (pic_offset_table_rtx
))
899 || ((int) spill_regno
>= lra_constraint_new_regno_start
900 && ! bitmap_bit_p (&lra_inheritance_pseudos
, spill_regno
)
901 && ! bitmap_bit_p (&lra_split_regs
, spill_regno
)
902 && ! bitmap_bit_p (&lra_subreg_reload_pseudos
, spill_regno
)
903 && ! bitmap_bit_p (&lra_optional_reload_pseudos
, spill_regno
)))
905 /* A reload pseudo that requires a singleton register class should
907 FIXME: this mitigates the issue on certain i386 patterns, but
908 does not solve the general case where existing reloads fully
909 cover a limited register class. */
910 if (!bitmap_bit_p (&non_reload_pseudos
, spill_regno
)
911 && reg_class_size
[reg_preferred_class (spill_regno
)] == 1)
916 /* Array used for sorting reload pseudos for subsequent allocation
917 after spilling some pseudo. */
918 static int *sorted_reload_pseudos
;
920 /* Spill some pseudos for a reload pseudo REGNO and return hard
921 register which should be used for pseudo after spilling. The
922 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
923 choose hard register (and pseudos occupying the hard registers and
924 to be spilled), we take into account not only how REGNO will
925 benefit from the spills but also how other reload pseudos not yet
926 assigned to hard registers benefit from the spills too. In very
927 rare cases, the function can fail and return -1.
929 If FIRST_P, return the first available hard reg ignoring other
930 criteria, e.g. allocation cost and cost of spilling non-reload
931 pseudos. This approach results in less hard reg pool fragmentation
932 and permit to allocate hard regs to reload pseudos in complicated
933 situations where pseudo sizes are different. */
935 spill_for (int regno
, bitmap spilled_pseudo_bitmap
, bool first_p
)
937 int i
, j
, n
, p
, hard_regno
, best_hard_regno
, cost
, best_cost
, rclass_size
;
938 int reload_hard_regno
, reload_cost
;
939 bool static_p
, best_static_p
;
941 enum reg_class rclass
;
942 unsigned int spill_regno
, reload_regno
, uid
;
943 int insn_pseudos_num
, best_insn_pseudos_num
;
944 int bad_spills_num
, smallest_bad_spills_num
;
948 rclass
= regno_allocno_class_array
[regno
];
949 lra_assert (reg_renumber
[regno
] < 0 && rclass
!= NO_REGS
);
950 bitmap_clear (&insn_conflict_pseudos
);
951 bitmap_clear (&best_spill_pseudos_bitmap
);
952 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info
[regno
].insn_bitmap
, 0, uid
, bi
)
954 struct lra_insn_reg
*ir
;
956 for (ir
= lra_get_insn_regs (uid
); ir
!= NULL
; ir
= ir
->next
)
957 if (ir
->regno
>= FIRST_PSEUDO_REGISTER
)
958 bitmap_set_bit (&insn_conflict_pseudos
, ir
->regno
);
960 best_hard_regno
= -1;
962 best_static_p
= TRUE
;
963 best_insn_pseudos_num
= INT_MAX
;
964 smallest_bad_spills_num
= INT_MAX
;
965 rclass_size
= ira_class_hard_regs_num
[rclass
];
966 mode
= PSEUDO_REGNO_MODE (regno
);
967 /* Invalidate try_hard_reg_pseudos elements. */
969 for (r
= lra_reg_info
[regno
].live_ranges
; r
!= NULL
; r
= r
->next
)
970 for (p
= r
->start
; p
<= r
->finish
; p
++)
971 setup_try_hard_regno_pseudos (p
, rclass
);
972 for (i
= 0; i
< rclass_size
; i
++)
974 hard_regno
= ira_class_hard_regs
[rclass
][i
];
975 bitmap_clear (&spill_pseudos_bitmap
);
976 for (j
= hard_regno_nregs
[hard_regno
][mode
] - 1; j
>= 0; j
--)
978 if (try_hard_reg_pseudos_check
[hard_regno
+ j
] != curr_pseudo_check
)
980 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos
[hard_regno
+ j
]));
981 bitmap_ior_into (&spill_pseudos_bitmap
,
982 &try_hard_reg_pseudos
[hard_regno
+ j
]);
986 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap
, 0, spill_regno
, bi
)
987 if (must_not_spill_p (spill_regno
))
989 else if (non_spilled_static_chain_regno_p (spill_regno
))
991 insn_pseudos_num
= 0;
993 if (lra_dump_file
!= NULL
)
994 fprintf (lra_dump_file
, " Trying %d:", hard_regno
);
995 sparseset_clear (live_range_reload_inheritance_pseudos
);
996 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap
, 0, spill_regno
, bi
)
998 if (bitmap_bit_p (&insn_conflict_pseudos
, spill_regno
))
1000 if (spill_regno
>= (unsigned int) lra_bad_spill_regno_start
)
1002 for (r
= lra_reg_info
[spill_regno
].live_ranges
;
1006 for (p
= r
->start
; p
<= r
->finish
; p
++)
1008 lra_live_range_t r2
;
1010 for (r2
= start_point_ranges
[p
];
1012 r2
= r2
->start_next
)
1013 if (r2
->regno
>= lra_constraint_new_regno_start
)
1014 sparseset_set_bit (live_range_reload_inheritance_pseudos
,
1020 if (sparseset_cardinality (live_range_reload_inheritance_pseudos
)
1021 <= (unsigned)LRA_MAX_CONSIDERED_RELOAD_PSEUDOS
)
1022 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos
,
1024 if ((int) reload_regno
!= regno
1025 && (ira_reg_classes_intersect_p
1026 [rclass
][regno_allocno_class_array
[reload_regno
]])
1027 && live_pseudos_reg_renumber
[reload_regno
] < 0
1028 && find_hard_regno_for (reload_regno
, &cost
, -1, first_p
) < 0)
1029 sorted_reload_pseudos
[n
++] = reload_regno
;
1030 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap
, 0, spill_regno
, bi
)
1032 update_lives (spill_regno
, true);
1033 if (lra_dump_file
!= NULL
)
1034 fprintf (lra_dump_file
, " spill %d(freq=%d)",
1035 spill_regno
, lra_reg_info
[spill_regno
].freq
);
1037 hard_regno
= find_hard_regno_for (regno
, &cost
, -1, first_p
);
1038 if (hard_regno
>= 0)
1040 assign_temporarily (regno
, hard_regno
);
1041 qsort (sorted_reload_pseudos
, n
, sizeof (int),
1042 reload_pseudo_compare_func
);
1043 for (j
= 0; j
< n
; j
++)
1045 reload_regno
= sorted_reload_pseudos
[j
];
1046 lra_assert (live_pseudos_reg_renumber
[reload_regno
] < 0);
1047 if ((reload_hard_regno
1048 = find_hard_regno_for (reload_regno
,
1049 &reload_cost
, -1, first_p
)) >= 0)
1051 if (lra_dump_file
!= NULL
)
1052 fprintf (lra_dump_file
, " assign %d(cost=%d)",
1053 reload_regno
, reload_cost
);
1054 assign_temporarily (reload_regno
, reload_hard_regno
);
1055 cost
+= reload_cost
;
1058 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap
, 0, spill_regno
, bi
)
1062 cost
+= lra_reg_info
[spill_regno
].freq
;
1063 if (ira_reg_equiv
[spill_regno
].memory
!= NULL
1064 || ira_reg_equiv
[spill_regno
].constant
!= NULL
)
1065 for (x
= ira_reg_equiv
[spill_regno
].init_insns
;
1068 cost
-= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (x
->insn ()));
1070 /* Avoid spilling static chain pointer pseudo when non-local
1072 if ((! static_p
&& best_static_p
)
1073 || (static_p
== best_static_p
1074 && (best_insn_pseudos_num
> insn_pseudos_num
1075 || (best_insn_pseudos_num
== insn_pseudos_num
1076 && (bad_spills_num
< smallest_bad_spills_num
1077 || (bad_spills_num
== smallest_bad_spills_num
1078 && best_cost
> cost
))))))
1080 best_insn_pseudos_num
= insn_pseudos_num
;
1081 smallest_bad_spills_num
= bad_spills_num
;
1082 best_static_p
= static_p
;
1084 best_hard_regno
= hard_regno
;
1085 bitmap_copy (&best_spill_pseudos_bitmap
, &spill_pseudos_bitmap
);
1086 if (lra_dump_file
!= NULL
)
1087 fprintf (lra_dump_file
,
1088 " Now best %d(cost=%d, bad_spills=%d, insn_pseudos=%d)\n",
1089 hard_regno
, cost
, bad_spills_num
, insn_pseudos_num
);
1091 assign_temporarily (regno
, -1);
1092 for (j
= 0; j
< n
; j
++)
1094 reload_regno
= sorted_reload_pseudos
[j
];
1095 if (live_pseudos_reg_renumber
[reload_regno
] >= 0)
1096 assign_temporarily (reload_regno
, -1);
1099 if (lra_dump_file
!= NULL
)
1100 fprintf (lra_dump_file
, "\n");
1101 /* Restore the live hard reg pseudo info for spilled pseudos. */
1102 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap
, 0, spill_regno
, bi
)
1103 update_lives (spill_regno
, false);
1108 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap
, 0, spill_regno
, bi
)
1110 if ((int) spill_regno
>= lra_constraint_new_regno_start
)
1111 former_reload_pseudo_spill_p
= true;
1112 if (lra_dump_file
!= NULL
)
1113 fprintf (lra_dump_file
, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
1114 pseudo_prefix_title (spill_regno
),
1115 spill_regno
, reg_renumber
[spill_regno
],
1116 lra_reg_info
[spill_regno
].freq
, regno
);
1117 update_lives (spill_regno
, true);
1118 lra_setup_reg_renumber (spill_regno
, -1, false);
1120 bitmap_ior_into (spilled_pseudo_bitmap
, &best_spill_pseudos_bitmap
);
1121 return best_hard_regno
;
1124 /* Assign HARD_REGNO to REGNO. */
1126 assign_hard_regno (int hard_regno
, int regno
)
1130 lra_assert (hard_regno
>= 0);
1131 lra_setup_reg_renumber (regno
, hard_regno
, true);
1132 update_lives (regno
, false);
1134 i
< hard_regno_nregs
[hard_regno
][lra_reg_info
[regno
].biggest_mode
];
1136 df_set_regs_ever_live (hard_regno
+ i
, true);
1139 /* Array used for sorting different pseudos. */
1140 static int *sorted_pseudos
;
1142 /* The constraints pass is allowed to create equivalences between
1143 pseudos that make the current allocation "incorrect" (in the sense
1144 that pseudos are assigned to hard registers from their own conflict
1145 sets). The global variable lra_risky_transformations_p says
1146 whether this might have happened.
1148 Process pseudos assigned to hard registers (less frequently used
1149 first), spill if a conflict is found, and mark the spilled pseudos
1150 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1151 pseudos, assigned to hard registers. */
1153 setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1154 spilled_pseudo_bitmap
)
1156 int p
, i
, j
, n
, regno
, hard_regno
;
1157 unsigned int k
, conflict_regno
;
1159 HARD_REG_SET conflict_set
;
1163 int max_regno
= max_reg_num ();
1165 if (! lra_risky_transformations_p
)
1167 for (i
= FIRST_PSEUDO_REGISTER
; i
< max_regno
; i
++)
1168 if (reg_renumber
[i
] >= 0 && lra_reg_info
[i
].nrefs
> 0)
1169 update_lives (i
, false);
1172 for (n
= 0, i
= FIRST_PSEUDO_REGISTER
; i
< max_regno
; i
++)
1173 if ((pic_offset_table_rtx
== NULL_RTX
1174 || i
!= (int) REGNO (pic_offset_table_rtx
))
1175 && reg_renumber
[i
] >= 0 && lra_reg_info
[i
].nrefs
> 0)
1176 sorted_pseudos
[n
++] = i
;
1177 qsort (sorted_pseudos
, n
, sizeof (int), pseudo_compare_func
);
1178 if (pic_offset_table_rtx
!= NULL_RTX
1179 && (regno
= REGNO (pic_offset_table_rtx
)) >= FIRST_PSEUDO_REGISTER
1180 && reg_renumber
[regno
] >= 0 && lra_reg_info
[regno
].nrefs
> 0)
1181 sorted_pseudos
[n
++] = regno
;
1182 for (i
= n
- 1; i
>= 0; i
--)
1184 regno
= sorted_pseudos
[i
];
1185 hard_regno
= reg_renumber
[regno
];
1186 lra_assert (hard_regno
>= 0);
1187 mode
= lra_reg_info
[regno
].biggest_mode
;
1188 sparseset_clear (live_range_hard_reg_pseudos
);
1189 for (r
= lra_reg_info
[regno
].live_ranges
; r
!= NULL
; r
= r
->next
)
1191 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos
[r
->start
], 0, k
, bi
)
1192 sparseset_set_bit (live_range_hard_reg_pseudos
, k
);
1193 for (p
= r
->start
+ 1; p
<= r
->finish
; p
++)
1195 lra_live_range_t r2
;
1197 for (r2
= start_point_ranges
[p
];
1199 r2
= r2
->start_next
)
1200 if (live_pseudos_reg_renumber
[r2
->regno
] >= 0)
1201 sparseset_set_bit (live_range_hard_reg_pseudos
, r2
->regno
);
1204 COPY_HARD_REG_SET (conflict_set
, lra_no_alloc_regs
);
1205 IOR_HARD_REG_SET (conflict_set
, lra_reg_info
[regno
].conflict_hard_regs
);
1206 val
= lra_reg_info
[regno
].val
;
1207 offset
= lra_reg_info
[regno
].offset
;
1208 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos
, conflict_regno
)
1209 if (!lra_reg_val_equal_p (conflict_regno
, val
, offset
)
1210 /* If it is multi-register pseudos they should start on
1211 the same hard register. */
1212 || hard_regno
!= reg_renumber
[conflict_regno
])
1214 int conflict_hard_regno
= reg_renumber
[conflict_regno
];
1215 machine_mode biggest_mode
= lra_reg_info
[conflict_regno
].biggest_mode
;
1216 int biggest_nregs
= hard_regno_nregs
[conflict_hard_regno
][biggest_mode
];
1217 int nregs_diff
= (biggest_nregs
1219 [conflict_hard_regno
]
1220 [PSEUDO_REGNO_MODE (conflict_regno
)]));
1221 add_to_hard_reg_set (&conflict_set
,
1224 - (WORDS_BIG_ENDIAN
? nregs_diff
: 0));
1226 if (! overlaps_hard_reg_set_p (conflict_set
, mode
, hard_regno
))
1228 update_lives (regno
, false);
1231 bitmap_set_bit (spilled_pseudo_bitmap
, regno
);
1233 j
< hard_regno_nregs
[hard_regno
][PSEUDO_REGNO_MODE (regno
)];
1235 lra_hard_reg_usage
[hard_regno
+ j
] -= lra_reg_info
[regno
].freq
;
1236 reg_renumber
[regno
] = -1;
1237 if (regno
>= lra_constraint_new_regno_start
)
1238 former_reload_pseudo_spill_p
= true;
1239 if (lra_dump_file
!= NULL
)
1240 fprintf (lra_dump_file
, " Spill r%d after risky transformations\n",
1245 /* Improve allocation by assigning the same hard regno of inheritance
1246 pseudos to the connected pseudos. We need this because inheritance
1247 pseudos are allocated after reload pseudos in the thread and when
1248 we assign a hard register to a reload pseudo we don't know yet that
1249 the connected inheritance pseudos can get the same hard register.
1250 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1252 improve_inheritance (bitmap changed_pseudos
)
1255 int regno
, another_regno
, hard_regno
, another_hard_regno
, cost
, i
, n
;
1256 lra_copy_t cp
, next_cp
;
1259 if (lra_inheritance_iter
> LRA_MAX_INHERITANCE_PASSES
)
1262 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos
, 0, k
, bi
)
1263 if (reg_renumber
[k
] >= 0 && lra_reg_info
[k
].nrefs
!= 0)
1264 sorted_pseudos
[n
++] = k
;
1265 qsort (sorted_pseudos
, n
, sizeof (int), pseudo_compare_func
);
1266 for (i
= 0; i
< n
; i
++)
1268 regno
= sorted_pseudos
[i
];
1269 hard_regno
= reg_renumber
[regno
];
1270 lra_assert (hard_regno
>= 0);
1271 for (cp
= lra_reg_info
[regno
].copies
; cp
!= NULL
; cp
= next_cp
)
1273 if (cp
->regno1
== regno
)
1275 next_cp
= cp
->regno1_next
;
1276 another_regno
= cp
->regno2
;
1278 else if (cp
->regno2
== regno
)
1280 next_cp
= cp
->regno2_next
;
1281 another_regno
= cp
->regno1
;
1285 /* Don't change reload pseudo allocation. It might have
1286 this allocation for a purpose and changing it can result
1288 if ((another_regno
< lra_constraint_new_regno_start
1289 || bitmap_bit_p (&lra_inheritance_pseudos
, another_regno
))
1290 && (another_hard_regno
= reg_renumber
[another_regno
]) >= 0
1291 && another_hard_regno
!= hard_regno
)
1293 if (lra_dump_file
!= NULL
)
1296 " Improving inheritance for %d(%d) and %d(%d)...\n",
1297 regno
, hard_regno
, another_regno
, another_hard_regno
);
1298 update_lives (another_regno
, true);
1299 lra_setup_reg_renumber (another_regno
, -1, false);
1300 if (hard_regno
== find_hard_regno_for (another_regno
, &cost
,
1302 assign_hard_regno (hard_regno
, another_regno
);
1304 assign_hard_regno (another_hard_regno
, another_regno
);
1305 bitmap_set_bit (changed_pseudos
, another_regno
);
1312 /* Bitmap finally containing all pseudos spilled on this assignment
1314 static bitmap_head all_spilled_pseudos
;
1315 /* All pseudos whose allocation was changed. */
1316 static bitmap_head changed_pseudo_bitmap
;
1319 /* Add to LIVE_RANGE_HARD_REG_PSEUDOS all pseudos conflicting with
1320 REGNO and whose hard regs can be assigned to REGNO. */
1322 find_all_spills_for (int regno
)
1328 enum reg_class rclass
;
1329 bool *rclass_intersect_p
;
1331 rclass
= regno_allocno_class_array
[regno
];
1332 rclass_intersect_p
= ira_reg_classes_intersect_p
[rclass
];
1333 for (r
= lra_reg_info
[regno
].live_ranges
; r
!= NULL
; r
= r
->next
)
1335 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos
[r
->start
], 0, k
, bi
)
1336 if (rclass_intersect_p
[regno_allocno_class_array
[k
]])
1337 sparseset_set_bit (live_range_hard_reg_pseudos
, k
);
1338 for (p
= r
->start
+ 1; p
<= r
->finish
; p
++)
1340 lra_live_range_t r2
;
1342 for (r2
= start_point_ranges
[p
];
1344 r2
= r2
->start_next
)
1346 if (live_pseudos_reg_renumber
[r2
->regno
] >= 0
1347 && rclass_intersect_p
[regno_allocno_class_array
[r2
->regno
]])
1348 sparseset_set_bit (live_range_hard_reg_pseudos
, r2
->regno
);
1354 /* Assign hard registers to reload pseudos and other pseudos. */
1356 assign_by_spills (void)
1358 int i
, n
, nfails
, iter
, regno
, hard_regno
, cost
;
1361 bitmap_head changed_insns
, do_not_assign_nonreload_pseudos
;
1362 unsigned int u
, conflict_regno
;
1365 int max_regno
= max_reg_num ();
1367 for (n
= 0, i
= lra_constraint_new_regno_start
; i
< max_regno
; i
++)
1368 if (reg_renumber
[i
] < 0 && lra_reg_info
[i
].nrefs
!= 0
1369 && regno_allocno_class_array
[i
] != NO_REGS
)
1370 sorted_pseudos
[n
++] = i
;
1371 bitmap_initialize (&insn_conflict_pseudos
, ®_obstack
);
1372 bitmap_initialize (&spill_pseudos_bitmap
, ®_obstack
);
1373 bitmap_initialize (&best_spill_pseudos_bitmap
, ®_obstack
);
1374 update_hard_regno_preference_check
= XCNEWVEC (int, max_regno
);
1375 curr_update_hard_regno_preference_check
= 0;
1376 memset (try_hard_reg_pseudos_check
, 0, sizeof (try_hard_reg_pseudos_check
));
1377 for (i
= 0; i
< FIRST_PSEUDO_REGISTER
; i
++)
1378 bitmap_initialize (&try_hard_reg_pseudos
[i
], ®_obstack
);
1379 curr_pseudo_check
= 0;
1380 bitmap_initialize (&changed_insns
, ®_obstack
);
1381 bitmap_initialize (&non_reload_pseudos
, ®_obstack
);
1382 bitmap_ior (&non_reload_pseudos
, &lra_inheritance_pseudos
, &lra_split_regs
);
1383 bitmap_ior_into (&non_reload_pseudos
, &lra_subreg_reload_pseudos
);
1384 bitmap_ior_into (&non_reload_pseudos
, &lra_optional_reload_pseudos
);
1385 for (iter
= 0; iter
<= 1; iter
++)
1387 qsort (sorted_pseudos
, n
, sizeof (int), reload_pseudo_compare_func
);
1389 for (i
= 0; i
< n
; i
++)
1391 regno
= sorted_pseudos
[i
];
1392 if (reg_renumber
[regno
] >= 0)
1394 if (lra_dump_file
!= NULL
)
1395 fprintf (lra_dump_file
, " Assigning to %d "
1396 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1397 regno
, reg_class_names
[regno_allocno_class_array
[regno
]],
1398 ORIGINAL_REGNO (regno_reg_rtx
[regno
]),
1399 lra_reg_info
[regno
].freq
, regno_assign_info
[regno
].first
,
1400 regno_assign_info
[regno_assign_info
[regno
].first
].freq
);
1401 hard_regno
= find_hard_regno_for (regno
, &cost
, -1, iter
== 1);
1402 reload_p
= ! bitmap_bit_p (&non_reload_pseudos
, regno
);
1403 if (hard_regno
< 0 && reload_p
)
1404 hard_regno
= spill_for (regno
, &all_spilled_pseudos
, iter
== 1);
1408 sorted_pseudos
[nfails
++] = regno
;
1412 /* This register might have been spilled by the previous
1413 pass. Indicate that it is no longer spilled. */
1414 bitmap_clear_bit (&all_spilled_pseudos
, regno
);
1415 assign_hard_regno (hard_regno
, regno
);
1417 /* As non-reload pseudo assignment is changed we
1418 should reconsider insns referring for the
1420 bitmap_set_bit (&changed_pseudo_bitmap
, regno
);
1427 /* We did not assign hard regs to reload pseudos after two iterations.
1428 Either it's an asm and something is wrong with the constraints, or
1429 we have run out of spill registers; error out in either case. */
1431 bitmap_head failed_reload_insns
;
1433 bitmap_initialize (&failed_reload_insns
, ®_obstack
);
1434 for (i
= 0; i
< nfails
; i
++)
1436 regno
= sorted_pseudos
[i
];
1437 bitmap_ior_into (&failed_reload_insns
,
1438 &lra_reg_info
[regno
].insn_bitmap
);
1439 /* Assign an arbitrary hard register of regno class to
1440 avoid further trouble with this insn. */
1441 bitmap_clear_bit (&all_spilled_pseudos
, regno
);
1443 (ira_class_hard_regs
[regno_allocno_class_array
[regno
]][0],
1446 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns
, 0, u
, bi
)
1448 insn
= lra_insn_recog_data
[u
]->insn
;
1449 if (asm_noperands (PATTERN (insn
)) >= 0)
1452 error_for_asm (insn
,
1453 "%<asm%> operand has impossible constraints");
1454 /* Avoid further trouble with this insn.
1455 For asm goto, instead of fixing up all the edges
1456 just clear the template and clear input operands
1457 (asm goto doesn't have any output operands). */
1460 rtx asm_op
= extract_asm_operands (PATTERN (insn
));
1461 ASM_OPERANDS_TEMPLATE (asm_op
) = ggc_strdup ("");
1462 ASM_OPERANDS_INPUT_VEC (asm_op
) = rtvec_alloc (0);
1463 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op
) = rtvec_alloc (0);
1464 lra_update_insn_regno_info (insn
);
1468 PATTERN (insn
) = gen_rtx_USE (VOIDmode
, const0_rtx
);
1469 lra_set_insn_deleted (insn
);
1474 error ("unable to find a register to spill");
1475 fatal_insn ("this is the insn:", insn
);
1480 /* This is a very rare event. We can not assign a hard register
1481 to reload pseudo because the hard register was assigned to
1482 another reload pseudo on a previous assignment pass. For x86
1483 example, on the 1st pass we assigned CX (although another
1484 hard register could be used for this) to reload pseudo in an
1485 insn, on the 2nd pass we need CX (and only this) hard
1486 register for a new reload pseudo in the same insn. Another
1487 possible situation may occur in assigning to multi-regs
1488 reload pseudos when hard regs pool is too fragmented even
1489 after spilling non-reload pseudos.
1491 We should do something radical here to succeed. Here we
1492 spill *all* conflicting pseudos and reassign them. */
1493 if (lra_dump_file
!= NULL
)
1494 fprintf (lra_dump_file
, " 2nd iter for reload pseudo assignments:\n");
1495 sparseset_clear (live_range_hard_reg_pseudos
);
1496 for (i
= 0; i
< nfails
; i
++)
1498 if (lra_dump_file
!= NULL
)
1499 fprintf (lra_dump_file
, " Reload r%d assignment failure\n",
1501 find_all_spills_for (sorted_pseudos
[i
]);
1503 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos
, conflict_regno
)
1505 if ((int) conflict_regno
>= lra_constraint_new_regno_start
)
1507 sorted_pseudos
[nfails
++] = conflict_regno
;
1508 former_reload_pseudo_spill_p
= true;
1510 if (lra_dump_file
!= NULL
)
1511 fprintf (lra_dump_file
, " Spill %s r%d(hr=%d, freq=%d)\n",
1512 pseudo_prefix_title (conflict_regno
), conflict_regno
,
1513 reg_renumber
[conflict_regno
],
1514 lra_reg_info
[conflict_regno
].freq
);
1515 update_lives (conflict_regno
, true);
1516 lra_setup_reg_renumber (conflict_regno
, -1, false);
1520 improve_inheritance (&changed_pseudo_bitmap
);
1521 bitmap_clear (&non_reload_pseudos
);
1522 bitmap_clear (&changed_insns
);
1525 /* We should not assign to original pseudos of inheritance
1526 pseudos or split pseudos if any its inheritance pseudo did
1527 not get hard register or any its split pseudo was not split
1528 because undo inheritance/split pass will extend live range of
1529 such inheritance or split pseudos. */
1530 bitmap_initialize (&do_not_assign_nonreload_pseudos
, ®_obstack
);
1531 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos
, 0, u
, bi
)
1532 if ((restore_rtx
= lra_reg_info
[u
].restore_rtx
) != NULL_RTX
1533 && REG_P (restore_rtx
)
1534 && reg_renumber
[u
] < 0
1535 && bitmap_bit_p (&lra_inheritance_pseudos
, u
))
1536 bitmap_set_bit (&do_not_assign_nonreload_pseudos
, REGNO (restore_rtx
));
1537 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs
, 0, u
, bi
)
1538 if ((restore_rtx
= lra_reg_info
[u
].restore_rtx
) != NULL_RTX
1539 && reg_renumber
[u
] >= 0)
1541 lra_assert (REG_P (restore_rtx
));
1542 bitmap_set_bit (&do_not_assign_nonreload_pseudos
, REGNO (restore_rtx
));
1544 for (n
= 0, i
= FIRST_PSEUDO_REGISTER
; i
< max_regno
; i
++)
1545 if (((i
< lra_constraint_new_regno_start
1546 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos
, i
))
1547 || (bitmap_bit_p (&lra_inheritance_pseudos
, i
)
1548 && lra_reg_info
[i
].restore_rtx
!= NULL_RTX
)
1549 || (bitmap_bit_p (&lra_split_regs
, i
)
1550 && lra_reg_info
[i
].restore_rtx
!= NULL_RTX
)
1551 || bitmap_bit_p (&lra_subreg_reload_pseudos
, i
)
1552 || bitmap_bit_p (&lra_optional_reload_pseudos
, i
))
1553 && reg_renumber
[i
] < 0 && lra_reg_info
[i
].nrefs
!= 0
1554 && regno_allocno_class_array
[i
] != NO_REGS
)
1555 sorted_pseudos
[n
++] = i
;
1556 bitmap_clear (&do_not_assign_nonreload_pseudos
);
1557 if (n
!= 0 && lra_dump_file
!= NULL
)
1558 fprintf (lra_dump_file
, " Reassigning non-reload pseudos\n");
1559 qsort (sorted_pseudos
, n
, sizeof (int), pseudo_compare_func
);
1560 for (i
= 0; i
< n
; i
++)
1562 regno
= sorted_pseudos
[i
];
1563 hard_regno
= find_hard_regno_for (regno
, &cost
, -1, false);
1564 if (hard_regno
>= 0)
1566 assign_hard_regno (hard_regno
, regno
);
1567 /* We change allocation for non-reload pseudo on this
1568 iteration -- mark the pseudo for invalidation of used
1569 alternatives of insns containing the pseudo. */
1570 bitmap_set_bit (&changed_pseudo_bitmap
, regno
);
1574 enum reg_class rclass
= lra_get_allocno_class (regno
);
1575 enum reg_class spill_class
;
1577 if (targetm
.spill_class
== NULL
1578 || lra_reg_info
[regno
].restore_rtx
== NULL_RTX
1579 || ! bitmap_bit_p (&lra_inheritance_pseudos
, regno
)
1583 ((reg_class_t
) rclass
,
1584 PSEUDO_REGNO_MODE (regno
)))) == NO_REGS
)
1586 regno_allocno_class_array
[regno
] = spill_class
;
1587 hard_regno
= find_hard_regno_for (regno
, &cost
, -1, false);
1589 regno_allocno_class_array
[regno
] = rclass
;
1593 (regno
, spill_class
, spill_class
, spill_class
);
1594 assign_hard_regno (hard_regno
, regno
);
1595 bitmap_set_bit (&changed_pseudo_bitmap
, regno
);
1600 free (update_hard_regno_preference_check
);
1601 bitmap_clear (&best_spill_pseudos_bitmap
);
1602 bitmap_clear (&spill_pseudos_bitmap
);
1603 bitmap_clear (&insn_conflict_pseudos
);
1607 /* Entry function to assign hard registers to new reload pseudos
1608 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1609 of old pseudos) and possibly to the old pseudos. The function adds
1610 what insns to process for the next constraint pass. Those are all
1611 insns who contains non-reload and non-inheritance pseudos with
1614 Return true if we did not spill any non-reload and non-inheritance
1622 bitmap_head insns_to_process
;
1624 int max_regno
= max_reg_num ();
1626 timevar_push (TV_LRA_ASSIGN
);
1627 lra_assignment_iter
++;
1628 if (lra_dump_file
!= NULL
)
1629 fprintf (lra_dump_file
, "\n********** Assignment #%d: **********\n\n",
1630 lra_assignment_iter
);
1632 sorted_pseudos
= XNEWVEC (int, max_regno
);
1633 sorted_reload_pseudos
= XNEWVEC (int, max_regno
);
1634 regno_allocno_class_array
= XNEWVEC (enum reg_class
, max_regno
);
1635 regno_live_length
= XNEWVEC (int, max_regno
);
1636 for (i
= FIRST_PSEUDO_REGISTER
; i
< max_regno
; i
++)
1641 regno_allocno_class_array
[i
] = lra_get_allocno_class (i
);
1642 for (l
= 0, r
= lra_reg_info
[i
].live_ranges
; r
!= NULL
; r
= r
->next
)
1643 l
+= r
->finish
- r
->start
+ 1;
1644 regno_live_length
[i
] = l
;
1646 former_reload_pseudo_spill_p
= false;
1647 init_regno_assign_info ();
1648 bitmap_initialize (&all_spilled_pseudos
, ®_obstack
);
1649 create_live_range_start_chains ();
1650 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos
);
1651 if (flag_checking
&& !flag_ipa_ra
)
1652 for (i
= FIRST_PSEUDO_REGISTER
; i
< max_regno
; i
++)
1653 if (lra_reg_info
[i
].nrefs
!= 0 && reg_renumber
[i
] >= 0
1654 && lra_reg_info
[i
].call_p
1655 && overlaps_hard_reg_set_p (call_used_reg_set
,
1656 PSEUDO_REGNO_MODE (i
), reg_renumber
[i
]))
1658 /* Setup insns to process on the next constraint pass. */
1659 bitmap_initialize (&changed_pseudo_bitmap
, ®_obstack
);
1660 init_live_reload_and_inheritance_pseudos ();
1661 assign_by_spills ();
1662 finish_live_reload_and_inheritance_pseudos ();
1663 bitmap_ior_into (&changed_pseudo_bitmap
, &all_spilled_pseudos
);
1665 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos
, 0, u
, bi
)
1666 /* We ignore spilled pseudos created on last inheritance pass
1667 because they will be removed. */
1668 if (lra_reg_info
[u
].restore_rtx
== NULL_RTX
)
1670 no_spills_p
= false;
1673 finish_live_range_start_chains ();
1674 bitmap_clear (&all_spilled_pseudos
);
1675 bitmap_initialize (&insns_to_process
, ®_obstack
);
1676 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap
, 0, u
, bi
)
1677 bitmap_ior_into (&insns_to_process
, &lra_reg_info
[u
].insn_bitmap
);
1678 bitmap_clear (&changed_pseudo_bitmap
);
1679 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process
, 0, u
, bi
)
1681 lra_push_insn_by_uid (u
);
1682 /* Invalidate alternatives for insn should be processed. */
1683 lra_set_used_insn_alternative_by_uid (u
, -1);
1685 bitmap_clear (&insns_to_process
);
1686 finish_regno_assign_info ();
1687 free (regno_live_length
);
1688 free (regno_allocno_class_array
);
1689 free (sorted_pseudos
);
1690 free (sorted_reload_pseudos
);
1692 timevar_pop (TV_LRA_ASSIGN
);
1693 if (former_reload_pseudo_spill_p
)
1694 lra_assignment_iter_after_spill
++;
1695 /* This is conditional on flag_checking because valid code can take
1696 more than this maximum number of iteration, but at the same time
1697 the test can uncover errors in machine descriptions. */
1699 && (lra_assignment_iter_after_spill
1700 > LRA_MAX_ASSIGNMENT_ITERATION_NUMBER
))
1702 ("Maximum number of LRA assignment passes is achieved (%d)\n",
1703 LRA_MAX_ASSIGNMENT_ITERATION_NUMBER
);