/cp
[official-gcc.git] / gcc / lra-assigns.c
blob839036c79e702efd6235772a22f57f088ceb01c4
1 /* Assign reload pseudos.
2 Copyright (C) 2010-2015 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
22 /* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
36 and spill registers.
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
50 copies.
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
64 Only insns with changed allocation pseudos are processed on the
65 next constraint pass.
67 The pseudo live-ranges are used to find conflicting pseudos.
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
75 restore_regno. */
77 #include "config.h"
78 #include "system.h"
79 #include "coretypes.h"
80 #include "backend.h"
81 #include "predict.h"
82 #include "tree.h"
83 #include "rtl.h"
84 #include "df.h"
85 #include "rtl-error.h"
86 #include "tm_p.h"
87 #include "target.h"
88 #include "insn-config.h"
89 #include "recog.h"
90 #include "output.h"
91 #include "regs.h"
92 #include "flags.h"
93 #include "alias.h"
94 #include "expmed.h"
95 #include "dojump.h"
96 #include "explow.h"
97 #include "calls.h"
98 #include "emit-rtl.h"
99 #include "varasm.h"
100 #include "stmt.h"
101 #include "expr.h"
102 #include "except.h"
103 #include "ira.h"
104 #include "sparseset.h"
105 #include "params.h"
106 #include "lra.h"
107 #include "insn-attr.h"
108 #include "insn-codes.h"
109 #include "lra-int.h"
111 /* Current iteration number of the pass and current iteration number
112 of the pass after the latest spill pass when any former reload
113 pseudo was spilled. */
114 int lra_assignment_iter;
115 int lra_assignment_iter_after_spill;
117 /* Flag of spilling former reload pseudos on this pass. */
118 static bool former_reload_pseudo_spill_p;
120 /* Array containing corresponding values of function
121 lra_get_allocno_class. It is used to speed up the code. */
122 static enum reg_class *regno_allocno_class_array;
124 /* Information about the thread to which a pseudo belongs. Threads are
125 a set of connected reload and inheritance pseudos with the same set of
126 available hard registers. Lone registers belong to their own threads. */
127 struct regno_assign_info
129 /* First/next pseudo of the same thread. */
130 int first, next;
131 /* Frequency of the thread (execution frequency of only reload
132 pseudos in the thread when the thread contains a reload pseudo).
133 Defined only for the first thread pseudo. */
134 int freq;
137 /* Map regno to the corresponding regno assignment info. */
138 static struct regno_assign_info *regno_assign_info;
140 /* All inherited, subreg or optional pseudos created before last spill
141 sub-pass. Such pseudos are permitted to get memory instead of hard
142 regs. */
143 static bitmap_head non_reload_pseudos;
145 /* Process a pseudo copy with execution frequency COPY_FREQ connecting
146 REGNO1 and REGNO2 to form threads. */
147 static void
148 process_copy_to_form_thread (int regno1, int regno2, int copy_freq)
150 int last, regno1_first, regno2_first;
152 lra_assert (regno1 >= lra_constraint_new_regno_start
153 && regno2 >= lra_constraint_new_regno_start);
154 regno1_first = regno_assign_info[regno1].first;
155 regno2_first = regno_assign_info[regno2].first;
156 if (regno1_first != regno2_first)
158 for (last = regno2_first;
159 regno_assign_info[last].next >= 0;
160 last = regno_assign_info[last].next)
161 regno_assign_info[last].first = regno1_first;
162 regno_assign_info[last].first = regno1_first;
163 regno_assign_info[last].next = regno_assign_info[regno1_first].next;
164 regno_assign_info[regno1_first].next = regno2_first;
165 regno_assign_info[regno1_first].freq
166 += regno_assign_info[regno2_first].freq;
168 regno_assign_info[regno1_first].freq -= 2 * copy_freq;
169 lra_assert (regno_assign_info[regno1_first].freq >= 0);
172 /* Initialize REGNO_ASSIGN_INFO and form threads. */
173 static void
174 init_regno_assign_info (void)
176 int i, regno1, regno2, max_regno = max_reg_num ();
177 lra_copy_t cp;
179 regno_assign_info = XNEWVEC (struct regno_assign_info, max_regno);
180 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
182 regno_assign_info[i].first = i;
183 regno_assign_info[i].next = -1;
184 regno_assign_info[i].freq = lra_reg_info[i].freq;
186 /* Form the threads. */
187 for (i = 0; (cp = lra_get_copy (i)) != NULL; i++)
188 if ((regno1 = cp->regno1) >= lra_constraint_new_regno_start
189 && (regno2 = cp->regno2) >= lra_constraint_new_regno_start
190 && reg_renumber[regno1] < 0 && lra_reg_info[regno1].nrefs != 0
191 && reg_renumber[regno2] < 0 && lra_reg_info[regno2].nrefs != 0
192 && (ira_class_hard_regs_num[regno_allocno_class_array[regno1]]
193 == ira_class_hard_regs_num[regno_allocno_class_array[regno2]]))
194 process_copy_to_form_thread (regno1, regno2, cp->freq);
197 /* Free REGNO_ASSIGN_INFO. */
198 static void
199 finish_regno_assign_info (void)
201 free (regno_assign_info);
204 /* The function is used to sort *reload* and *inheritance* pseudos to
205 try to assign them hard registers. We put pseudos from the same
206 thread always nearby. */
207 static int
208 reload_pseudo_compare_func (const void *v1p, const void *v2p)
210 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
211 enum reg_class cl1 = regno_allocno_class_array[r1];
212 enum reg_class cl2 = regno_allocno_class_array[r2];
213 int diff;
215 lra_assert (r1 >= lra_constraint_new_regno_start
216 && r2 >= lra_constraint_new_regno_start);
218 /* Prefer to assign reload registers with smaller classes first to
219 guarantee assignment to all reload registers. */
220 if ((diff = (ira_class_hard_regs_num[cl1]
221 - ira_class_hard_regs_num[cl2])) != 0)
222 return diff;
223 if ((diff
224 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
225 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0
226 /* The code below executes rarely as nregs == 1 in most cases.
227 So we should not worry about using faster data structures to
228 check reload pseudos. */
229 && ! bitmap_bit_p (&non_reload_pseudos, r1)
230 && ! bitmap_bit_p (&non_reload_pseudos, r2))
231 return diff;
232 if ((diff = (regno_assign_info[regno_assign_info[r2].first].freq
233 - regno_assign_info[regno_assign_info[r1].first].freq)) != 0)
234 return diff;
235 /* Allocate bigger pseudos first to avoid register file
236 fragmentation. */
237 if ((diff
238 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
239 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0)
240 return diff;
241 /* Put pseudos from the thread nearby. */
242 if ((diff = regno_assign_info[r1].first - regno_assign_info[r2].first) != 0)
243 return diff;
244 /* If regs are equally good, sort by their numbers, so that the
245 results of qsort leave nothing to chance. */
246 return r1 - r2;
249 /* The function is used to sort *non-reload* pseudos to try to assign
250 them hard registers. The order calculation is simpler than in the
251 previous function and based on the pseudo frequency usage. */
252 static int
253 pseudo_compare_func (const void *v1p, const void *v2p)
255 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
256 int diff;
258 /* Prefer to assign more frequently used registers first. */
259 if ((diff = lra_reg_info[r2].freq - lra_reg_info[r1].freq) != 0)
260 return diff;
262 /* If regs are equally good, sort by their numbers, so that the
263 results of qsort leave nothing to chance. */
264 return r1 - r2;
267 /* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
268 pseudo live ranges with given start point. We insert only live
269 ranges of pseudos interesting for assignment purposes. They are
270 reload pseudos and pseudos assigned to hard registers. */
271 static lra_live_range_t *start_point_ranges;
273 /* Used as a flag that a live range is not inserted in the start point
274 chain. */
275 static struct lra_live_range not_in_chain_mark;
277 /* Create and set up START_POINT_RANGES. */
278 static void
279 create_live_range_start_chains (void)
281 int i, max_regno;
282 lra_live_range_t r;
284 start_point_ranges = XCNEWVEC (lra_live_range_t, lra_live_max_point);
285 max_regno = max_reg_num ();
286 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
287 if (i >= lra_constraint_new_regno_start || reg_renumber[i] >= 0)
289 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
291 r->start_next = start_point_ranges[r->start];
292 start_point_ranges[r->start] = r;
295 else
297 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
298 r->start_next = &not_in_chain_mark;
302 /* Insert live ranges of pseudo REGNO into start chains if they are
303 not there yet. */
304 static void
305 insert_in_live_range_start_chain (int regno)
307 lra_live_range_t r = lra_reg_info[regno].live_ranges;
309 if (r->start_next != &not_in_chain_mark)
310 return;
311 for (; r != NULL; r = r->next)
313 r->start_next = start_point_ranges[r->start];
314 start_point_ranges[r->start] = r;
318 /* Free START_POINT_RANGES. */
319 static void
320 finish_live_range_start_chains (void)
322 gcc_assert (start_point_ranges != NULL);
323 free (start_point_ranges);
324 start_point_ranges = NULL;
327 /* Map: program point -> bitmap of all pseudos living at the point and
328 assigned to hard registers. */
329 static bitmap_head *live_hard_reg_pseudos;
330 static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack;
332 /* reg_renumber corresponding to pseudos marked in
333 live_hard_reg_pseudos. reg_renumber might be not matched to
334 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
335 live_hard_reg_pseudos. */
336 static int *live_pseudos_reg_renumber;
338 /* Sparseset used to calculate living hard reg pseudos for some program
339 point range. */
340 static sparseset live_range_hard_reg_pseudos;
342 /* Sparseset used to calculate living reload/inheritance pseudos for
343 some program point range. */
344 static sparseset live_range_reload_inheritance_pseudos;
346 /* Allocate and initialize the data about living pseudos at program
347 points. */
348 static void
349 init_lives (void)
351 int i, max_regno = max_reg_num ();
353 live_range_hard_reg_pseudos = sparseset_alloc (max_regno);
354 live_range_reload_inheritance_pseudos = sparseset_alloc (max_regno);
355 live_hard_reg_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
356 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack);
357 for (i = 0; i < lra_live_max_point; i++)
358 bitmap_initialize (&live_hard_reg_pseudos[i],
359 &live_hard_reg_pseudos_bitmap_obstack);
360 live_pseudos_reg_renumber = XNEWVEC (int, max_regno);
361 for (i = 0; i < max_regno; i++)
362 live_pseudos_reg_renumber[i] = -1;
365 /* Free the data about living pseudos at program points. */
366 static void
367 finish_lives (void)
369 sparseset_free (live_range_hard_reg_pseudos);
370 sparseset_free (live_range_reload_inheritance_pseudos);
371 free (live_hard_reg_pseudos);
372 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack);
373 free (live_pseudos_reg_renumber);
376 /* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
377 entries for pseudo REGNO. Assume that the register has been
378 spilled if FREE_P, otherwise assume that it has been assigned
379 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
380 ranges in the start chains when it is assumed to be assigned to a
381 hard register because we use the chains of pseudos assigned to hard
382 registers during allocation. */
383 static void
384 update_lives (int regno, bool free_p)
386 int p;
387 lra_live_range_t r;
389 if (reg_renumber[regno] < 0)
390 return;
391 live_pseudos_reg_renumber[regno] = free_p ? -1 : reg_renumber[regno];
392 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
394 for (p = r->start; p <= r->finish; p++)
395 if (free_p)
396 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
397 else
399 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
400 insert_in_live_range_start_chain (regno);
405 /* Sparseset used to calculate reload pseudos conflicting with a given
406 pseudo when we are trying to find a hard register for the given
407 pseudo. */
408 static sparseset conflict_reload_and_inheritance_pseudos;
410 /* Map: program point -> bitmap of all reload and inheritance pseudos
411 living at the point. */
412 static bitmap_head *live_reload_and_inheritance_pseudos;
413 static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack;
415 /* Allocate and initialize data about living reload pseudos at any
416 given program point. */
417 static void
418 init_live_reload_and_inheritance_pseudos (void)
420 int i, p, max_regno = max_reg_num ();
421 lra_live_range_t r;
423 conflict_reload_and_inheritance_pseudos = sparseset_alloc (max_regno);
424 live_reload_and_inheritance_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
425 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack);
426 for (p = 0; p < lra_live_max_point; p++)
427 bitmap_initialize (&live_reload_and_inheritance_pseudos[p],
428 &live_reload_and_inheritance_pseudos_bitmap_obstack);
429 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
431 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
432 for (p = r->start; p <= r->finish; p++)
433 bitmap_set_bit (&live_reload_and_inheritance_pseudos[p], i);
437 /* Finalize data about living reload pseudos at any given program
438 point. */
439 static void
440 finish_live_reload_and_inheritance_pseudos (void)
442 sparseset_free (conflict_reload_and_inheritance_pseudos);
443 free (live_reload_and_inheritance_pseudos);
444 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack);
447 /* The value used to check that cost of given hard reg is really
448 defined currently. */
449 static int curr_hard_regno_costs_check = 0;
450 /* Array used to check that cost of the corresponding hard reg (the
451 array element index) is really defined currently. */
452 static int hard_regno_costs_check[FIRST_PSEUDO_REGISTER];
453 /* The current costs of allocation of hard regs. Defined only if the
454 value of the corresponding element of the previous array is equal to
455 CURR_HARD_REGNO_COSTS_CHECK. */
456 static int hard_regno_costs[FIRST_PSEUDO_REGISTER];
458 /* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
459 not defined yet. */
460 static inline void
461 adjust_hard_regno_cost (int hard_regno, int incr)
463 if (hard_regno_costs_check[hard_regno] != curr_hard_regno_costs_check)
464 hard_regno_costs[hard_regno] = 0;
465 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
466 hard_regno_costs[hard_regno] += incr;
469 /* Try to find a free hard register for pseudo REGNO. Return the
470 hard register on success and set *COST to the cost of using
471 that register. (If several registers have equal cost, the one with
472 the highest priority wins.) Return -1 on failure.
474 If FIRST_P, return the first available hard reg ignoring other
475 criteria, e.g. allocation cost. This approach results in less hard
476 reg pool fragmentation and permit to allocate hard regs to reload
477 pseudos in complicated situations where pseudo sizes are different.
479 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
480 otherwise consider all hard registers in REGNO's class.
482 If REGNO_SET is not empty, only hard registers from the set are
483 considered. */
484 static int
485 find_hard_regno_for_1 (int regno, int *cost, int try_only_hard_regno,
486 bool first_p, HARD_REG_SET regno_set)
488 HARD_REG_SET conflict_set;
489 int best_cost = INT_MAX, best_priority = INT_MIN, best_usage = INT_MAX;
490 lra_live_range_t r;
491 int p, i, j, rclass_size, best_hard_regno, priority, hard_regno;
492 int hr, conflict_hr, nregs;
493 machine_mode biggest_mode;
494 unsigned int k, conflict_regno;
495 int offset, val, biggest_nregs, nregs_diff;
496 enum reg_class rclass;
497 bitmap_iterator bi;
498 bool *rclass_intersect_p;
499 HARD_REG_SET impossible_start_hard_regs, available_regs;
501 if (hard_reg_set_empty_p (regno_set))
502 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
503 else
505 COMPL_HARD_REG_SET (conflict_set, regno_set);
506 IOR_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
508 rclass = regno_allocno_class_array[regno];
509 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
510 curr_hard_regno_costs_check++;
511 sparseset_clear (conflict_reload_and_inheritance_pseudos);
512 sparseset_clear (live_range_hard_reg_pseudos);
513 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
514 biggest_mode = lra_reg_info[regno].biggest_mode;
515 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
517 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
518 if (rclass_intersect_p[regno_allocno_class_array[k]])
519 sparseset_set_bit (live_range_hard_reg_pseudos, k);
520 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos[r->start],
521 0, k, bi)
522 if (lra_reg_info[k].preferred_hard_regno1 >= 0
523 && live_pseudos_reg_renumber[k] < 0
524 && rclass_intersect_p[regno_allocno_class_array[k]])
525 sparseset_set_bit (conflict_reload_and_inheritance_pseudos, k);
526 for (p = r->start + 1; p <= r->finish; p++)
528 lra_live_range_t r2;
530 for (r2 = start_point_ranges[p];
531 r2 != NULL;
532 r2 = r2->start_next)
534 if (r2->regno >= lra_constraint_new_regno_start
535 && lra_reg_info[r2->regno].preferred_hard_regno1 >= 0
536 && live_pseudos_reg_renumber[r2->regno] < 0
537 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
538 sparseset_set_bit (conflict_reload_and_inheritance_pseudos,
539 r2->regno);
540 if (live_pseudos_reg_renumber[r2->regno] >= 0
541 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
542 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
546 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno1) >= 0)
548 adjust_hard_regno_cost
549 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit1);
550 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno2) >= 0)
551 adjust_hard_regno_cost
552 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit2);
554 #ifdef STACK_REGS
555 if (lra_reg_info[regno].no_stack_p)
556 for (i = FIRST_STACK_REG; i <= LAST_STACK_REG; i++)
557 SET_HARD_REG_BIT (conflict_set, i);
558 #endif
559 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos, regno);
560 val = lra_reg_info[regno].val;
561 offset = lra_reg_info[regno].offset;
562 CLEAR_HARD_REG_SET (impossible_start_hard_regs);
563 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
564 if (lra_reg_val_equal_p (conflict_regno, val, offset))
566 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
567 nregs = (hard_regno_nregs[conflict_hr]
568 [lra_reg_info[conflict_regno].biggest_mode]);
569 /* Remember about multi-register pseudos. For example, 2 hard
570 register pseudos can start on the same hard register but can
571 not start on HR and HR+1/HR-1. */
572 for (hr = conflict_hr + 1;
573 hr < FIRST_PSEUDO_REGISTER && hr < conflict_hr + nregs;
574 hr++)
575 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
576 for (hr = conflict_hr - 1;
577 hr >= 0 && hr + hard_regno_nregs[hr][biggest_mode] > conflict_hr;
578 hr--)
579 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
581 else
583 add_to_hard_reg_set (&conflict_set,
584 lra_reg_info[conflict_regno].biggest_mode,
585 live_pseudos_reg_renumber[conflict_regno]);
586 if (hard_reg_set_subset_p (reg_class_contents[rclass],
587 conflict_set))
588 return -1;
590 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos,
591 conflict_regno)
592 if (!lra_reg_val_equal_p (conflict_regno, val, offset))
594 lra_assert (live_pseudos_reg_renumber[conflict_regno] < 0);
595 if ((hard_regno
596 = lra_reg_info[conflict_regno].preferred_hard_regno1) >= 0)
598 adjust_hard_regno_cost
599 (hard_regno,
600 lra_reg_info[conflict_regno].preferred_hard_regno_profit1);
601 if ((hard_regno
602 = lra_reg_info[conflict_regno].preferred_hard_regno2) >= 0)
603 adjust_hard_regno_cost
604 (hard_regno,
605 lra_reg_info[conflict_regno].preferred_hard_regno_profit2);
608 /* Make sure that all registers in a multi-word pseudo belong to the
609 required class. */
610 IOR_COMPL_HARD_REG_SET (conflict_set, reg_class_contents[rclass]);
611 lra_assert (rclass != NO_REGS);
612 rclass_size = ira_class_hard_regs_num[rclass];
613 best_hard_regno = -1;
614 hard_regno = ira_class_hard_regs[rclass][0];
615 biggest_nregs = hard_regno_nregs[hard_regno][biggest_mode];
616 nregs_diff = (biggest_nregs
617 - hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)]);
618 COPY_HARD_REG_SET (available_regs, reg_class_contents[rclass]);
619 AND_COMPL_HARD_REG_SET (available_regs, lra_no_alloc_regs);
620 for (i = 0; i < rclass_size; i++)
622 if (try_only_hard_regno >= 0)
623 hard_regno = try_only_hard_regno;
624 else
625 hard_regno = ira_class_hard_regs[rclass][i];
626 if (! overlaps_hard_reg_set_p (conflict_set,
627 PSEUDO_REGNO_MODE (regno), hard_regno)
628 /* We can not use prohibited_class_mode_regs because it is
629 not defined for all classes. */
630 && HARD_REGNO_MODE_OK (hard_regno, PSEUDO_REGNO_MODE (regno))
631 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
632 && (nregs_diff == 0
633 || (WORDS_BIG_ENDIAN
634 ? (hard_regno - nregs_diff >= 0
635 && TEST_HARD_REG_BIT (available_regs,
636 hard_regno - nregs_diff))
637 : TEST_HARD_REG_BIT (available_regs,
638 hard_regno + nregs_diff))))
640 if (hard_regno_costs_check[hard_regno]
641 != curr_hard_regno_costs_check)
643 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
644 hard_regno_costs[hard_regno] = 0;
646 for (j = 0;
647 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
648 j++)
649 if (! TEST_HARD_REG_BIT (call_used_reg_set, hard_regno + j)
650 && ! df_regs_ever_live_p (hard_regno + j))
651 /* It needs save restore. */
652 hard_regno_costs[hard_regno]
653 += (2
654 * REG_FREQ_FROM_BB (ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
655 + 1);
656 priority = targetm.register_priority (hard_regno);
657 if (best_hard_regno < 0 || hard_regno_costs[hard_regno] < best_cost
658 || (hard_regno_costs[hard_regno] == best_cost
659 && (priority > best_priority
660 || (targetm.register_usage_leveling_p ()
661 && priority == best_priority
662 && best_usage > lra_hard_reg_usage[hard_regno]))))
664 best_hard_regno = hard_regno;
665 best_cost = hard_regno_costs[hard_regno];
666 best_priority = priority;
667 best_usage = lra_hard_reg_usage[hard_regno];
670 if (try_only_hard_regno >= 0 || (first_p && best_hard_regno >= 0))
671 break;
673 if (best_hard_regno >= 0)
674 *cost = best_cost - lra_reg_info[regno].freq;
675 return best_hard_regno;
678 /* A wrapper for find_hard_regno_for_1 (see comments for that function
679 description). This function tries to find a hard register for
680 preferred class first if it is worth. */
681 static int
682 find_hard_regno_for (int regno, int *cost, int try_only_hard_regno, bool first_p)
684 int hard_regno;
685 HARD_REG_SET regno_set;
687 /* Only original pseudos can have a different preferred class. */
688 if (try_only_hard_regno < 0 && regno < lra_new_regno_start)
690 enum reg_class pref_class = reg_preferred_class (regno);
692 if (regno_allocno_class_array[regno] != pref_class)
694 hard_regno = find_hard_regno_for_1 (regno, cost, -1, first_p,
695 reg_class_contents[pref_class]);
696 if (hard_regno >= 0)
697 return hard_regno;
700 CLEAR_HARD_REG_SET (regno_set);
701 return find_hard_regno_for_1 (regno, cost, try_only_hard_regno, first_p,
702 regno_set);
705 /* Current value used for checking elements in
706 update_hard_regno_preference_check. */
707 static int curr_update_hard_regno_preference_check;
708 /* If an element value is equal to the above variable value, then the
709 corresponding regno has been processed for preference
710 propagation. */
711 static int *update_hard_regno_preference_check;
713 /* Update the preference for using HARD_REGNO for pseudos that are
714 connected directly or indirectly with REGNO. Apply divisor DIV
715 to any preference adjustments.
717 The more indirectly a pseudo is connected, the smaller its effect
718 should be. We therefore increase DIV on each "hop". */
719 static void
720 update_hard_regno_preference (int regno, int hard_regno, int div)
722 int another_regno, cost;
723 lra_copy_t cp, next_cp;
725 /* Search depth 5 seems to be enough. */
726 if (div > (1 << 5))
727 return;
728 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
730 if (cp->regno1 == regno)
732 next_cp = cp->regno1_next;
733 another_regno = cp->regno2;
735 else if (cp->regno2 == regno)
737 next_cp = cp->regno2_next;
738 another_regno = cp->regno1;
740 else
741 gcc_unreachable ();
742 if (reg_renumber[another_regno] < 0
743 && (update_hard_regno_preference_check[another_regno]
744 != curr_update_hard_regno_preference_check))
746 update_hard_regno_preference_check[another_regno]
747 = curr_update_hard_regno_preference_check;
748 cost = cp->freq < div ? 1 : cp->freq / div;
749 lra_setup_reload_pseudo_preferenced_hard_reg
750 (another_regno, hard_regno, cost);
751 update_hard_regno_preference (another_regno, hard_regno, div * 2);
756 /* Return prefix title for pseudo REGNO. */
757 static const char *
758 pseudo_prefix_title (int regno)
760 return
761 (regno < lra_constraint_new_regno_start ? ""
762 : bitmap_bit_p (&lra_inheritance_pseudos, regno) ? "inheritance "
763 : bitmap_bit_p (&lra_split_regs, regno) ? "split "
764 : bitmap_bit_p (&lra_optional_reload_pseudos, regno) ? "optional reload "
765 : bitmap_bit_p (&lra_subreg_reload_pseudos, regno) ? "subreg reload "
766 : "reload ");
769 /* Update REG_RENUMBER and other pseudo preferences by assignment of
770 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
771 void
772 lra_setup_reg_renumber (int regno, int hard_regno, bool print_p)
774 int i, hr;
776 /* We can not just reassign hard register. */
777 lra_assert (hard_regno < 0 || reg_renumber[regno] < 0);
778 if ((hr = hard_regno) < 0)
779 hr = reg_renumber[regno];
780 reg_renumber[regno] = hard_regno;
781 lra_assert (hr >= 0);
782 for (i = 0; i < hard_regno_nregs[hr][PSEUDO_REGNO_MODE (regno)]; i++)
783 if (hard_regno < 0)
784 lra_hard_reg_usage[hr + i] -= lra_reg_info[regno].freq;
785 else
786 lra_hard_reg_usage[hr + i] += lra_reg_info[regno].freq;
787 if (print_p && lra_dump_file != NULL)
788 fprintf (lra_dump_file, " Assign %d to %sr%d (freq=%d)\n",
789 reg_renumber[regno], pseudo_prefix_title (regno),
790 regno, lra_reg_info[regno].freq);
791 if (hard_regno >= 0)
793 curr_update_hard_regno_preference_check++;
794 update_hard_regno_preference (regno, hard_regno, 1);
798 /* Pseudos which occur in insns containing a particular pseudo. */
799 static bitmap_head insn_conflict_pseudos;
801 /* Bitmaps used to contain spill pseudos for given pseudo hard regno
802 and best spill pseudos for given pseudo (and best hard regno). */
803 static bitmap_head spill_pseudos_bitmap, best_spill_pseudos_bitmap;
805 /* Current pseudo check for validity of elements in
806 TRY_HARD_REG_PSEUDOS. */
807 static int curr_pseudo_check;
808 /* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
809 static int try_hard_reg_pseudos_check[FIRST_PSEUDO_REGISTER];
810 /* Pseudos who hold given hard register at the considered points. */
811 static bitmap_head try_hard_reg_pseudos[FIRST_PSEUDO_REGISTER];
813 /* Set up try_hard_reg_pseudos for given program point P and class
814 RCLASS. Those are pseudos living at P and assigned to a hard
815 register of RCLASS. In other words, those are pseudos which can be
816 spilled to assign a hard register of RCLASS to a pseudo living at
817 P. */
818 static void
819 setup_try_hard_regno_pseudos (int p, enum reg_class rclass)
821 int i, hard_regno;
822 machine_mode mode;
823 unsigned int spill_regno;
824 bitmap_iterator bi;
826 /* Find what pseudos could be spilled. */
827 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[p], 0, spill_regno, bi)
829 mode = PSEUDO_REGNO_MODE (spill_regno);
830 hard_regno = live_pseudos_reg_renumber[spill_regno];
831 if (overlaps_hard_reg_set_p (reg_class_contents[rclass],
832 mode, hard_regno))
834 for (i = hard_regno_nregs[hard_regno][mode] - 1; i >= 0; i--)
836 if (try_hard_reg_pseudos_check[hard_regno + i]
837 != curr_pseudo_check)
839 try_hard_reg_pseudos_check[hard_regno + i]
840 = curr_pseudo_check;
841 bitmap_clear (&try_hard_reg_pseudos[hard_regno + i]);
843 bitmap_set_bit (&try_hard_reg_pseudos[hard_regno + i],
844 spill_regno);
850 /* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
851 assignment means that we might undo the data change. */
852 static void
853 assign_temporarily (int regno, int hard_regno)
855 int p;
856 lra_live_range_t r;
858 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
860 for (p = r->start; p <= r->finish; p++)
861 if (hard_regno < 0)
862 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
863 else
865 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
866 insert_in_live_range_start_chain (regno);
869 live_pseudos_reg_renumber[regno] = hard_regno;
872 /* Array used for sorting reload pseudos for subsequent allocation
873 after spilling some pseudo. */
874 static int *sorted_reload_pseudos;
876 /* Spill some pseudos for a reload pseudo REGNO and return hard
877 register which should be used for pseudo after spilling. The
878 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
879 choose hard register (and pseudos occupying the hard registers and
880 to be spilled), we take into account not only how REGNO will
881 benefit from the spills but also how other reload pseudos not yet
882 assigned to hard registers benefit from the spills too. In very
883 rare cases, the function can fail and return -1.
885 If FIRST_P, return the first available hard reg ignoring other
886 criteria, e.g. allocation cost and cost of spilling non-reload
887 pseudos. This approach results in less hard reg pool fragmentation
888 and permit to allocate hard regs to reload pseudos in complicated
889 situations where pseudo sizes are different. */
890 static int
891 spill_for (int regno, bitmap spilled_pseudo_bitmap, bool first_p)
893 int i, j, n, p, hard_regno, best_hard_regno, cost, best_cost, rclass_size;
894 int reload_hard_regno, reload_cost;
895 machine_mode mode;
896 enum reg_class rclass;
897 unsigned int spill_regno, reload_regno, uid;
898 int insn_pseudos_num, best_insn_pseudos_num;
899 int bad_spills_num, smallest_bad_spills_num;
900 lra_live_range_t r;
901 bitmap_iterator bi;
903 rclass = regno_allocno_class_array[regno];
904 lra_assert (reg_renumber[regno] < 0 && rclass != NO_REGS);
905 bitmap_clear (&insn_conflict_pseudos);
906 bitmap_clear (&best_spill_pseudos_bitmap);
907 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
909 struct lra_insn_reg *ir;
911 for (ir = lra_get_insn_regs (uid); ir != NULL; ir = ir->next)
912 if (ir->regno >= FIRST_PSEUDO_REGISTER)
913 bitmap_set_bit (&insn_conflict_pseudos, ir->regno);
915 best_hard_regno = -1;
916 best_cost = INT_MAX;
917 best_insn_pseudos_num = INT_MAX;
918 smallest_bad_spills_num = INT_MAX;
919 rclass_size = ira_class_hard_regs_num[rclass];
920 mode = PSEUDO_REGNO_MODE (regno);
921 /* Invalidate try_hard_reg_pseudos elements. */
922 curr_pseudo_check++;
923 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
924 for (p = r->start; p <= r->finish; p++)
925 setup_try_hard_regno_pseudos (p, rclass);
926 for (i = 0; i < rclass_size; i++)
928 hard_regno = ira_class_hard_regs[rclass][i];
929 bitmap_clear (&spill_pseudos_bitmap);
930 for (j = hard_regno_nregs[hard_regno][mode] - 1; j >= 0; j--)
932 if (try_hard_reg_pseudos_check[hard_regno + j] != curr_pseudo_check)
933 continue;
934 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos[hard_regno + j]));
935 bitmap_ior_into (&spill_pseudos_bitmap,
936 &try_hard_reg_pseudos[hard_regno + j]);
938 /* Spill pseudos. */
939 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
940 if ((pic_offset_table_rtx != NULL
941 && spill_regno == REGNO (pic_offset_table_rtx))
942 || ((int) spill_regno >= lra_constraint_new_regno_start
943 && ! bitmap_bit_p (&lra_inheritance_pseudos, spill_regno)
944 && ! bitmap_bit_p (&lra_split_regs, spill_regno)
945 && ! bitmap_bit_p (&lra_subreg_reload_pseudos, spill_regno)
946 && ! bitmap_bit_p (&lra_optional_reload_pseudos, spill_regno)))
947 goto fail;
948 insn_pseudos_num = 0;
949 bad_spills_num = 0;
950 if (lra_dump_file != NULL)
951 fprintf (lra_dump_file, " Trying %d:", hard_regno);
952 sparseset_clear (live_range_reload_inheritance_pseudos);
953 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
955 if (bitmap_bit_p (&insn_conflict_pseudos, spill_regno))
956 insn_pseudos_num++;
957 if (spill_regno >= (unsigned int) lra_bad_spill_regno_start)
958 bad_spills_num++;
959 for (r = lra_reg_info[spill_regno].live_ranges;
960 r != NULL;
961 r = r->next)
963 for (p = r->start; p <= r->finish; p++)
965 lra_live_range_t r2;
967 for (r2 = start_point_ranges[p];
968 r2 != NULL;
969 r2 = r2->start_next)
970 if (r2->regno >= lra_constraint_new_regno_start)
971 sparseset_set_bit (live_range_reload_inheritance_pseudos,
972 r2->regno);
976 n = 0;
977 if (sparseset_cardinality (live_range_reload_inheritance_pseudos)
978 <= (unsigned)LRA_MAX_CONSIDERED_RELOAD_PSEUDOS)
979 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos,
980 reload_regno)
981 if ((int) reload_regno != regno
982 && (ira_reg_classes_intersect_p
983 [rclass][regno_allocno_class_array[reload_regno]])
984 && live_pseudos_reg_renumber[reload_regno] < 0
985 && find_hard_regno_for (reload_regno, &cost, -1, first_p) < 0)
986 sorted_reload_pseudos[n++] = reload_regno;
987 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
989 update_lives (spill_regno, true);
990 if (lra_dump_file != NULL)
991 fprintf (lra_dump_file, " spill %d(freq=%d)",
992 spill_regno, lra_reg_info[spill_regno].freq);
994 hard_regno = find_hard_regno_for (regno, &cost, -1, first_p);
995 if (hard_regno >= 0)
997 assign_temporarily (regno, hard_regno);
998 qsort (sorted_reload_pseudos, n, sizeof (int),
999 reload_pseudo_compare_func);
1000 for (j = 0; j < n; j++)
1002 reload_regno = sorted_reload_pseudos[j];
1003 lra_assert (live_pseudos_reg_renumber[reload_regno] < 0);
1004 if ((reload_hard_regno
1005 = find_hard_regno_for (reload_regno,
1006 &reload_cost, -1, first_p)) >= 0)
1008 if (lra_dump_file != NULL)
1009 fprintf (lra_dump_file, " assign %d(cost=%d)",
1010 reload_regno, reload_cost);
1011 assign_temporarily (reload_regno, reload_hard_regno);
1012 cost += reload_cost;
1015 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1017 rtx_insn_list *x;
1019 cost += lra_reg_info[spill_regno].freq;
1020 if (ira_reg_equiv[spill_regno].memory != NULL
1021 || ira_reg_equiv[spill_regno].constant != NULL)
1022 for (x = ira_reg_equiv[spill_regno].init_insns;
1023 x != NULL;
1024 x = x->next ())
1025 cost -= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (x->insn ()));
1027 if (best_insn_pseudos_num > insn_pseudos_num
1028 || (best_insn_pseudos_num == insn_pseudos_num
1029 && (bad_spills_num < smallest_bad_spills_num
1030 || (bad_spills_num == smallest_bad_spills_num
1031 && best_cost > cost))))
1033 best_insn_pseudos_num = insn_pseudos_num;
1034 smallest_bad_spills_num = bad_spills_num;
1035 best_cost = cost;
1036 best_hard_regno = hard_regno;
1037 bitmap_copy (&best_spill_pseudos_bitmap, &spill_pseudos_bitmap);
1038 if (lra_dump_file != NULL)
1039 fprintf (lra_dump_file,
1040 " Now best %d(cost=%d, bad_spills=%d, insn_pseudos=%d)\n",
1041 hard_regno, cost, bad_spills_num, insn_pseudos_num);
1043 assign_temporarily (regno, -1);
1044 for (j = 0; j < n; j++)
1046 reload_regno = sorted_reload_pseudos[j];
1047 if (live_pseudos_reg_renumber[reload_regno] >= 0)
1048 assign_temporarily (reload_regno, -1);
1051 if (lra_dump_file != NULL)
1052 fprintf (lra_dump_file, "\n");
1053 /* Restore the live hard reg pseudo info for spilled pseudos. */
1054 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1055 update_lives (spill_regno, false);
1056 fail:
1059 /* Spill: */
1060 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap, 0, spill_regno, bi)
1062 if ((int) spill_regno >= lra_constraint_new_regno_start)
1063 former_reload_pseudo_spill_p = true;
1064 if (lra_dump_file != NULL)
1065 fprintf (lra_dump_file, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
1066 pseudo_prefix_title (spill_regno),
1067 spill_regno, reg_renumber[spill_regno],
1068 lra_reg_info[spill_regno].freq, regno);
1069 update_lives (spill_regno, true);
1070 lra_setup_reg_renumber (spill_regno, -1, false);
1072 bitmap_ior_into (spilled_pseudo_bitmap, &best_spill_pseudos_bitmap);
1073 return best_hard_regno;
1076 /* Assign HARD_REGNO to REGNO. */
1077 static void
1078 assign_hard_regno (int hard_regno, int regno)
1080 int i;
1082 lra_assert (hard_regno >= 0);
1083 lra_setup_reg_renumber (regno, hard_regno, true);
1084 update_lives (regno, false);
1085 for (i = 0;
1086 i < hard_regno_nregs[hard_regno][lra_reg_info[regno].biggest_mode];
1087 i++)
1088 df_set_regs_ever_live (hard_regno + i, true);
1091 /* Array used for sorting different pseudos. */
1092 static int *sorted_pseudos;
1094 /* The constraints pass is allowed to create equivalences between
1095 pseudos that make the current allocation "incorrect" (in the sense
1096 that pseudos are assigned to hard registers from their own conflict
1097 sets). The global variable lra_risky_transformations_p says
1098 whether this might have happened.
1100 Process pseudos assigned to hard registers (less frequently used
1101 first), spill if a conflict is found, and mark the spilled pseudos
1102 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1103 pseudos, assigned to hard registers. */
1104 static void
1105 setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1106 spilled_pseudo_bitmap)
1108 int p, i, j, n, regno, hard_regno;
1109 unsigned int k, conflict_regno;
1110 int val, offset;
1111 HARD_REG_SET conflict_set;
1112 machine_mode mode;
1113 lra_live_range_t r;
1114 bitmap_iterator bi;
1115 int max_regno = max_reg_num ();
1117 if (! lra_risky_transformations_p)
1119 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1120 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1121 update_lives (i, false);
1122 return;
1124 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1125 if ((pic_offset_table_rtx == NULL_RTX
1126 || i != (int) REGNO (pic_offset_table_rtx))
1127 && reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1128 sorted_pseudos[n++] = i;
1129 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1130 if (pic_offset_table_rtx != NULL_RTX
1131 && (regno = REGNO (pic_offset_table_rtx)) >= FIRST_PSEUDO_REGISTER
1132 && reg_renumber[regno] >= 0 && lra_reg_info[regno].nrefs > 0)
1133 sorted_pseudos[n++] = regno;
1134 for (i = n - 1; i >= 0; i--)
1136 regno = sorted_pseudos[i];
1137 hard_regno = reg_renumber[regno];
1138 lra_assert (hard_regno >= 0);
1139 mode = lra_reg_info[regno].biggest_mode;
1140 sparseset_clear (live_range_hard_reg_pseudos);
1141 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1143 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1144 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1145 for (p = r->start + 1; p <= r->finish; p++)
1147 lra_live_range_t r2;
1149 for (r2 = start_point_ranges[p];
1150 r2 != NULL;
1151 r2 = r2->start_next)
1152 if (live_pseudos_reg_renumber[r2->regno] >= 0)
1153 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1156 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
1157 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
1158 val = lra_reg_info[regno].val;
1159 offset = lra_reg_info[regno].offset;
1160 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1161 if (!lra_reg_val_equal_p (conflict_regno, val, offset)
1162 /* If it is multi-register pseudos they should start on
1163 the same hard register. */
1164 || hard_regno != reg_renumber[conflict_regno])
1165 add_to_hard_reg_set (&conflict_set,
1166 lra_reg_info[conflict_regno].biggest_mode,
1167 reg_renumber[conflict_regno]);
1168 if (! overlaps_hard_reg_set_p (conflict_set, mode, hard_regno))
1170 update_lives (regno, false);
1171 continue;
1173 bitmap_set_bit (spilled_pseudo_bitmap, regno);
1174 for (j = 0;
1175 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
1176 j++)
1177 lra_hard_reg_usage[hard_regno + j] -= lra_reg_info[regno].freq;
1178 reg_renumber[regno] = -1;
1179 if (regno >= lra_constraint_new_regno_start)
1180 former_reload_pseudo_spill_p = true;
1181 if (lra_dump_file != NULL)
1182 fprintf (lra_dump_file, " Spill r%d after risky transformations\n",
1183 regno);
1187 /* Improve allocation by assigning the same hard regno of inheritance
1188 pseudos to the connected pseudos. We need this because inheritance
1189 pseudos are allocated after reload pseudos in the thread and when
1190 we assign a hard register to a reload pseudo we don't know yet that
1191 the connected inheritance pseudos can get the same hard register.
1192 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1193 static void
1194 improve_inheritance (bitmap changed_pseudos)
1196 unsigned int k;
1197 int regno, another_regno, hard_regno, another_hard_regno, cost, i, n;
1198 lra_copy_t cp, next_cp;
1199 bitmap_iterator bi;
1201 if (lra_inheritance_iter > LRA_MAX_INHERITANCE_PASSES)
1202 return;
1203 n = 0;
1204 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, k, bi)
1205 if (reg_renumber[k] >= 0 && lra_reg_info[k].nrefs != 0)
1206 sorted_pseudos[n++] = k;
1207 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1208 for (i = 0; i < n; i++)
1210 regno = sorted_pseudos[i];
1211 hard_regno = reg_renumber[regno];
1212 lra_assert (hard_regno >= 0);
1213 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
1215 if (cp->regno1 == regno)
1217 next_cp = cp->regno1_next;
1218 another_regno = cp->regno2;
1220 else if (cp->regno2 == regno)
1222 next_cp = cp->regno2_next;
1223 another_regno = cp->regno1;
1225 else
1226 gcc_unreachable ();
1227 /* Don't change reload pseudo allocation. It might have
1228 this allocation for a purpose and changing it can result
1229 in LRA cycling. */
1230 if ((another_regno < lra_constraint_new_regno_start
1231 || bitmap_bit_p (&lra_inheritance_pseudos, another_regno))
1232 && (another_hard_regno = reg_renumber[another_regno]) >= 0
1233 && another_hard_regno != hard_regno)
1235 if (lra_dump_file != NULL)
1236 fprintf
1237 (lra_dump_file,
1238 " Improving inheritance for %d(%d) and %d(%d)...\n",
1239 regno, hard_regno, another_regno, another_hard_regno);
1240 update_lives (another_regno, true);
1241 lra_setup_reg_renumber (another_regno, -1, false);
1242 if (hard_regno == find_hard_regno_for (another_regno, &cost,
1243 hard_regno, false))
1244 assign_hard_regno (hard_regno, another_regno);
1245 else
1246 assign_hard_regno (another_hard_regno, another_regno);
1247 bitmap_set_bit (changed_pseudos, another_regno);
1254 /* Bitmap finally containing all pseudos spilled on this assignment
1255 pass. */
1256 static bitmap_head all_spilled_pseudos;
1257 /* All pseudos whose allocation was changed. */
1258 static bitmap_head changed_pseudo_bitmap;
1261 /* Add to LIVE_RANGE_HARD_REG_PSEUDOS all pseudos conflicting with
1262 REGNO and whose hard regs can be assigned to REGNO. */
1263 static void
1264 find_all_spills_for (int regno)
1266 int p;
1267 lra_live_range_t r;
1268 unsigned int k;
1269 bitmap_iterator bi;
1270 enum reg_class rclass;
1271 bool *rclass_intersect_p;
1273 rclass = regno_allocno_class_array[regno];
1274 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
1275 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1277 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1278 if (rclass_intersect_p[regno_allocno_class_array[k]])
1279 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1280 for (p = r->start + 1; p <= r->finish; p++)
1282 lra_live_range_t r2;
1284 for (r2 = start_point_ranges[p];
1285 r2 != NULL;
1286 r2 = r2->start_next)
1288 if (live_pseudos_reg_renumber[r2->regno] >= 0
1289 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
1290 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1296 /* Assign hard registers to reload pseudos and other pseudos. */
1297 static void
1298 assign_by_spills (void)
1300 int i, n, nfails, iter, regno, hard_regno, cost, restore_regno;
1301 rtx_insn *insn;
1302 bitmap_head changed_insns, do_not_assign_nonreload_pseudos;
1303 unsigned int u, conflict_regno;
1304 bitmap_iterator bi;
1305 bool reload_p;
1306 int max_regno = max_reg_num ();
1308 for (n = 0, i = lra_constraint_new_regno_start; i < max_regno; i++)
1309 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1310 && regno_allocno_class_array[i] != NO_REGS)
1311 sorted_pseudos[n++] = i;
1312 bitmap_initialize (&insn_conflict_pseudos, &reg_obstack);
1313 bitmap_initialize (&spill_pseudos_bitmap, &reg_obstack);
1314 bitmap_initialize (&best_spill_pseudos_bitmap, &reg_obstack);
1315 update_hard_regno_preference_check = XCNEWVEC (int, max_regno);
1316 curr_update_hard_regno_preference_check = 0;
1317 memset (try_hard_reg_pseudos_check, 0, sizeof (try_hard_reg_pseudos_check));
1318 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1319 bitmap_initialize (&try_hard_reg_pseudos[i], &reg_obstack);
1320 curr_pseudo_check = 0;
1321 bitmap_initialize (&changed_insns, &reg_obstack);
1322 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1323 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
1324 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
1325 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
1326 for (iter = 0; iter <= 1; iter++)
1328 qsort (sorted_pseudos, n, sizeof (int), reload_pseudo_compare_func);
1329 nfails = 0;
1330 for (i = 0; i < n; i++)
1332 regno = sorted_pseudos[i];
1333 if (lra_dump_file != NULL)
1334 fprintf (lra_dump_file, " Assigning to %d "
1335 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1336 regno, reg_class_names[regno_allocno_class_array[regno]],
1337 ORIGINAL_REGNO (regno_reg_rtx[regno]),
1338 lra_reg_info[regno].freq, regno_assign_info[regno].first,
1339 regno_assign_info[regno_assign_info[regno].first].freq);
1340 hard_regno = find_hard_regno_for (regno, &cost, -1, iter == 1);
1341 reload_p = ! bitmap_bit_p (&non_reload_pseudos, regno);
1342 if (hard_regno < 0 && reload_p)
1343 hard_regno = spill_for (regno, &all_spilled_pseudos, iter == 1);
1344 if (hard_regno < 0)
1346 if (reload_p)
1347 sorted_pseudos[nfails++] = regno;
1349 else
1351 /* This register might have been spilled by the previous
1352 pass. Indicate that it is no longer spilled. */
1353 bitmap_clear_bit (&all_spilled_pseudos, regno);
1354 assign_hard_regno (hard_regno, regno);
1355 if (! reload_p)
1356 /* As non-reload pseudo assignment is changed we
1357 should reconsider insns referring for the
1358 pseudo. */
1359 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1362 if (nfails == 0)
1363 break;
1364 if (iter > 0)
1366 /* We did not assign hard regs to reload pseudos after two iterations.
1367 Either it's an asm and something is wrong with the constraints, or
1368 we have run out of spill registers; error out in either case. */
1369 bool asm_p = false;
1370 bitmap_head failed_reload_insns;
1372 bitmap_initialize (&failed_reload_insns, &reg_obstack);
1373 for (i = 0; i < nfails; i++)
1375 regno = sorted_pseudos[i];
1376 bitmap_ior_into (&failed_reload_insns,
1377 &lra_reg_info[regno].insn_bitmap);
1378 /* Assign an arbitrary hard register of regno class to
1379 avoid further trouble with this insn. */
1380 bitmap_clear_bit (&all_spilled_pseudos, regno);
1381 assign_hard_regno
1382 (ira_class_hard_regs[regno_allocno_class_array[regno]][0],
1383 regno);
1385 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns, 0, u, bi)
1387 insn = lra_insn_recog_data[u]->insn;
1388 if (asm_noperands (PATTERN (insn)) >= 0)
1390 asm_p = true;
1391 error_for_asm (insn,
1392 "%<asm%> operand has impossible constraints");
1393 /* Avoid further trouble with this insn.
1394 For asm goto, instead of fixing up all the edges
1395 just clear the template and clear input operands
1396 (asm goto doesn't have any output operands). */
1397 if (JUMP_P (insn))
1399 rtx asm_op = extract_asm_operands (PATTERN (insn));
1400 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1401 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1402 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1403 lra_update_insn_regno_info (insn);
1405 else
1407 PATTERN (insn) = gen_rtx_USE (VOIDmode, const0_rtx);
1408 lra_set_insn_deleted (insn);
1411 else if (!asm_p)
1413 error ("unable to find a register to spill");
1414 fatal_insn ("this is the insn:", insn);
1417 break;
1419 /* This is a very rare event. We can not assign a hard register
1420 to reload pseudo because the hard register was assigned to
1421 another reload pseudo on a previous assignment pass. For x86
1422 example, on the 1st pass we assigned CX (although another
1423 hard register could be used for this) to reload pseudo in an
1424 insn, on the 2nd pass we need CX (and only this) hard
1425 register for a new reload pseudo in the same insn. Another
1426 possible situation may occur in assigning to multi-regs
1427 reload pseudos when hard regs pool is too fragmented even
1428 after spilling non-reload pseudos.
1430 We should do something radical here to succeed. Here we
1431 spill *all* conflicting pseudos and reassign them. */
1432 if (lra_dump_file != NULL)
1433 fprintf (lra_dump_file, " 2nd iter for reload pseudo assignments:\n");
1434 sparseset_clear (live_range_hard_reg_pseudos);
1435 for (i = 0; i < nfails; i++)
1437 if (lra_dump_file != NULL)
1438 fprintf (lra_dump_file, " Reload r%d assignment failure\n",
1439 sorted_pseudos[i]);
1440 find_all_spills_for (sorted_pseudos[i]);
1442 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1444 if ((int) conflict_regno >= lra_constraint_new_regno_start)
1446 sorted_pseudos[nfails++] = conflict_regno;
1447 former_reload_pseudo_spill_p = true;
1449 if (lra_dump_file != NULL)
1450 fprintf (lra_dump_file, " Spill %s r%d(hr=%d, freq=%d)\n",
1451 pseudo_prefix_title (conflict_regno), conflict_regno,
1452 reg_renumber[conflict_regno],
1453 lra_reg_info[conflict_regno].freq);
1454 update_lives (conflict_regno, true);
1455 lra_setup_reg_renumber (conflict_regno, -1, false);
1457 n = nfails;
1459 improve_inheritance (&changed_pseudo_bitmap);
1460 bitmap_clear (&non_reload_pseudos);
1461 bitmap_clear (&changed_insns);
1462 if (! lra_simple_p)
1464 /* We should not assign to original pseudos of inheritance
1465 pseudos or split pseudos if any its inheritance pseudo did
1466 not get hard register or any its split pseudo was not split
1467 because undo inheritance/split pass will extend live range of
1468 such inheritance or split pseudos. */
1469 bitmap_initialize (&do_not_assign_nonreload_pseudos, &reg_obstack);
1470 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, u, bi)
1471 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1472 && reg_renumber[u] < 0
1473 && bitmap_bit_p (&lra_inheritance_pseudos, u))
1474 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1475 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs, 0, u, bi)
1476 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1477 && reg_renumber[u] >= 0)
1478 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1479 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1480 if (((i < lra_constraint_new_regno_start
1481 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos, i))
1482 || (bitmap_bit_p (&lra_inheritance_pseudos, i)
1483 && lra_reg_info[i].restore_regno >= 0)
1484 || (bitmap_bit_p (&lra_split_regs, i)
1485 && lra_reg_info[i].restore_regno >= 0)
1486 || bitmap_bit_p (&lra_subreg_reload_pseudos, i)
1487 || bitmap_bit_p (&lra_optional_reload_pseudos, i))
1488 && reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1489 && regno_allocno_class_array[i] != NO_REGS)
1490 sorted_pseudos[n++] = i;
1491 bitmap_clear (&do_not_assign_nonreload_pseudos);
1492 if (n != 0 && lra_dump_file != NULL)
1493 fprintf (lra_dump_file, " Reassigning non-reload pseudos\n");
1494 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1495 for (i = 0; i < n; i++)
1497 regno = sorted_pseudos[i];
1498 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1499 if (hard_regno >= 0)
1501 assign_hard_regno (hard_regno, regno);
1502 /* We change allocation for non-reload pseudo on this
1503 iteration -- mark the pseudo for invalidation of used
1504 alternatives of insns containing the pseudo. */
1505 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1507 else
1509 enum reg_class rclass = lra_get_allocno_class (regno);
1510 enum reg_class spill_class;
1512 if (targetm.spill_class == NULL
1513 || lra_reg_info[regno].restore_regno < 0
1514 || ! bitmap_bit_p (&lra_inheritance_pseudos, regno)
1515 || (spill_class
1516 = ((enum reg_class)
1517 targetm.spill_class
1518 ((reg_class_t) rclass,
1519 PSEUDO_REGNO_MODE (regno)))) == NO_REGS)
1520 continue;
1521 regno_allocno_class_array[regno] = spill_class;
1522 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1523 if (hard_regno < 0)
1524 regno_allocno_class_array[regno] = rclass;
1525 else
1527 setup_reg_classes
1528 (regno, spill_class, spill_class, spill_class);
1529 assign_hard_regno (hard_regno, regno);
1530 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1535 free (update_hard_regno_preference_check);
1536 bitmap_clear (&best_spill_pseudos_bitmap);
1537 bitmap_clear (&spill_pseudos_bitmap);
1538 bitmap_clear (&insn_conflict_pseudos);
1542 /* Entry function to assign hard registers to new reload pseudos
1543 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1544 of old pseudos) and possibly to the old pseudos. The function adds
1545 what insns to process for the next constraint pass. Those are all
1546 insns who contains non-reload and non-inheritance pseudos with
1547 changed allocation.
1549 Return true if we did not spill any non-reload and non-inheritance
1550 pseudos. */
1551 bool
1552 lra_assign (void)
1554 int i;
1555 unsigned int u;
1556 bitmap_iterator bi;
1557 bitmap_head insns_to_process;
1558 bool no_spills_p;
1559 int max_regno = max_reg_num ();
1561 timevar_push (TV_LRA_ASSIGN);
1562 lra_assignment_iter++;
1563 if (lra_dump_file != NULL)
1564 fprintf (lra_dump_file, "\n********** Assignment #%d: **********\n\n",
1565 lra_assignment_iter);
1566 init_lives ();
1567 sorted_pseudos = XNEWVEC (int, max_regno);
1568 sorted_reload_pseudos = XNEWVEC (int, max_regno);
1569 regno_allocno_class_array = XNEWVEC (enum reg_class, max_regno);
1570 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1571 regno_allocno_class_array[i] = lra_get_allocno_class (i);
1572 former_reload_pseudo_spill_p = false;
1573 init_regno_assign_info ();
1574 bitmap_initialize (&all_spilled_pseudos, &reg_obstack);
1575 create_live_range_start_chains ();
1576 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos);
1577 #ifdef ENABLE_CHECKING
1578 if (!flag_ipa_ra)
1579 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1580 if (lra_reg_info[i].nrefs != 0 && reg_renumber[i] >= 0
1581 && lra_reg_info[i].call_p
1582 && overlaps_hard_reg_set_p (call_used_reg_set,
1583 PSEUDO_REGNO_MODE (i), reg_renumber[i]))
1584 gcc_unreachable ();
1585 #endif
1586 /* Setup insns to process on the next constraint pass. */
1587 bitmap_initialize (&changed_pseudo_bitmap, &reg_obstack);
1588 init_live_reload_and_inheritance_pseudos ();
1589 assign_by_spills ();
1590 finish_live_reload_and_inheritance_pseudos ();
1591 bitmap_ior_into (&changed_pseudo_bitmap, &all_spilled_pseudos);
1592 no_spills_p = true;
1593 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos, 0, u, bi)
1594 /* We ignore spilled pseudos created on last inheritance pass
1595 because they will be removed. */
1596 if (lra_reg_info[u].restore_regno < 0)
1598 no_spills_p = false;
1599 break;
1601 finish_live_range_start_chains ();
1602 bitmap_clear (&all_spilled_pseudos);
1603 bitmap_initialize (&insns_to_process, &reg_obstack);
1604 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap, 0, u, bi)
1605 bitmap_ior_into (&insns_to_process, &lra_reg_info[u].insn_bitmap);
1606 bitmap_clear (&changed_pseudo_bitmap);
1607 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process, 0, u, bi)
1609 lra_push_insn_by_uid (u);
1610 /* Invalidate alternatives for insn should be processed. */
1611 lra_set_used_insn_alternative_by_uid (u, -1);
1613 bitmap_clear (&insns_to_process);
1614 finish_regno_assign_info ();
1615 free (regno_allocno_class_array);
1616 free (sorted_pseudos);
1617 free (sorted_reload_pseudos);
1618 finish_lives ();
1619 timevar_pop (TV_LRA_ASSIGN);
1620 if (former_reload_pseudo_spill_p)
1621 lra_assignment_iter_after_spill++;
1622 if (lra_assignment_iter_after_spill > LRA_MAX_ASSIGNMENT_ITERATION_NUMBER)
1623 internal_error
1624 ("Maximum number of LRA assignment passes is achieved (%d)\n",
1625 LRA_MAX_ASSIGNMENT_ITERATION_NUMBER);
1626 return no_spills_p;