Introduce gimple_call
[official-gcc.git] / gcc / lra-assigns.c
blob7b862a488e6f387a576c3507f07eb7ac207376f4
1 /* Assign reload pseudos.
2 Copyright (C) 2010-2014 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
22 /* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
36 and spill registers.
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
50 copies.
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
64 Only insns with changed allocation pseudos are processed on the
65 next constraint pass.
67 The pseudo live-ranges are used to find conflicting pseudos.
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
75 restore_regno. */
77 #include "config.h"
78 #include "system.h"
79 #include "coretypes.h"
80 #include "tm.h"
81 #include "hard-reg-set.h"
82 #include "rtl.h"
83 #include "rtl-error.h"
84 #include "tm_p.h"
85 #include "target.h"
86 #include "insn-config.h"
87 #include "recog.h"
88 #include "output.h"
89 #include "regs.h"
90 #include "function.h"
91 #include "expr.h"
92 #include "basic-block.h"
93 #include "except.h"
94 #include "df.h"
95 #include "ira.h"
96 #include "sparseset.h"
97 #include "params.h"
98 #include "lra-int.h"
100 /* Array containing corresponding values of function
101 lra_get_allocno_class. It is used to speed up the code. */
102 static enum reg_class *regno_allocno_class_array;
104 /* Information about the thread to which a pseudo belongs. Threads are
105 a set of connected reload and inheritance pseudos with the same set of
106 available hard registers. Lone registers belong to their own threads. */
107 struct regno_assign_info
109 /* First/next pseudo of the same thread. */
110 int first, next;
111 /* Frequency of the thread (execution frequency of only reload
112 pseudos in the thread when the thread contains a reload pseudo).
113 Defined only for the first thread pseudo. */
114 int freq;
117 /* Map regno to the corresponding regno assignment info. */
118 static struct regno_assign_info *regno_assign_info;
120 /* All inherited, subreg or optional pseudos created before last spill
121 sub-pass. Such pseudos are permitted to get memory instead of hard
122 regs. */
123 static bitmap_head non_reload_pseudos;
125 /* Process a pseudo copy with execution frequency COPY_FREQ connecting
126 REGNO1 and REGNO2 to form threads. */
127 static void
128 process_copy_to_form_thread (int regno1, int regno2, int copy_freq)
130 int last, regno1_first, regno2_first;
132 lra_assert (regno1 >= lra_constraint_new_regno_start
133 && regno2 >= lra_constraint_new_regno_start);
134 regno1_first = regno_assign_info[regno1].first;
135 regno2_first = regno_assign_info[regno2].first;
136 if (regno1_first != regno2_first)
138 for (last = regno2_first;
139 regno_assign_info[last].next >= 0;
140 last = regno_assign_info[last].next)
141 regno_assign_info[last].first = regno1_first;
142 regno_assign_info[last].first = regno1_first;
143 regno_assign_info[last].next = regno_assign_info[regno1_first].next;
144 regno_assign_info[regno1_first].next = regno2_first;
145 regno_assign_info[regno1_first].freq
146 += regno_assign_info[regno2_first].freq;
148 regno_assign_info[regno1_first].freq -= 2 * copy_freq;
149 lra_assert (regno_assign_info[regno1_first].freq >= 0);
152 /* Initialize REGNO_ASSIGN_INFO and form threads. */
153 static void
154 init_regno_assign_info (void)
156 int i, regno1, regno2, max_regno = max_reg_num ();
157 lra_copy_t cp;
159 regno_assign_info = XNEWVEC (struct regno_assign_info, max_regno);
160 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
162 regno_assign_info[i].first = i;
163 regno_assign_info[i].next = -1;
164 regno_assign_info[i].freq = lra_reg_info[i].freq;
166 /* Form the threads. */
167 for (i = 0; (cp = lra_get_copy (i)) != NULL; i++)
168 if ((regno1 = cp->regno1) >= lra_constraint_new_regno_start
169 && (regno2 = cp->regno2) >= lra_constraint_new_regno_start
170 && reg_renumber[regno1] < 0 && lra_reg_info[regno1].nrefs != 0
171 && reg_renumber[regno2] < 0 && lra_reg_info[regno2].nrefs != 0
172 && (ira_class_hard_regs_num[regno_allocno_class_array[regno1]]
173 == ira_class_hard_regs_num[regno_allocno_class_array[regno2]]))
174 process_copy_to_form_thread (regno1, regno2, cp->freq);
177 /* Free REGNO_ASSIGN_INFO. */
178 static void
179 finish_regno_assign_info (void)
181 free (regno_assign_info);
184 /* The function is used to sort *reload* and *inheritance* pseudos to
185 try to assign them hard registers. We put pseudos from the same
186 thread always nearby. */
187 static int
188 reload_pseudo_compare_func (const void *v1p, const void *v2p)
190 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
191 enum reg_class cl1 = regno_allocno_class_array[r1];
192 enum reg_class cl2 = regno_allocno_class_array[r2];
193 int diff;
195 lra_assert (r1 >= lra_constraint_new_regno_start
196 && r2 >= lra_constraint_new_regno_start);
198 /* Prefer to assign reload registers with smaller classes first to
199 guarantee assignment to all reload registers. */
200 if ((diff = (ira_class_hard_regs_num[cl1]
201 - ira_class_hard_regs_num[cl2])) != 0)
202 return diff;
203 if ((diff
204 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
205 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0
206 /* The code below executes rarely as nregs == 1 in most cases.
207 So we should not worry about using faster data structures to
208 check reload pseudos. */
209 && ! bitmap_bit_p (&non_reload_pseudos, r1)
210 && ! bitmap_bit_p (&non_reload_pseudos, r2))
211 return diff;
212 if ((diff = (regno_assign_info[regno_assign_info[r2].first].freq
213 - regno_assign_info[regno_assign_info[r1].first].freq)) != 0)
214 return diff;
215 /* Allocate bigger pseudos first to avoid register file
216 fragmentation. */
217 if ((diff
218 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
219 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0)
220 return diff;
221 /* Put pseudos from the thread nearby. */
222 if ((diff = regno_assign_info[r1].first - regno_assign_info[r2].first) != 0)
223 return diff;
224 /* If regs are equally good, sort by their numbers, so that the
225 results of qsort leave nothing to chance. */
226 return r1 - r2;
229 /* The function is used to sort *non-reload* pseudos to try to assign
230 them hard registers. The order calculation is simpler than in the
231 previous function and based on the pseudo frequency usage. */
232 static int
233 pseudo_compare_func (const void *v1p, const void *v2p)
235 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
236 int diff;
238 /* Prefer to assign more frequently used registers first. */
239 if ((diff = lra_reg_info[r2].freq - lra_reg_info[r1].freq) != 0)
240 return diff;
242 /* If regs are equally good, sort by their numbers, so that the
243 results of qsort leave nothing to chance. */
244 return r1 - r2;
247 /* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
248 pseudo live ranges with given start point. We insert only live
249 ranges of pseudos interesting for assignment purposes. They are
250 reload pseudos and pseudos assigned to hard registers. */
251 static lra_live_range_t *start_point_ranges;
253 /* Used as a flag that a live range is not inserted in the start point
254 chain. */
255 static struct lra_live_range not_in_chain_mark;
257 /* Create and set up START_POINT_RANGES. */
258 static void
259 create_live_range_start_chains (void)
261 int i, max_regno;
262 lra_live_range_t r;
264 start_point_ranges = XCNEWVEC (lra_live_range_t, lra_live_max_point);
265 max_regno = max_reg_num ();
266 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
267 if (i >= lra_constraint_new_regno_start || reg_renumber[i] >= 0)
269 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
271 r->start_next = start_point_ranges[r->start];
272 start_point_ranges[r->start] = r;
275 else
277 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
278 r->start_next = &not_in_chain_mark;
282 /* Insert live ranges of pseudo REGNO into start chains if they are
283 not there yet. */
284 static void
285 insert_in_live_range_start_chain (int regno)
287 lra_live_range_t r = lra_reg_info[regno].live_ranges;
289 if (r->start_next != &not_in_chain_mark)
290 return;
291 for (; r != NULL; r = r->next)
293 r->start_next = start_point_ranges[r->start];
294 start_point_ranges[r->start] = r;
298 /* Free START_POINT_RANGES. */
299 static void
300 finish_live_range_start_chains (void)
302 gcc_assert (start_point_ranges != NULL);
303 free (start_point_ranges);
304 start_point_ranges = NULL;
307 /* Map: program point -> bitmap of all pseudos living at the point and
308 assigned to hard registers. */
309 static bitmap_head *live_hard_reg_pseudos;
310 static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack;
312 /* reg_renumber corresponding to pseudos marked in
313 live_hard_reg_pseudos. reg_renumber might be not matched to
314 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
315 live_hard_reg_pseudos. */
316 static int *live_pseudos_reg_renumber;
318 /* Sparseset used to calculate living hard reg pseudos for some program
319 point range. */
320 static sparseset live_range_hard_reg_pseudos;
322 /* Sparseset used to calculate living reload/inheritance pseudos for
323 some program point range. */
324 static sparseset live_range_reload_inheritance_pseudos;
326 /* Allocate and initialize the data about living pseudos at program
327 points. */
328 static void
329 init_lives (void)
331 int i, max_regno = max_reg_num ();
333 live_range_hard_reg_pseudos = sparseset_alloc (max_regno);
334 live_range_reload_inheritance_pseudos = sparseset_alloc (max_regno);
335 live_hard_reg_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
336 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack);
337 for (i = 0; i < lra_live_max_point; i++)
338 bitmap_initialize (&live_hard_reg_pseudos[i],
339 &live_hard_reg_pseudos_bitmap_obstack);
340 live_pseudos_reg_renumber = XNEWVEC (int, max_regno);
341 for (i = 0; i < max_regno; i++)
342 live_pseudos_reg_renumber[i] = -1;
345 /* Free the data about living pseudos at program points. */
346 static void
347 finish_lives (void)
349 sparseset_free (live_range_hard_reg_pseudos);
350 sparseset_free (live_range_reload_inheritance_pseudos);
351 free (live_hard_reg_pseudos);
352 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack);
353 free (live_pseudos_reg_renumber);
356 /* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
357 entries for pseudo REGNO. Assume that the register has been
358 spilled if FREE_P, otherwise assume that it has been assigned
359 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
360 ranges in the start chains when it is assumed to be assigned to a
361 hard register because we use the chains of pseudos assigned to hard
362 registers during allocation. */
363 static void
364 update_lives (int regno, bool free_p)
366 int p;
367 lra_live_range_t r;
369 if (reg_renumber[regno] < 0)
370 return;
371 live_pseudos_reg_renumber[regno] = free_p ? -1 : reg_renumber[regno];
372 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
374 for (p = r->start; p <= r->finish; p++)
375 if (free_p)
376 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
377 else
379 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
380 insert_in_live_range_start_chain (regno);
385 /* Sparseset used to calculate reload pseudos conflicting with a given
386 pseudo when we are trying to find a hard register for the given
387 pseudo. */
388 static sparseset conflict_reload_and_inheritance_pseudos;
390 /* Map: program point -> bitmap of all reload and inheritance pseudos
391 living at the point. */
392 static bitmap_head *live_reload_and_inheritance_pseudos;
393 static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack;
395 /* Allocate and initialize data about living reload pseudos at any
396 given program point. */
397 static void
398 init_live_reload_and_inheritance_pseudos (void)
400 int i, p, max_regno = max_reg_num ();
401 lra_live_range_t r;
403 conflict_reload_and_inheritance_pseudos = sparseset_alloc (max_regno);
404 live_reload_and_inheritance_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
405 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack);
406 for (p = 0; p < lra_live_max_point; p++)
407 bitmap_initialize (&live_reload_and_inheritance_pseudos[p],
408 &live_reload_and_inheritance_pseudos_bitmap_obstack);
409 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
411 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
412 for (p = r->start; p <= r->finish; p++)
413 bitmap_set_bit (&live_reload_and_inheritance_pseudos[p], i);
417 /* Finalize data about living reload pseudos at any given program
418 point. */
419 static void
420 finish_live_reload_and_inheritance_pseudos (void)
422 sparseset_free (conflict_reload_and_inheritance_pseudos);
423 free (live_reload_and_inheritance_pseudos);
424 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack);
427 /* The value used to check that cost of given hard reg is really
428 defined currently. */
429 static int curr_hard_regno_costs_check = 0;
430 /* Array used to check that cost of the corresponding hard reg (the
431 array element index) is really defined currently. */
432 static int hard_regno_costs_check[FIRST_PSEUDO_REGISTER];
433 /* The current costs of allocation of hard regs. Defined only if the
434 value of the corresponding element of the previous array is equal to
435 CURR_HARD_REGNO_COSTS_CHECK. */
436 static int hard_regno_costs[FIRST_PSEUDO_REGISTER];
438 /* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
439 not defined yet. */
440 static inline void
441 adjust_hard_regno_cost (int hard_regno, int incr)
443 if (hard_regno_costs_check[hard_regno] != curr_hard_regno_costs_check)
444 hard_regno_costs[hard_regno] = 0;
445 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
446 hard_regno_costs[hard_regno] += incr;
449 /* Try to find a free hard register for pseudo REGNO. Return the
450 hard register on success and set *COST to the cost of using
451 that register. (If several registers have equal cost, the one with
452 the highest priority wins.) Return -1 on failure.
454 If FIRST_P, return the first available hard reg ignoring other
455 criteria, e.g. allocation cost. This approach results in less hard
456 reg pool fragmentation and permit to allocate hard regs to reload
457 pseudos in complicated situations where pseudo sizes are different.
459 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
460 otherwise consider all hard registers in REGNO's class. */
461 static int
462 find_hard_regno_for (int regno, int *cost, int try_only_hard_regno,
463 bool first_p)
465 HARD_REG_SET conflict_set;
466 int best_cost = INT_MAX, best_priority = INT_MIN, best_usage = INT_MAX;
467 lra_live_range_t r;
468 int p, i, j, rclass_size, best_hard_regno, priority, hard_regno;
469 int hr, conflict_hr, nregs;
470 enum machine_mode biggest_mode;
471 unsigned int k, conflict_regno;
472 int offset, val, biggest_nregs, nregs_diff;
473 enum reg_class rclass;
474 bitmap_iterator bi;
475 bool *rclass_intersect_p;
476 HARD_REG_SET impossible_start_hard_regs, available_regs;
478 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
479 rclass = regno_allocno_class_array[regno];
480 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
481 curr_hard_regno_costs_check++;
482 sparseset_clear (conflict_reload_and_inheritance_pseudos);
483 sparseset_clear (live_range_hard_reg_pseudos);
484 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
485 biggest_mode = lra_reg_info[regno].biggest_mode;
486 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
488 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
489 if (rclass_intersect_p[regno_allocno_class_array[k]])
490 sparseset_set_bit (live_range_hard_reg_pseudos, k);
491 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos[r->start],
492 0, k, bi)
493 if (lra_reg_info[k].preferred_hard_regno1 >= 0
494 && live_pseudos_reg_renumber[k] < 0
495 && rclass_intersect_p[regno_allocno_class_array[k]])
496 sparseset_set_bit (conflict_reload_and_inheritance_pseudos, k);
497 for (p = r->start + 1; p <= r->finish; p++)
499 lra_live_range_t r2;
501 for (r2 = start_point_ranges[p];
502 r2 != NULL;
503 r2 = r2->start_next)
505 if (r2->regno >= lra_constraint_new_regno_start
506 && lra_reg_info[r2->regno].preferred_hard_regno1 >= 0
507 && live_pseudos_reg_renumber[r2->regno] < 0
508 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
509 sparseset_set_bit (conflict_reload_and_inheritance_pseudos,
510 r2->regno);
511 if (live_pseudos_reg_renumber[r2->regno] >= 0
512 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
513 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
517 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno1) >= 0)
519 adjust_hard_regno_cost
520 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit1);
521 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno2) >= 0)
522 adjust_hard_regno_cost
523 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit2);
525 #ifdef STACK_REGS
526 if (lra_reg_info[regno].no_stack_p)
527 for (i = FIRST_STACK_REG; i <= LAST_STACK_REG; i++)
528 SET_HARD_REG_BIT (conflict_set, i);
529 #endif
530 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos, regno);
531 val = lra_reg_info[regno].val;
532 offset = lra_reg_info[regno].offset;
533 CLEAR_HARD_REG_SET (impossible_start_hard_regs);
534 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
535 if (lra_reg_val_equal_p (conflict_regno, val, offset))
537 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
538 nregs = (hard_regno_nregs[conflict_hr]
539 [lra_reg_info[conflict_regno].biggest_mode]);
540 /* Remember about multi-register pseudos. For example, 2 hard
541 register pseudos can start on the same hard register but can
542 not start on HR and HR+1/HR-1. */
543 for (hr = conflict_hr + 1;
544 hr < FIRST_PSEUDO_REGISTER && hr < conflict_hr + nregs;
545 hr++)
546 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
547 for (hr = conflict_hr - 1;
548 hr >= 0 && hr + hard_regno_nregs[hr][biggest_mode] > conflict_hr;
549 hr--)
550 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
552 else
554 add_to_hard_reg_set (&conflict_set,
555 lra_reg_info[conflict_regno].biggest_mode,
556 live_pseudos_reg_renumber[conflict_regno]);
557 if (hard_reg_set_subset_p (reg_class_contents[rclass],
558 conflict_set))
559 return -1;
561 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos,
562 conflict_regno)
563 if (!lra_reg_val_equal_p (conflict_regno, val, offset))
565 lra_assert (live_pseudos_reg_renumber[conflict_regno] < 0);
566 if ((hard_regno
567 = lra_reg_info[conflict_regno].preferred_hard_regno1) >= 0)
569 adjust_hard_regno_cost
570 (hard_regno,
571 lra_reg_info[conflict_regno].preferred_hard_regno_profit1);
572 if ((hard_regno
573 = lra_reg_info[conflict_regno].preferred_hard_regno2) >= 0)
574 adjust_hard_regno_cost
575 (hard_regno,
576 lra_reg_info[conflict_regno].preferred_hard_regno_profit2);
579 /* Make sure that all registers in a multi-word pseudo belong to the
580 required class. */
581 IOR_COMPL_HARD_REG_SET (conflict_set, reg_class_contents[rclass]);
582 lra_assert (rclass != NO_REGS);
583 rclass_size = ira_class_hard_regs_num[rclass];
584 best_hard_regno = -1;
585 hard_regno = ira_class_hard_regs[rclass][0];
586 biggest_nregs = hard_regno_nregs[hard_regno][biggest_mode];
587 nregs_diff = (biggest_nregs
588 - hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)]);
589 COPY_HARD_REG_SET (available_regs, reg_class_contents[rclass]);
590 AND_COMPL_HARD_REG_SET (available_regs, lra_no_alloc_regs);
591 for (i = 0; i < rclass_size; i++)
593 if (try_only_hard_regno >= 0)
594 hard_regno = try_only_hard_regno;
595 else
596 hard_regno = ira_class_hard_regs[rclass][i];
597 if (! overlaps_hard_reg_set_p (conflict_set,
598 PSEUDO_REGNO_MODE (regno), hard_regno)
599 /* We can not use prohibited_class_mode_regs because it is
600 not defined for all classes. */
601 && HARD_REGNO_MODE_OK (hard_regno, PSEUDO_REGNO_MODE (regno))
602 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
603 && (nregs_diff == 0
604 || (WORDS_BIG_ENDIAN
605 ? (hard_regno - nregs_diff >= 0
606 && TEST_HARD_REG_BIT (available_regs,
607 hard_regno - nregs_diff))
608 : TEST_HARD_REG_BIT (available_regs,
609 hard_regno + nregs_diff))))
611 if (hard_regno_costs_check[hard_regno]
612 != curr_hard_regno_costs_check)
614 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
615 hard_regno_costs[hard_regno] = 0;
617 for (j = 0;
618 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
619 j++)
620 if (! TEST_HARD_REG_BIT (call_used_reg_set, hard_regno + j)
621 && ! df_regs_ever_live_p (hard_regno + j))
622 /* It needs save restore. */
623 hard_regno_costs[hard_regno]
624 += (2
625 * REG_FREQ_FROM_BB (ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
626 + 1);
627 priority = targetm.register_priority (hard_regno);
628 if (best_hard_regno < 0 || hard_regno_costs[hard_regno] < best_cost
629 || (hard_regno_costs[hard_regno] == best_cost
630 && (priority > best_priority
631 || (targetm.register_usage_leveling_p ()
632 && priority == best_priority
633 && best_usage > lra_hard_reg_usage[hard_regno]))))
635 best_hard_regno = hard_regno;
636 best_cost = hard_regno_costs[hard_regno];
637 best_priority = priority;
638 best_usage = lra_hard_reg_usage[hard_regno];
641 if (try_only_hard_regno >= 0 || (first_p && best_hard_regno >= 0))
642 break;
644 if (best_hard_regno >= 0)
645 *cost = best_cost - lra_reg_info[regno].freq;
646 return best_hard_regno;
649 /* Current value used for checking elements in
650 update_hard_regno_preference_check. */
651 static int curr_update_hard_regno_preference_check;
652 /* If an element value is equal to the above variable value, then the
653 corresponding regno has been processed for preference
654 propagation. */
655 static int *update_hard_regno_preference_check;
657 /* Update the preference for using HARD_REGNO for pseudos that are
658 connected directly or indirectly with REGNO. Apply divisor DIV
659 to any preference adjustments.
661 The more indirectly a pseudo is connected, the smaller its effect
662 should be. We therefore increase DIV on each "hop". */
663 static void
664 update_hard_regno_preference (int regno, int hard_regno, int div)
666 int another_regno, cost;
667 lra_copy_t cp, next_cp;
669 /* Search depth 5 seems to be enough. */
670 if (div > (1 << 5))
671 return;
672 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
674 if (cp->regno1 == regno)
676 next_cp = cp->regno1_next;
677 another_regno = cp->regno2;
679 else if (cp->regno2 == regno)
681 next_cp = cp->regno2_next;
682 another_regno = cp->regno1;
684 else
685 gcc_unreachable ();
686 if (reg_renumber[another_regno] < 0
687 && (update_hard_regno_preference_check[another_regno]
688 != curr_update_hard_regno_preference_check))
690 update_hard_regno_preference_check[another_regno]
691 = curr_update_hard_regno_preference_check;
692 cost = cp->freq < div ? 1 : cp->freq / div;
693 lra_setup_reload_pseudo_preferenced_hard_reg
694 (another_regno, hard_regno, cost);
695 update_hard_regno_preference (another_regno, hard_regno, div * 2);
700 /* Return prefix title for pseudo REGNO. */
701 static const char *
702 pseudo_prefix_title (int regno)
704 return
705 (regno < lra_constraint_new_regno_start ? ""
706 : bitmap_bit_p (&lra_inheritance_pseudos, regno) ? "inheritance "
707 : bitmap_bit_p (&lra_split_regs, regno) ? "split "
708 : bitmap_bit_p (&lra_optional_reload_pseudos, regno) ? "optional reload "
709 : bitmap_bit_p (&lra_subreg_reload_pseudos, regno) ? "subreg reload "
710 : "reload ");
713 /* Update REG_RENUMBER and other pseudo preferences by assignment of
714 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
715 void
716 lra_setup_reg_renumber (int regno, int hard_regno, bool print_p)
718 int i, hr;
720 /* We can not just reassign hard register. */
721 lra_assert (hard_regno < 0 || reg_renumber[regno] < 0);
722 if ((hr = hard_regno) < 0)
723 hr = reg_renumber[regno];
724 reg_renumber[regno] = hard_regno;
725 lra_assert (hr >= 0);
726 for (i = 0; i < hard_regno_nregs[hr][PSEUDO_REGNO_MODE (regno)]; i++)
727 if (hard_regno < 0)
728 lra_hard_reg_usage[hr + i] -= lra_reg_info[regno].freq;
729 else
730 lra_hard_reg_usage[hr + i] += lra_reg_info[regno].freq;
731 if (print_p && lra_dump_file != NULL)
732 fprintf (lra_dump_file, " Assign %d to %sr%d (freq=%d)\n",
733 reg_renumber[regno], pseudo_prefix_title (regno),
734 regno, lra_reg_info[regno].freq);
735 if (hard_regno >= 0)
737 curr_update_hard_regno_preference_check++;
738 update_hard_regno_preference (regno, hard_regno, 1);
742 /* Pseudos which occur in insns containing a particular pseudo. */
743 static bitmap_head insn_conflict_pseudos;
745 /* Bitmaps used to contain spill pseudos for given pseudo hard regno
746 and best spill pseudos for given pseudo (and best hard regno). */
747 static bitmap_head spill_pseudos_bitmap, best_spill_pseudos_bitmap;
749 /* Current pseudo check for validity of elements in
750 TRY_HARD_REG_PSEUDOS. */
751 static int curr_pseudo_check;
752 /* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
753 static int try_hard_reg_pseudos_check[FIRST_PSEUDO_REGISTER];
754 /* Pseudos who hold given hard register at the considered points. */
755 static bitmap_head try_hard_reg_pseudos[FIRST_PSEUDO_REGISTER];
757 /* Set up try_hard_reg_pseudos for given program point P and class
758 RCLASS. Those are pseudos living at P and assigned to a hard
759 register of RCLASS. In other words, those are pseudos which can be
760 spilled to assign a hard register of RCLASS to a pseudo living at
761 P. */
762 static void
763 setup_try_hard_regno_pseudos (int p, enum reg_class rclass)
765 int i, hard_regno;
766 enum machine_mode mode;
767 unsigned int spill_regno;
768 bitmap_iterator bi;
770 /* Find what pseudos could be spilled. */
771 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[p], 0, spill_regno, bi)
773 mode = PSEUDO_REGNO_MODE (spill_regno);
774 hard_regno = live_pseudos_reg_renumber[spill_regno];
775 if (overlaps_hard_reg_set_p (reg_class_contents[rclass],
776 mode, hard_regno))
778 for (i = hard_regno_nregs[hard_regno][mode] - 1; i >= 0; i--)
780 if (try_hard_reg_pseudos_check[hard_regno + i]
781 != curr_pseudo_check)
783 try_hard_reg_pseudos_check[hard_regno + i]
784 = curr_pseudo_check;
785 bitmap_clear (&try_hard_reg_pseudos[hard_regno + i]);
787 bitmap_set_bit (&try_hard_reg_pseudos[hard_regno + i],
788 spill_regno);
794 /* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
795 assignment means that we might undo the data change. */
796 static void
797 assign_temporarily (int regno, int hard_regno)
799 int p;
800 lra_live_range_t r;
802 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
804 for (p = r->start; p <= r->finish; p++)
805 if (hard_regno < 0)
806 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
807 else
809 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
810 insert_in_live_range_start_chain (regno);
813 live_pseudos_reg_renumber[regno] = hard_regno;
816 /* Array used for sorting reload pseudos for subsequent allocation
817 after spilling some pseudo. */
818 static int *sorted_reload_pseudos;
820 /* Spill some pseudos for a reload pseudo REGNO and return hard
821 register which should be used for pseudo after spilling. The
822 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
823 choose hard register (and pseudos occupying the hard registers and
824 to be spilled), we take into account not only how REGNO will
825 benefit from the spills but also how other reload pseudos not yet
826 assigned to hard registers benefit from the spills too. In very
827 rare cases, the function can fail and return -1.
829 If FIRST_P, return the first available hard reg ignoring other
830 criteria, e.g. allocation cost and cost of spilling non-reload
831 pseudos. This approach results in less hard reg pool fragmentation
832 and permit to allocate hard regs to reload pseudos in complicated
833 situations where pseudo sizes are different. */
834 static int
835 spill_for (int regno, bitmap spilled_pseudo_bitmap, bool first_p)
837 int i, j, n, p, hard_regno, best_hard_regno, cost, best_cost, rclass_size;
838 int reload_hard_regno, reload_cost;
839 enum machine_mode mode;
840 enum reg_class rclass;
841 unsigned int spill_regno, reload_regno, uid;
842 int insn_pseudos_num, best_insn_pseudos_num;
843 lra_live_range_t r;
844 bitmap_iterator bi;
846 rclass = regno_allocno_class_array[regno];
847 lra_assert (reg_renumber[regno] < 0 && rclass != NO_REGS);
848 bitmap_clear (&insn_conflict_pseudos);
849 bitmap_clear (&best_spill_pseudos_bitmap);
850 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
852 struct lra_insn_reg *ir;
854 for (ir = lra_get_insn_regs (uid); ir != NULL; ir = ir->next)
855 if (ir->regno >= FIRST_PSEUDO_REGISTER)
856 bitmap_set_bit (&insn_conflict_pseudos, ir->regno);
858 best_hard_regno = -1;
859 best_cost = INT_MAX;
860 best_insn_pseudos_num = INT_MAX;
861 rclass_size = ira_class_hard_regs_num[rclass];
862 mode = PSEUDO_REGNO_MODE (regno);
863 /* Invalidate try_hard_reg_pseudos elements. */
864 curr_pseudo_check++;
865 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
866 for (p = r->start; p <= r->finish; p++)
867 setup_try_hard_regno_pseudos (p, rclass);
868 for (i = 0; i < rclass_size; i++)
870 hard_regno = ira_class_hard_regs[rclass][i];
871 bitmap_clear (&spill_pseudos_bitmap);
872 for (j = hard_regno_nregs[hard_regno][mode] - 1; j >= 0; j--)
874 if (try_hard_reg_pseudos_check[hard_regno + j] != curr_pseudo_check)
875 continue;
876 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos[hard_regno + j]));
877 bitmap_ior_into (&spill_pseudos_bitmap,
878 &try_hard_reg_pseudos[hard_regno + j]);
880 /* Spill pseudos. */
881 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
882 if ((pic_offset_table_rtx != NULL
883 && spill_regno == REGNO (pic_offset_table_rtx))
884 || ((int) spill_regno >= lra_constraint_new_regno_start
885 && ! bitmap_bit_p (&lra_inheritance_pseudos, spill_regno)
886 && ! bitmap_bit_p (&lra_split_regs, spill_regno)
887 && ! bitmap_bit_p (&lra_subreg_reload_pseudos, spill_regno)
888 && ! bitmap_bit_p (&lra_optional_reload_pseudos, spill_regno)))
889 goto fail;
890 insn_pseudos_num = 0;
891 if (lra_dump_file != NULL)
892 fprintf (lra_dump_file, " Trying %d:", hard_regno);
893 sparseset_clear (live_range_reload_inheritance_pseudos);
894 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
896 if (bitmap_bit_p (&insn_conflict_pseudos, spill_regno))
897 insn_pseudos_num++;
898 for (r = lra_reg_info[spill_regno].live_ranges;
899 r != NULL;
900 r = r->next)
902 for (p = r->start; p <= r->finish; p++)
904 lra_live_range_t r2;
906 for (r2 = start_point_ranges[p];
907 r2 != NULL;
908 r2 = r2->start_next)
909 if (r2->regno >= lra_constraint_new_regno_start)
910 sparseset_set_bit (live_range_reload_inheritance_pseudos,
911 r2->regno);
915 n = 0;
916 if (sparseset_cardinality (live_range_reload_inheritance_pseudos)
917 <= (unsigned)LRA_MAX_CONSIDERED_RELOAD_PSEUDOS)
918 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos,
919 reload_regno)
920 if ((int) reload_regno != regno
921 && (ira_reg_classes_intersect_p
922 [rclass][regno_allocno_class_array[reload_regno]])
923 && live_pseudos_reg_renumber[reload_regno] < 0
924 && find_hard_regno_for (reload_regno, &cost, -1, first_p) < 0)
925 sorted_reload_pseudos[n++] = reload_regno;
926 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
928 update_lives (spill_regno, true);
929 if (lra_dump_file != NULL)
930 fprintf (lra_dump_file, " spill %d(freq=%d)",
931 spill_regno, lra_reg_info[spill_regno].freq);
933 hard_regno = find_hard_regno_for (regno, &cost, -1, first_p);
934 if (hard_regno >= 0)
936 assign_temporarily (regno, hard_regno);
937 qsort (sorted_reload_pseudos, n, sizeof (int),
938 reload_pseudo_compare_func);
939 for (j = 0; j < n; j++)
941 reload_regno = sorted_reload_pseudos[j];
942 lra_assert (live_pseudos_reg_renumber[reload_regno] < 0);
943 if ((reload_hard_regno
944 = find_hard_regno_for (reload_regno,
945 &reload_cost, -1, first_p)) >= 0)
947 if (lra_dump_file != NULL)
948 fprintf (lra_dump_file, " assign %d(cost=%d)",
949 reload_regno, reload_cost);
950 assign_temporarily (reload_regno, reload_hard_regno);
951 cost += reload_cost;
954 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
956 rtx_insn_list *x;
958 cost += lra_reg_info[spill_regno].freq;
959 if (ira_reg_equiv[spill_regno].memory != NULL
960 || ira_reg_equiv[spill_regno].constant != NULL)
961 for (x = ira_reg_equiv[spill_regno].init_insns;
962 x != NULL;
963 x = x->next ())
964 cost -= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (x->insn ()));
966 if (best_insn_pseudos_num > insn_pseudos_num
967 || (best_insn_pseudos_num == insn_pseudos_num
968 && best_cost > cost))
970 best_insn_pseudos_num = insn_pseudos_num;
971 best_cost = cost;
972 best_hard_regno = hard_regno;
973 bitmap_copy (&best_spill_pseudos_bitmap, &spill_pseudos_bitmap);
974 if (lra_dump_file != NULL)
975 fprintf (lra_dump_file, " Now best %d(cost=%d)\n",
976 hard_regno, cost);
978 assign_temporarily (regno, -1);
979 for (j = 0; j < n; j++)
981 reload_regno = sorted_reload_pseudos[j];
982 if (live_pseudos_reg_renumber[reload_regno] >= 0)
983 assign_temporarily (reload_regno, -1);
986 if (lra_dump_file != NULL)
987 fprintf (lra_dump_file, "\n");
988 /* Restore the live hard reg pseudo info for spilled pseudos. */
989 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
990 update_lives (spill_regno, false);
991 fail:
994 /* Spill: */
995 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap, 0, spill_regno, bi)
997 if (lra_dump_file != NULL)
998 fprintf (lra_dump_file, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
999 pseudo_prefix_title (spill_regno),
1000 spill_regno, reg_renumber[spill_regno],
1001 lra_reg_info[spill_regno].freq, regno);
1002 update_lives (spill_regno, true);
1003 lra_setup_reg_renumber (spill_regno, -1, false);
1005 bitmap_ior_into (spilled_pseudo_bitmap, &best_spill_pseudos_bitmap);
1006 return best_hard_regno;
1009 /* Assign HARD_REGNO to REGNO. */
1010 static void
1011 assign_hard_regno (int hard_regno, int regno)
1013 int i;
1015 lra_assert (hard_regno >= 0);
1016 lra_setup_reg_renumber (regno, hard_regno, true);
1017 update_lives (regno, false);
1018 for (i = 0;
1019 i < hard_regno_nregs[hard_regno][lra_reg_info[regno].biggest_mode];
1020 i++)
1021 df_set_regs_ever_live (hard_regno + i, true);
1024 /* Array used for sorting different pseudos. */
1025 static int *sorted_pseudos;
1027 /* The constraints pass is allowed to create equivalences between
1028 pseudos that make the current allocation "incorrect" (in the sense
1029 that pseudos are assigned to hard registers from their own conflict
1030 sets). The global variable lra_risky_transformations_p says
1031 whether this might have happened.
1033 Process pseudos assigned to hard registers (less frequently used
1034 first), spill if a conflict is found, and mark the spilled pseudos
1035 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1036 pseudos, assigned to hard registers. */
1037 static void
1038 setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1039 spilled_pseudo_bitmap)
1041 int p, i, j, n, regno, hard_regno;
1042 unsigned int k, conflict_regno;
1043 int val, offset;
1044 HARD_REG_SET conflict_set;
1045 enum machine_mode mode;
1046 lra_live_range_t r;
1047 bitmap_iterator bi;
1048 int max_regno = max_reg_num ();
1050 if (! lra_risky_transformations_p)
1052 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1053 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1054 update_lives (i, false);
1055 return;
1057 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1058 if ((pic_offset_table_rtx == NULL_RTX
1059 || i != (int) REGNO (pic_offset_table_rtx))
1060 && reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1061 sorted_pseudos[n++] = i;
1062 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1063 if (pic_offset_table_rtx != NULL_RTX
1064 && (regno = REGNO (pic_offset_table_rtx)) >= FIRST_PSEUDO_REGISTER
1065 && reg_renumber[regno] >= 0 && lra_reg_info[regno].nrefs > 0)
1066 sorted_pseudos[n++] = regno;
1067 for (i = n - 1; i >= 0; i--)
1069 regno = sorted_pseudos[i];
1070 hard_regno = reg_renumber[regno];
1071 lra_assert (hard_regno >= 0);
1072 mode = lra_reg_info[regno].biggest_mode;
1073 sparseset_clear (live_range_hard_reg_pseudos);
1074 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1076 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1077 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1078 for (p = r->start + 1; p <= r->finish; p++)
1080 lra_live_range_t r2;
1082 for (r2 = start_point_ranges[p];
1083 r2 != NULL;
1084 r2 = r2->start_next)
1085 if (live_pseudos_reg_renumber[r2->regno] >= 0)
1086 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1089 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
1090 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
1091 val = lra_reg_info[regno].val;
1092 offset = lra_reg_info[regno].offset;
1093 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1094 if (!lra_reg_val_equal_p (conflict_regno, val, offset)
1095 /* If it is multi-register pseudos they should start on
1096 the same hard register. */
1097 || hard_regno != reg_renumber[conflict_regno])
1098 add_to_hard_reg_set (&conflict_set,
1099 lra_reg_info[conflict_regno].biggest_mode,
1100 reg_renumber[conflict_regno]);
1101 if (! overlaps_hard_reg_set_p (conflict_set, mode, hard_regno))
1103 update_lives (regno, false);
1104 continue;
1106 bitmap_set_bit (spilled_pseudo_bitmap, regno);
1107 for (j = 0;
1108 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
1109 j++)
1110 lra_hard_reg_usage[hard_regno + j] -= lra_reg_info[regno].freq;
1111 reg_renumber[regno] = -1;
1112 if (lra_dump_file != NULL)
1113 fprintf (lra_dump_file, " Spill r%d after risky transformations\n",
1114 regno);
1118 /* Improve allocation by assigning the same hard regno of inheritance
1119 pseudos to the connected pseudos. We need this because inheritance
1120 pseudos are allocated after reload pseudos in the thread and when
1121 we assign a hard register to a reload pseudo we don't know yet that
1122 the connected inheritance pseudos can get the same hard register.
1123 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1124 static void
1125 improve_inheritance (bitmap changed_pseudos)
1127 unsigned int k;
1128 int regno, another_regno, hard_regno, another_hard_regno, cost, i, n;
1129 lra_copy_t cp, next_cp;
1130 bitmap_iterator bi;
1132 if (lra_inheritance_iter > LRA_MAX_INHERITANCE_PASSES)
1133 return;
1134 n = 0;
1135 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, k, bi)
1136 if (reg_renumber[k] >= 0 && lra_reg_info[k].nrefs != 0)
1137 sorted_pseudos[n++] = k;
1138 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1139 for (i = 0; i < n; i++)
1141 regno = sorted_pseudos[i];
1142 hard_regno = reg_renumber[regno];
1143 lra_assert (hard_regno >= 0);
1144 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
1146 if (cp->regno1 == regno)
1148 next_cp = cp->regno1_next;
1149 another_regno = cp->regno2;
1151 else if (cp->regno2 == regno)
1153 next_cp = cp->regno2_next;
1154 another_regno = cp->regno1;
1156 else
1157 gcc_unreachable ();
1158 /* Don't change reload pseudo allocation. It might have
1159 this allocation for a purpose and changing it can result
1160 in LRA cycling. */
1161 if ((another_regno < lra_constraint_new_regno_start
1162 || bitmap_bit_p (&lra_inheritance_pseudos, another_regno))
1163 && (another_hard_regno = reg_renumber[another_regno]) >= 0
1164 && another_hard_regno != hard_regno)
1166 if (lra_dump_file != NULL)
1167 fprintf
1168 (lra_dump_file,
1169 " Improving inheritance for %d(%d) and %d(%d)...\n",
1170 regno, hard_regno, another_regno, another_hard_regno);
1171 update_lives (another_regno, true);
1172 lra_setup_reg_renumber (another_regno, -1, false);
1173 if (hard_regno == find_hard_regno_for (another_regno, &cost,
1174 hard_regno, false))
1175 assign_hard_regno (hard_regno, another_regno);
1176 else
1177 assign_hard_regno (another_hard_regno, another_regno);
1178 bitmap_set_bit (changed_pseudos, another_regno);
1185 /* Bitmap finally containing all pseudos spilled on this assignment
1186 pass. */
1187 static bitmap_head all_spilled_pseudos;
1188 /* All pseudos whose allocation was changed. */
1189 static bitmap_head changed_pseudo_bitmap;
1192 /* Add to LIVE_RANGE_HARD_REG_PSEUDOS all pseudos conflicting with
1193 REGNO and whose hard regs can be assigned to REGNO. */
1194 static void
1195 find_all_spills_for (int regno)
1197 int p;
1198 lra_live_range_t r;
1199 unsigned int k;
1200 bitmap_iterator bi;
1201 enum reg_class rclass;
1202 bool *rclass_intersect_p;
1204 rclass = regno_allocno_class_array[regno];
1205 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
1206 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1208 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1209 if (rclass_intersect_p[regno_allocno_class_array[k]])
1210 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1211 for (p = r->start + 1; p <= r->finish; p++)
1213 lra_live_range_t r2;
1215 for (r2 = start_point_ranges[p];
1216 r2 != NULL;
1217 r2 = r2->start_next)
1219 if (live_pseudos_reg_renumber[r2->regno] >= 0
1220 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
1221 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1227 /* Assign hard registers to reload pseudos and other pseudos. */
1228 static void
1229 assign_by_spills (void)
1231 int i, n, nfails, iter, regno, hard_regno, cost, restore_regno;
1232 rtx_insn *insn;
1233 bitmap_head changed_insns, do_not_assign_nonreload_pseudos;
1234 unsigned int u, conflict_regno;
1235 bitmap_iterator bi;
1236 bool reload_p;
1237 int max_regno = max_reg_num ();
1239 for (n = 0, i = lra_constraint_new_regno_start; i < max_regno; i++)
1240 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1241 && regno_allocno_class_array[i] != NO_REGS)
1242 sorted_pseudos[n++] = i;
1243 bitmap_initialize (&insn_conflict_pseudos, &reg_obstack);
1244 bitmap_initialize (&spill_pseudos_bitmap, &reg_obstack);
1245 bitmap_initialize (&best_spill_pseudos_bitmap, &reg_obstack);
1246 update_hard_regno_preference_check = XCNEWVEC (int, max_regno);
1247 curr_update_hard_regno_preference_check = 0;
1248 memset (try_hard_reg_pseudos_check, 0, sizeof (try_hard_reg_pseudos_check));
1249 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1250 bitmap_initialize (&try_hard_reg_pseudos[i], &reg_obstack);
1251 curr_pseudo_check = 0;
1252 bitmap_initialize (&changed_insns, &reg_obstack);
1253 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1254 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
1255 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
1256 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
1257 for (iter = 0; iter <= 1; iter++)
1259 qsort (sorted_pseudos, n, sizeof (int), reload_pseudo_compare_func);
1260 nfails = 0;
1261 for (i = 0; i < n; i++)
1263 regno = sorted_pseudos[i];
1264 if (lra_dump_file != NULL)
1265 fprintf (lra_dump_file, " Assigning to %d "
1266 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1267 regno, reg_class_names[regno_allocno_class_array[regno]],
1268 ORIGINAL_REGNO (regno_reg_rtx[regno]),
1269 lra_reg_info[regno].freq, regno_assign_info[regno].first,
1270 regno_assign_info[regno_assign_info[regno].first].freq);
1271 hard_regno = find_hard_regno_for (regno, &cost, -1, iter == 1);
1272 reload_p = ! bitmap_bit_p (&non_reload_pseudos, regno);
1273 if (hard_regno < 0 && reload_p)
1274 hard_regno = spill_for (regno, &all_spilled_pseudos, iter == 1);
1275 if (hard_regno < 0)
1277 if (reload_p)
1278 sorted_pseudos[nfails++] = regno;
1280 else
1282 /* This register might have been spilled by the previous
1283 pass. Indicate that it is no longer spilled. */
1284 bitmap_clear_bit (&all_spilled_pseudos, regno);
1285 assign_hard_regno (hard_regno, regno);
1286 if (! reload_p)
1287 /* As non-reload pseudo assignment is changed we
1288 should reconsider insns referring for the
1289 pseudo. */
1290 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1293 if (nfails == 0)
1294 break;
1295 if (iter > 0)
1297 /* We did not assign hard regs to reload pseudos after two iterations.
1298 Either it's an asm and something is wrong with the constraints, or
1299 we have run out of spill registers; error out in either case. */
1300 bool asm_p = false;
1301 bitmap_head failed_reload_insns;
1303 bitmap_initialize (&failed_reload_insns, &reg_obstack);
1304 for (i = 0; i < nfails; i++)
1306 regno = sorted_pseudos[i];
1307 bitmap_ior_into (&failed_reload_insns,
1308 &lra_reg_info[regno].insn_bitmap);
1309 /* Assign an arbitrary hard register of regno class to
1310 avoid further trouble with this insn. */
1311 bitmap_clear_bit (&all_spilled_pseudos, regno);
1312 assign_hard_regno
1313 (ira_class_hard_regs[regno_allocno_class_array[regno]][0],
1314 regno);
1316 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns, 0, u, bi)
1318 insn = lra_insn_recog_data[u]->insn;
1319 if (asm_noperands (PATTERN (insn)) >= 0)
1321 asm_p = true;
1322 error_for_asm (insn,
1323 "%<asm%> operand has impossible constraints");
1324 /* Avoid further trouble with this insn.
1325 For asm goto, instead of fixing up all the edges
1326 just clear the template and clear input operands
1327 (asm goto doesn't have any output operands). */
1328 if (JUMP_P (insn))
1330 rtx asm_op = extract_asm_operands (PATTERN (insn));
1331 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1332 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1333 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1334 lra_update_insn_regno_info (insn);
1336 else
1338 PATTERN (insn) = gen_rtx_USE (VOIDmode, const0_rtx);
1339 lra_set_insn_deleted (insn);
1342 else if (!asm_p)
1344 error ("unable to find a register to spill");
1345 fatal_insn ("this is the insn:", insn);
1348 break;
1350 /* This is a very rare event. We can not assign a hard register
1351 to reload pseudo because the hard register was assigned to
1352 another reload pseudo on a previous assignment pass. For x86
1353 example, on the 1st pass we assigned CX (although another
1354 hard register could be used for this) to reload pseudo in an
1355 insn, on the 2nd pass we need CX (and only this) hard
1356 register for a new reload pseudo in the same insn. Another
1357 possible situation may occur in assigning to multi-regs
1358 reload pseudos when hard regs pool is too fragmented even
1359 after spilling non-reload pseudos.
1361 We should do something radical here to succeed. Here we
1362 spill *all* conflicting pseudos and reassign them. */
1363 if (lra_dump_file != NULL)
1364 fprintf (lra_dump_file, " 2nd iter for reload pseudo assignments:\n");
1365 sparseset_clear (live_range_hard_reg_pseudos);
1366 for (i = 0; i < nfails; i++)
1368 if (lra_dump_file != NULL)
1369 fprintf (lra_dump_file, " Reload r%d assignment failure\n",
1370 sorted_pseudos[i]);
1371 find_all_spills_for (sorted_pseudos[i]);
1373 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1375 if ((int) conflict_regno >= lra_constraint_new_regno_start)
1376 sorted_pseudos[nfails++] = conflict_regno;
1377 if (lra_dump_file != NULL)
1378 fprintf (lra_dump_file, " Spill %s r%d(hr=%d, freq=%d)\n",
1379 pseudo_prefix_title (conflict_regno), conflict_regno,
1380 reg_renumber[conflict_regno],
1381 lra_reg_info[conflict_regno].freq);
1382 update_lives (conflict_regno, true);
1383 lra_setup_reg_renumber (conflict_regno, -1, false);
1385 n = nfails;
1387 improve_inheritance (&changed_pseudo_bitmap);
1388 bitmap_clear (&non_reload_pseudos);
1389 bitmap_clear (&changed_insns);
1390 if (! lra_simple_p)
1392 /* We should not assign to original pseudos of inheritance
1393 pseudos or split pseudos if any its inheritance pseudo did
1394 not get hard register or any its split pseudo was not split
1395 because undo inheritance/split pass will extend live range of
1396 such inheritance or split pseudos. */
1397 bitmap_initialize (&do_not_assign_nonreload_pseudos, &reg_obstack);
1398 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, u, bi)
1399 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1400 && reg_renumber[u] < 0
1401 && bitmap_bit_p (&lra_inheritance_pseudos, u))
1402 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1403 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs, 0, u, bi)
1404 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1405 && reg_renumber[u] >= 0)
1406 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1407 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1408 if (((i < lra_constraint_new_regno_start
1409 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos, i))
1410 || (bitmap_bit_p (&lra_inheritance_pseudos, i)
1411 && lra_reg_info[i].restore_regno >= 0)
1412 || (bitmap_bit_p (&lra_split_regs, i)
1413 && lra_reg_info[i].restore_regno >= 0)
1414 || bitmap_bit_p (&lra_subreg_reload_pseudos, i)
1415 || bitmap_bit_p (&lra_optional_reload_pseudos, i))
1416 && reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1417 && regno_allocno_class_array[i] != NO_REGS)
1418 sorted_pseudos[n++] = i;
1419 bitmap_clear (&do_not_assign_nonreload_pseudos);
1420 if (n != 0 && lra_dump_file != NULL)
1421 fprintf (lra_dump_file, " Reassigning non-reload pseudos\n");
1422 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1423 for (i = 0; i < n; i++)
1425 regno = sorted_pseudos[i];
1426 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1427 if (hard_regno >= 0)
1429 assign_hard_regno (hard_regno, regno);
1430 /* We change allocation for non-reload pseudo on this
1431 iteration -- mark the pseudo for invalidation of used
1432 alternatives of insns containing the pseudo. */
1433 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1435 else
1437 enum reg_class rclass = lra_get_allocno_class (regno);
1438 enum reg_class spill_class;
1440 if (targetm.spill_class == NULL
1441 || lra_reg_info[regno].restore_regno < 0
1442 || ! bitmap_bit_p (&lra_inheritance_pseudos, regno)
1443 || (spill_class
1444 = ((enum reg_class)
1445 targetm.spill_class
1446 ((reg_class_t) rclass,
1447 PSEUDO_REGNO_MODE (regno)))) == NO_REGS)
1448 continue;
1449 regno_allocno_class_array[regno] = spill_class;
1450 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1451 if (hard_regno < 0)
1452 regno_allocno_class_array[regno] = rclass;
1453 else
1455 setup_reg_classes
1456 (regno, spill_class, spill_class, spill_class);
1457 assign_hard_regno (hard_regno, regno);
1458 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1463 free (update_hard_regno_preference_check);
1464 bitmap_clear (&best_spill_pseudos_bitmap);
1465 bitmap_clear (&spill_pseudos_bitmap);
1466 bitmap_clear (&insn_conflict_pseudos);
1470 /* Entry function to assign hard registers to new reload pseudos
1471 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1472 of old pseudos) and possibly to the old pseudos. The function adds
1473 what insns to process for the next constraint pass. Those are all
1474 insns who contains non-reload and non-inheritance pseudos with
1475 changed allocation.
1477 Return true if we did not spill any non-reload and non-inheritance
1478 pseudos. */
1479 bool
1480 lra_assign (void)
1482 int i;
1483 unsigned int u;
1484 bitmap_iterator bi;
1485 bitmap_head insns_to_process;
1486 bool no_spills_p;
1487 int max_regno = max_reg_num ();
1489 timevar_push (TV_LRA_ASSIGN);
1490 init_lives ();
1491 sorted_pseudos = XNEWVEC (int, max_regno);
1492 sorted_reload_pseudos = XNEWVEC (int, max_regno);
1493 regno_allocno_class_array = XNEWVEC (enum reg_class, max_regno);
1494 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1495 regno_allocno_class_array[i] = lra_get_allocno_class (i);
1496 init_regno_assign_info ();
1497 bitmap_initialize (&all_spilled_pseudos, &reg_obstack);
1498 create_live_range_start_chains ();
1499 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos);
1500 #ifdef ENABLE_CHECKING
1501 if (!flag_use_caller_save)
1502 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1503 if (lra_reg_info[i].nrefs != 0 && reg_renumber[i] >= 0
1504 && lra_reg_info[i].call_p
1505 && overlaps_hard_reg_set_p (call_used_reg_set,
1506 PSEUDO_REGNO_MODE (i), reg_renumber[i]))
1507 gcc_unreachable ();
1508 #endif
1509 /* Setup insns to process on the next constraint pass. */
1510 bitmap_initialize (&changed_pseudo_bitmap, &reg_obstack);
1511 init_live_reload_and_inheritance_pseudos ();
1512 assign_by_spills ();
1513 finish_live_reload_and_inheritance_pseudos ();
1514 bitmap_ior_into (&changed_pseudo_bitmap, &all_spilled_pseudos);
1515 no_spills_p = true;
1516 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos, 0, u, bi)
1517 /* We ignore spilled pseudos created on last inheritance pass
1518 because they will be removed. */
1519 if (lra_reg_info[u].restore_regno < 0)
1521 no_spills_p = false;
1522 break;
1524 finish_live_range_start_chains ();
1525 bitmap_clear (&all_spilled_pseudos);
1526 bitmap_initialize (&insns_to_process, &reg_obstack);
1527 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap, 0, u, bi)
1528 bitmap_ior_into (&insns_to_process, &lra_reg_info[u].insn_bitmap);
1529 bitmap_clear (&changed_pseudo_bitmap);
1530 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process, 0, u, bi)
1532 lra_push_insn_by_uid (u);
1533 /* Invalidate alternatives for insn should be processed. */
1534 lra_set_used_insn_alternative_by_uid (u, -1);
1536 bitmap_clear (&insns_to_process);
1537 finish_regno_assign_info ();
1538 free (regno_allocno_class_array);
1539 free (sorted_pseudos);
1540 free (sorted_reload_pseudos);
1541 finish_lives ();
1542 timevar_pop (TV_LRA_ASSIGN);
1543 return no_spills_p;