* config/msp430/msp430.c (msp430_asm_integer): Support addition
[official-gcc.git] / gcc / lra-assigns.c
blob0ad91d06fd531493053a31a2ffcd83c506a9614d
1 /* Assign reload pseudos.
2 Copyright (C) 2010-2015 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
22 /* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
36 and spill registers.
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
50 copies.
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
64 Only insns with changed allocation pseudos are processed on the
65 next constraint pass.
67 The pseudo live-ranges are used to find conflicting pseudos.
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
75 restore_regno. */
77 #include "config.h"
78 #include "system.h"
79 #include "coretypes.h"
80 #include "tm.h"
81 #include "hard-reg-set.h"
82 #include "rtl.h"
83 #include "rtl-error.h"
84 #include "tm_p.h"
85 #include "target.h"
86 #include "insn-config.h"
87 #include "recog.h"
88 #include "output.h"
89 #include "regs.h"
90 #include "hashtab.h"
91 #include "hash-set.h"
92 #include "vec.h"
93 #include "input.h"
94 #include "function.h"
95 #include "symtab.h"
96 #include "flags.h"
97 #include "statistics.h"
98 #include "alias.h"
99 #include "inchash.h"
100 #include "tree.h"
101 #include "expmed.h"
102 #include "dojump.h"
103 #include "explow.h"
104 #include "calls.h"
105 #include "emit-rtl.h"
106 #include "varasm.h"
107 #include "stmt.h"
108 #include "expr.h"
109 #include "predict.h"
110 #include "dominance.h"
111 #include "cfg.h"
112 #include "basic-block.h"
113 #include "except.h"
114 #include "df.h"
115 #include "ira.h"
116 #include "sparseset.h"
117 #include "params.h"
118 #include "lra-int.h"
120 /* Current iteration number of the pass and current iteration number
121 of the pass after the latest spill pass when any former reload
122 pseudo was spilled. */
123 int lra_assignment_iter;
124 int lra_assignment_iter_after_spill;
126 /* Flag of spilling former reload pseudos on this pass. */
127 static bool former_reload_pseudo_spill_p;
129 /* Array containing corresponding values of function
130 lra_get_allocno_class. It is used to speed up the code. */
131 static enum reg_class *regno_allocno_class_array;
133 /* Information about the thread to which a pseudo belongs. Threads are
134 a set of connected reload and inheritance pseudos with the same set of
135 available hard registers. Lone registers belong to their own threads. */
136 struct regno_assign_info
138 /* First/next pseudo of the same thread. */
139 int first, next;
140 /* Frequency of the thread (execution frequency of only reload
141 pseudos in the thread when the thread contains a reload pseudo).
142 Defined only for the first thread pseudo. */
143 int freq;
146 /* Map regno to the corresponding regno assignment info. */
147 static struct regno_assign_info *regno_assign_info;
149 /* All inherited, subreg or optional pseudos created before last spill
150 sub-pass. Such pseudos are permitted to get memory instead of hard
151 regs. */
152 static bitmap_head non_reload_pseudos;
154 /* Process a pseudo copy with execution frequency COPY_FREQ connecting
155 REGNO1 and REGNO2 to form threads. */
156 static void
157 process_copy_to_form_thread (int regno1, int regno2, int copy_freq)
159 int last, regno1_first, regno2_first;
161 lra_assert (regno1 >= lra_constraint_new_regno_start
162 && regno2 >= lra_constraint_new_regno_start);
163 regno1_first = regno_assign_info[regno1].first;
164 regno2_first = regno_assign_info[regno2].first;
165 if (regno1_first != regno2_first)
167 for (last = regno2_first;
168 regno_assign_info[last].next >= 0;
169 last = regno_assign_info[last].next)
170 regno_assign_info[last].first = regno1_first;
171 regno_assign_info[last].first = regno1_first;
172 regno_assign_info[last].next = regno_assign_info[regno1_first].next;
173 regno_assign_info[regno1_first].next = regno2_first;
174 regno_assign_info[regno1_first].freq
175 += regno_assign_info[regno2_first].freq;
177 regno_assign_info[regno1_first].freq -= 2 * copy_freq;
178 lra_assert (regno_assign_info[regno1_first].freq >= 0);
181 /* Initialize REGNO_ASSIGN_INFO and form threads. */
182 static void
183 init_regno_assign_info (void)
185 int i, regno1, regno2, max_regno = max_reg_num ();
186 lra_copy_t cp;
188 regno_assign_info = XNEWVEC (struct regno_assign_info, max_regno);
189 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
191 regno_assign_info[i].first = i;
192 regno_assign_info[i].next = -1;
193 regno_assign_info[i].freq = lra_reg_info[i].freq;
195 /* Form the threads. */
196 for (i = 0; (cp = lra_get_copy (i)) != NULL; i++)
197 if ((regno1 = cp->regno1) >= lra_constraint_new_regno_start
198 && (regno2 = cp->regno2) >= lra_constraint_new_regno_start
199 && reg_renumber[regno1] < 0 && lra_reg_info[regno1].nrefs != 0
200 && reg_renumber[regno2] < 0 && lra_reg_info[regno2].nrefs != 0
201 && (ira_class_hard_regs_num[regno_allocno_class_array[regno1]]
202 == ira_class_hard_regs_num[regno_allocno_class_array[regno2]]))
203 process_copy_to_form_thread (regno1, regno2, cp->freq);
206 /* Free REGNO_ASSIGN_INFO. */
207 static void
208 finish_regno_assign_info (void)
210 free (regno_assign_info);
213 /* The function is used to sort *reload* and *inheritance* pseudos to
214 try to assign them hard registers. We put pseudos from the same
215 thread always nearby. */
216 static int
217 reload_pseudo_compare_func (const void *v1p, const void *v2p)
219 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
220 enum reg_class cl1 = regno_allocno_class_array[r1];
221 enum reg_class cl2 = regno_allocno_class_array[r2];
222 int diff;
224 lra_assert (r1 >= lra_constraint_new_regno_start
225 && r2 >= lra_constraint_new_regno_start);
227 /* Prefer to assign reload registers with smaller classes first to
228 guarantee assignment to all reload registers. */
229 if ((diff = (ira_class_hard_regs_num[cl1]
230 - ira_class_hard_regs_num[cl2])) != 0)
231 return diff;
232 if ((diff
233 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
234 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0
235 /* The code below executes rarely as nregs == 1 in most cases.
236 So we should not worry about using faster data structures to
237 check reload pseudos. */
238 && ! bitmap_bit_p (&non_reload_pseudos, r1)
239 && ! bitmap_bit_p (&non_reload_pseudos, r2))
240 return diff;
241 if ((diff = (regno_assign_info[regno_assign_info[r2].first].freq
242 - regno_assign_info[regno_assign_info[r1].first].freq)) != 0)
243 return diff;
244 /* Allocate bigger pseudos first to avoid register file
245 fragmentation. */
246 if ((diff
247 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
248 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0)
249 return diff;
250 /* Put pseudos from the thread nearby. */
251 if ((diff = regno_assign_info[r1].first - regno_assign_info[r2].first) != 0)
252 return diff;
253 /* If regs are equally good, sort by their numbers, so that the
254 results of qsort leave nothing to chance. */
255 return r1 - r2;
258 /* The function is used to sort *non-reload* pseudos to try to assign
259 them hard registers. The order calculation is simpler than in the
260 previous function and based on the pseudo frequency usage. */
261 static int
262 pseudo_compare_func (const void *v1p, const void *v2p)
264 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
265 int diff;
267 /* Prefer to assign more frequently used registers first. */
268 if ((diff = lra_reg_info[r2].freq - lra_reg_info[r1].freq) != 0)
269 return diff;
271 /* If regs are equally good, sort by their numbers, so that the
272 results of qsort leave nothing to chance. */
273 return r1 - r2;
276 /* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
277 pseudo live ranges with given start point. We insert only live
278 ranges of pseudos interesting for assignment purposes. They are
279 reload pseudos and pseudos assigned to hard registers. */
280 static lra_live_range_t *start_point_ranges;
282 /* Used as a flag that a live range is not inserted in the start point
283 chain. */
284 static struct lra_live_range not_in_chain_mark;
286 /* Create and set up START_POINT_RANGES. */
287 static void
288 create_live_range_start_chains (void)
290 int i, max_regno;
291 lra_live_range_t r;
293 start_point_ranges = XCNEWVEC (lra_live_range_t, lra_live_max_point);
294 max_regno = max_reg_num ();
295 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
296 if (i >= lra_constraint_new_regno_start || reg_renumber[i] >= 0)
298 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
300 r->start_next = start_point_ranges[r->start];
301 start_point_ranges[r->start] = r;
304 else
306 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
307 r->start_next = &not_in_chain_mark;
311 /* Insert live ranges of pseudo REGNO into start chains if they are
312 not there yet. */
313 static void
314 insert_in_live_range_start_chain (int regno)
316 lra_live_range_t r = lra_reg_info[regno].live_ranges;
318 if (r->start_next != &not_in_chain_mark)
319 return;
320 for (; r != NULL; r = r->next)
322 r->start_next = start_point_ranges[r->start];
323 start_point_ranges[r->start] = r;
327 /* Free START_POINT_RANGES. */
328 static void
329 finish_live_range_start_chains (void)
331 gcc_assert (start_point_ranges != NULL);
332 free (start_point_ranges);
333 start_point_ranges = NULL;
336 /* Map: program point -> bitmap of all pseudos living at the point and
337 assigned to hard registers. */
338 static bitmap_head *live_hard_reg_pseudos;
339 static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack;
341 /* reg_renumber corresponding to pseudos marked in
342 live_hard_reg_pseudos. reg_renumber might be not matched to
343 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
344 live_hard_reg_pseudos. */
345 static int *live_pseudos_reg_renumber;
347 /* Sparseset used to calculate living hard reg pseudos for some program
348 point range. */
349 static sparseset live_range_hard_reg_pseudos;
351 /* Sparseset used to calculate living reload/inheritance pseudos for
352 some program point range. */
353 static sparseset live_range_reload_inheritance_pseudos;
355 /* Allocate and initialize the data about living pseudos at program
356 points. */
357 static void
358 init_lives (void)
360 int i, max_regno = max_reg_num ();
362 live_range_hard_reg_pseudos = sparseset_alloc (max_regno);
363 live_range_reload_inheritance_pseudos = sparseset_alloc (max_regno);
364 live_hard_reg_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
365 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack);
366 for (i = 0; i < lra_live_max_point; i++)
367 bitmap_initialize (&live_hard_reg_pseudos[i],
368 &live_hard_reg_pseudos_bitmap_obstack);
369 live_pseudos_reg_renumber = XNEWVEC (int, max_regno);
370 for (i = 0; i < max_regno; i++)
371 live_pseudos_reg_renumber[i] = -1;
374 /* Free the data about living pseudos at program points. */
375 static void
376 finish_lives (void)
378 sparseset_free (live_range_hard_reg_pseudos);
379 sparseset_free (live_range_reload_inheritance_pseudos);
380 free (live_hard_reg_pseudos);
381 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack);
382 free (live_pseudos_reg_renumber);
385 /* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
386 entries for pseudo REGNO. Assume that the register has been
387 spilled if FREE_P, otherwise assume that it has been assigned
388 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
389 ranges in the start chains when it is assumed to be assigned to a
390 hard register because we use the chains of pseudos assigned to hard
391 registers during allocation. */
392 static void
393 update_lives (int regno, bool free_p)
395 int p;
396 lra_live_range_t r;
398 if (reg_renumber[regno] < 0)
399 return;
400 live_pseudos_reg_renumber[regno] = free_p ? -1 : reg_renumber[regno];
401 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
403 for (p = r->start; p <= r->finish; p++)
404 if (free_p)
405 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
406 else
408 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
409 insert_in_live_range_start_chain (regno);
414 /* Sparseset used to calculate reload pseudos conflicting with a given
415 pseudo when we are trying to find a hard register for the given
416 pseudo. */
417 static sparseset conflict_reload_and_inheritance_pseudos;
419 /* Map: program point -> bitmap of all reload and inheritance pseudos
420 living at the point. */
421 static bitmap_head *live_reload_and_inheritance_pseudos;
422 static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack;
424 /* Allocate and initialize data about living reload pseudos at any
425 given program point. */
426 static void
427 init_live_reload_and_inheritance_pseudos (void)
429 int i, p, max_regno = max_reg_num ();
430 lra_live_range_t r;
432 conflict_reload_and_inheritance_pseudos = sparseset_alloc (max_regno);
433 live_reload_and_inheritance_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
434 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack);
435 for (p = 0; p < lra_live_max_point; p++)
436 bitmap_initialize (&live_reload_and_inheritance_pseudos[p],
437 &live_reload_and_inheritance_pseudos_bitmap_obstack);
438 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
440 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
441 for (p = r->start; p <= r->finish; p++)
442 bitmap_set_bit (&live_reload_and_inheritance_pseudos[p], i);
446 /* Finalize data about living reload pseudos at any given program
447 point. */
448 static void
449 finish_live_reload_and_inheritance_pseudos (void)
451 sparseset_free (conflict_reload_and_inheritance_pseudos);
452 free (live_reload_and_inheritance_pseudos);
453 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack);
456 /* The value used to check that cost of given hard reg is really
457 defined currently. */
458 static int curr_hard_regno_costs_check = 0;
459 /* Array used to check that cost of the corresponding hard reg (the
460 array element index) is really defined currently. */
461 static int hard_regno_costs_check[FIRST_PSEUDO_REGISTER];
462 /* The current costs of allocation of hard regs. Defined only if the
463 value of the corresponding element of the previous array is equal to
464 CURR_HARD_REGNO_COSTS_CHECK. */
465 static int hard_regno_costs[FIRST_PSEUDO_REGISTER];
467 /* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
468 not defined yet. */
469 static inline void
470 adjust_hard_regno_cost (int hard_regno, int incr)
472 if (hard_regno_costs_check[hard_regno] != curr_hard_regno_costs_check)
473 hard_regno_costs[hard_regno] = 0;
474 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
475 hard_regno_costs[hard_regno] += incr;
478 /* Try to find a free hard register for pseudo REGNO. Return the
479 hard register on success and set *COST to the cost of using
480 that register. (If several registers have equal cost, the one with
481 the highest priority wins.) Return -1 on failure.
483 If FIRST_P, return the first available hard reg ignoring other
484 criteria, e.g. allocation cost. This approach results in less hard
485 reg pool fragmentation and permit to allocate hard regs to reload
486 pseudos in complicated situations where pseudo sizes are different.
488 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
489 otherwise consider all hard registers in REGNO's class.
491 If REGNO_SET is not empty, only hard registers from the set are
492 considered. */
493 static int
494 find_hard_regno_for_1 (int regno, int *cost, int try_only_hard_regno,
495 bool first_p, HARD_REG_SET regno_set)
497 HARD_REG_SET conflict_set;
498 int best_cost = INT_MAX, best_priority = INT_MIN, best_usage = INT_MAX;
499 lra_live_range_t r;
500 int p, i, j, rclass_size, best_hard_regno, priority, hard_regno;
501 int hr, conflict_hr, nregs;
502 machine_mode biggest_mode;
503 unsigned int k, conflict_regno;
504 int offset, val, biggest_nregs, nregs_diff;
505 enum reg_class rclass;
506 bitmap_iterator bi;
507 bool *rclass_intersect_p;
508 HARD_REG_SET impossible_start_hard_regs, available_regs;
510 if (hard_reg_set_empty_p (regno_set))
511 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
512 else
514 COMPL_HARD_REG_SET (conflict_set, regno_set);
515 IOR_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
517 rclass = regno_allocno_class_array[regno];
518 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
519 curr_hard_regno_costs_check++;
520 sparseset_clear (conflict_reload_and_inheritance_pseudos);
521 sparseset_clear (live_range_hard_reg_pseudos);
522 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
523 biggest_mode = lra_reg_info[regno].biggest_mode;
524 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
526 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
527 if (rclass_intersect_p[regno_allocno_class_array[k]])
528 sparseset_set_bit (live_range_hard_reg_pseudos, k);
529 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos[r->start],
530 0, k, bi)
531 if (lra_reg_info[k].preferred_hard_regno1 >= 0
532 && live_pseudos_reg_renumber[k] < 0
533 && rclass_intersect_p[regno_allocno_class_array[k]])
534 sparseset_set_bit (conflict_reload_and_inheritance_pseudos, k);
535 for (p = r->start + 1; p <= r->finish; p++)
537 lra_live_range_t r2;
539 for (r2 = start_point_ranges[p];
540 r2 != NULL;
541 r2 = r2->start_next)
543 if (r2->regno >= lra_constraint_new_regno_start
544 && lra_reg_info[r2->regno].preferred_hard_regno1 >= 0
545 && live_pseudos_reg_renumber[r2->regno] < 0
546 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
547 sparseset_set_bit (conflict_reload_and_inheritance_pseudos,
548 r2->regno);
549 if (live_pseudos_reg_renumber[r2->regno] >= 0
550 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
551 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
555 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno1) >= 0)
557 adjust_hard_regno_cost
558 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit1);
559 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno2) >= 0)
560 adjust_hard_regno_cost
561 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit2);
563 #ifdef STACK_REGS
564 if (lra_reg_info[regno].no_stack_p)
565 for (i = FIRST_STACK_REG; i <= LAST_STACK_REG; i++)
566 SET_HARD_REG_BIT (conflict_set, i);
567 #endif
568 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos, regno);
569 val = lra_reg_info[regno].val;
570 offset = lra_reg_info[regno].offset;
571 CLEAR_HARD_REG_SET (impossible_start_hard_regs);
572 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
573 if (lra_reg_val_equal_p (conflict_regno, val, offset))
575 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
576 nregs = (hard_regno_nregs[conflict_hr]
577 [lra_reg_info[conflict_regno].biggest_mode]);
578 /* Remember about multi-register pseudos. For example, 2 hard
579 register pseudos can start on the same hard register but can
580 not start on HR and HR+1/HR-1. */
581 for (hr = conflict_hr + 1;
582 hr < FIRST_PSEUDO_REGISTER && hr < conflict_hr + nregs;
583 hr++)
584 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
585 for (hr = conflict_hr - 1;
586 hr >= 0 && hr + hard_regno_nregs[hr][biggest_mode] > conflict_hr;
587 hr--)
588 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
590 else
592 add_to_hard_reg_set (&conflict_set,
593 lra_reg_info[conflict_regno].biggest_mode,
594 live_pseudos_reg_renumber[conflict_regno]);
595 if (hard_reg_set_subset_p (reg_class_contents[rclass],
596 conflict_set))
597 return -1;
599 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos,
600 conflict_regno)
601 if (!lra_reg_val_equal_p (conflict_regno, val, offset))
603 lra_assert (live_pseudos_reg_renumber[conflict_regno] < 0);
604 if ((hard_regno
605 = lra_reg_info[conflict_regno].preferred_hard_regno1) >= 0)
607 adjust_hard_regno_cost
608 (hard_regno,
609 lra_reg_info[conflict_regno].preferred_hard_regno_profit1);
610 if ((hard_regno
611 = lra_reg_info[conflict_regno].preferred_hard_regno2) >= 0)
612 adjust_hard_regno_cost
613 (hard_regno,
614 lra_reg_info[conflict_regno].preferred_hard_regno_profit2);
617 /* Make sure that all registers in a multi-word pseudo belong to the
618 required class. */
619 IOR_COMPL_HARD_REG_SET (conflict_set, reg_class_contents[rclass]);
620 lra_assert (rclass != NO_REGS);
621 rclass_size = ira_class_hard_regs_num[rclass];
622 best_hard_regno = -1;
623 hard_regno = ira_class_hard_regs[rclass][0];
624 biggest_nregs = hard_regno_nregs[hard_regno][biggest_mode];
625 nregs_diff = (biggest_nregs
626 - hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)]);
627 COPY_HARD_REG_SET (available_regs, reg_class_contents[rclass]);
628 AND_COMPL_HARD_REG_SET (available_regs, lra_no_alloc_regs);
629 for (i = 0; i < rclass_size; i++)
631 if (try_only_hard_regno >= 0)
632 hard_regno = try_only_hard_regno;
633 else
634 hard_regno = ira_class_hard_regs[rclass][i];
635 if (! overlaps_hard_reg_set_p (conflict_set,
636 PSEUDO_REGNO_MODE (regno), hard_regno)
637 /* We can not use prohibited_class_mode_regs because it is
638 not defined for all classes. */
639 && HARD_REGNO_MODE_OK (hard_regno, PSEUDO_REGNO_MODE (regno))
640 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
641 && (nregs_diff == 0
642 || (WORDS_BIG_ENDIAN
643 ? (hard_regno - nregs_diff >= 0
644 && TEST_HARD_REG_BIT (available_regs,
645 hard_regno - nregs_diff))
646 : TEST_HARD_REG_BIT (available_regs,
647 hard_regno + nregs_diff))))
649 if (hard_regno_costs_check[hard_regno]
650 != curr_hard_regno_costs_check)
652 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
653 hard_regno_costs[hard_regno] = 0;
655 for (j = 0;
656 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
657 j++)
658 if (! TEST_HARD_REG_BIT (call_used_reg_set, hard_regno + j)
659 && ! df_regs_ever_live_p (hard_regno + j))
660 /* It needs save restore. */
661 hard_regno_costs[hard_regno]
662 += (2
663 * REG_FREQ_FROM_BB (ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
664 + 1);
665 priority = targetm.register_priority (hard_regno);
666 if (best_hard_regno < 0 || hard_regno_costs[hard_regno] < best_cost
667 || (hard_regno_costs[hard_regno] == best_cost
668 && (priority > best_priority
669 || (targetm.register_usage_leveling_p ()
670 && priority == best_priority
671 && best_usage > lra_hard_reg_usage[hard_regno]))))
673 best_hard_regno = hard_regno;
674 best_cost = hard_regno_costs[hard_regno];
675 best_priority = priority;
676 best_usage = lra_hard_reg_usage[hard_regno];
679 if (try_only_hard_regno >= 0 || (first_p && best_hard_regno >= 0))
680 break;
682 if (best_hard_regno >= 0)
683 *cost = best_cost - lra_reg_info[regno].freq;
684 return best_hard_regno;
687 /* A wrapper for find_hard_regno_for_1 (see comments for that function
688 description). This function tries to find a hard register for
689 preferred class first if it is worth. */
690 static int
691 find_hard_regno_for (int regno, int *cost, int try_only_hard_regno, bool first_p)
693 int hard_regno;
694 HARD_REG_SET regno_set;
696 /* Only original pseudos can have a different preferred class. */
697 if (try_only_hard_regno < 0 && regno < lra_new_regno_start)
699 enum reg_class pref_class = reg_preferred_class (regno);
701 if (regno_allocno_class_array[regno] != pref_class)
703 hard_regno = find_hard_regno_for_1 (regno, cost, -1, first_p,
704 reg_class_contents[pref_class]);
705 if (hard_regno >= 0)
706 return hard_regno;
709 CLEAR_HARD_REG_SET (regno_set);
710 return find_hard_regno_for_1 (regno, cost, try_only_hard_regno, first_p,
711 regno_set);
714 /* Current value used for checking elements in
715 update_hard_regno_preference_check. */
716 static int curr_update_hard_regno_preference_check;
717 /* If an element value is equal to the above variable value, then the
718 corresponding regno has been processed for preference
719 propagation. */
720 static int *update_hard_regno_preference_check;
722 /* Update the preference for using HARD_REGNO for pseudos that are
723 connected directly or indirectly with REGNO. Apply divisor DIV
724 to any preference adjustments.
726 The more indirectly a pseudo is connected, the smaller its effect
727 should be. We therefore increase DIV on each "hop". */
728 static void
729 update_hard_regno_preference (int regno, int hard_regno, int div)
731 int another_regno, cost;
732 lra_copy_t cp, next_cp;
734 /* Search depth 5 seems to be enough. */
735 if (div > (1 << 5))
736 return;
737 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
739 if (cp->regno1 == regno)
741 next_cp = cp->regno1_next;
742 another_regno = cp->regno2;
744 else if (cp->regno2 == regno)
746 next_cp = cp->regno2_next;
747 another_regno = cp->regno1;
749 else
750 gcc_unreachable ();
751 if (reg_renumber[another_regno] < 0
752 && (update_hard_regno_preference_check[another_regno]
753 != curr_update_hard_regno_preference_check))
755 update_hard_regno_preference_check[another_regno]
756 = curr_update_hard_regno_preference_check;
757 cost = cp->freq < div ? 1 : cp->freq / div;
758 lra_setup_reload_pseudo_preferenced_hard_reg
759 (another_regno, hard_regno, cost);
760 update_hard_regno_preference (another_regno, hard_regno, div * 2);
765 /* Return prefix title for pseudo REGNO. */
766 static const char *
767 pseudo_prefix_title (int regno)
769 return
770 (regno < lra_constraint_new_regno_start ? ""
771 : bitmap_bit_p (&lra_inheritance_pseudos, regno) ? "inheritance "
772 : bitmap_bit_p (&lra_split_regs, regno) ? "split "
773 : bitmap_bit_p (&lra_optional_reload_pseudos, regno) ? "optional reload "
774 : bitmap_bit_p (&lra_subreg_reload_pseudos, regno) ? "subreg reload "
775 : "reload ");
778 /* Update REG_RENUMBER and other pseudo preferences by assignment of
779 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
780 void
781 lra_setup_reg_renumber (int regno, int hard_regno, bool print_p)
783 int i, hr;
785 /* We can not just reassign hard register. */
786 lra_assert (hard_regno < 0 || reg_renumber[regno] < 0);
787 if ((hr = hard_regno) < 0)
788 hr = reg_renumber[regno];
789 reg_renumber[regno] = hard_regno;
790 lra_assert (hr >= 0);
791 for (i = 0; i < hard_regno_nregs[hr][PSEUDO_REGNO_MODE (regno)]; i++)
792 if (hard_regno < 0)
793 lra_hard_reg_usage[hr + i] -= lra_reg_info[regno].freq;
794 else
795 lra_hard_reg_usage[hr + i] += lra_reg_info[regno].freq;
796 if (print_p && lra_dump_file != NULL)
797 fprintf (lra_dump_file, " Assign %d to %sr%d (freq=%d)\n",
798 reg_renumber[regno], pseudo_prefix_title (regno),
799 regno, lra_reg_info[regno].freq);
800 if (hard_regno >= 0)
802 curr_update_hard_regno_preference_check++;
803 update_hard_regno_preference (regno, hard_regno, 1);
807 /* Pseudos which occur in insns containing a particular pseudo. */
808 static bitmap_head insn_conflict_pseudos;
810 /* Bitmaps used to contain spill pseudos for given pseudo hard regno
811 and best spill pseudos for given pseudo (and best hard regno). */
812 static bitmap_head spill_pseudos_bitmap, best_spill_pseudos_bitmap;
814 /* Current pseudo check for validity of elements in
815 TRY_HARD_REG_PSEUDOS. */
816 static int curr_pseudo_check;
817 /* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
818 static int try_hard_reg_pseudos_check[FIRST_PSEUDO_REGISTER];
819 /* Pseudos who hold given hard register at the considered points. */
820 static bitmap_head try_hard_reg_pseudos[FIRST_PSEUDO_REGISTER];
822 /* Set up try_hard_reg_pseudos for given program point P and class
823 RCLASS. Those are pseudos living at P and assigned to a hard
824 register of RCLASS. In other words, those are pseudos which can be
825 spilled to assign a hard register of RCLASS to a pseudo living at
826 P. */
827 static void
828 setup_try_hard_regno_pseudos (int p, enum reg_class rclass)
830 int i, hard_regno;
831 machine_mode mode;
832 unsigned int spill_regno;
833 bitmap_iterator bi;
835 /* Find what pseudos could be spilled. */
836 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[p], 0, spill_regno, bi)
838 mode = PSEUDO_REGNO_MODE (spill_regno);
839 hard_regno = live_pseudos_reg_renumber[spill_regno];
840 if (overlaps_hard_reg_set_p (reg_class_contents[rclass],
841 mode, hard_regno))
843 for (i = hard_regno_nregs[hard_regno][mode] - 1; i >= 0; i--)
845 if (try_hard_reg_pseudos_check[hard_regno + i]
846 != curr_pseudo_check)
848 try_hard_reg_pseudos_check[hard_regno + i]
849 = curr_pseudo_check;
850 bitmap_clear (&try_hard_reg_pseudos[hard_regno + i]);
852 bitmap_set_bit (&try_hard_reg_pseudos[hard_regno + i],
853 spill_regno);
859 /* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
860 assignment means that we might undo the data change. */
861 static void
862 assign_temporarily (int regno, int hard_regno)
864 int p;
865 lra_live_range_t r;
867 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
869 for (p = r->start; p <= r->finish; p++)
870 if (hard_regno < 0)
871 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
872 else
874 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
875 insert_in_live_range_start_chain (regno);
878 live_pseudos_reg_renumber[regno] = hard_regno;
881 /* Array used for sorting reload pseudos for subsequent allocation
882 after spilling some pseudo. */
883 static int *sorted_reload_pseudos;
885 /* Spill some pseudos for a reload pseudo REGNO and return hard
886 register which should be used for pseudo after spilling. The
887 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
888 choose hard register (and pseudos occupying the hard registers and
889 to be spilled), we take into account not only how REGNO will
890 benefit from the spills but also how other reload pseudos not yet
891 assigned to hard registers benefit from the spills too. In very
892 rare cases, the function can fail and return -1.
894 If FIRST_P, return the first available hard reg ignoring other
895 criteria, e.g. allocation cost and cost of spilling non-reload
896 pseudos. This approach results in less hard reg pool fragmentation
897 and permit to allocate hard regs to reload pseudos in complicated
898 situations where pseudo sizes are different. */
899 static int
900 spill_for (int regno, bitmap spilled_pseudo_bitmap, bool first_p)
902 int i, j, n, p, hard_regno, best_hard_regno, cost, best_cost, rclass_size;
903 int reload_hard_regno, reload_cost;
904 machine_mode mode;
905 enum reg_class rclass;
906 unsigned int spill_regno, reload_regno, uid;
907 int insn_pseudos_num, best_insn_pseudos_num;
908 int bad_spills_num, smallest_bad_spills_num;
909 lra_live_range_t r;
910 bitmap_iterator bi;
912 rclass = regno_allocno_class_array[regno];
913 lra_assert (reg_renumber[regno] < 0 && rclass != NO_REGS);
914 bitmap_clear (&insn_conflict_pseudos);
915 bitmap_clear (&best_spill_pseudos_bitmap);
916 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
918 struct lra_insn_reg *ir;
920 for (ir = lra_get_insn_regs (uid); ir != NULL; ir = ir->next)
921 if (ir->regno >= FIRST_PSEUDO_REGISTER)
922 bitmap_set_bit (&insn_conflict_pseudos, ir->regno);
924 best_hard_regno = -1;
925 best_cost = INT_MAX;
926 best_insn_pseudos_num = INT_MAX;
927 smallest_bad_spills_num = INT_MAX;
928 rclass_size = ira_class_hard_regs_num[rclass];
929 mode = PSEUDO_REGNO_MODE (regno);
930 /* Invalidate try_hard_reg_pseudos elements. */
931 curr_pseudo_check++;
932 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
933 for (p = r->start; p <= r->finish; p++)
934 setup_try_hard_regno_pseudos (p, rclass);
935 for (i = 0; i < rclass_size; i++)
937 hard_regno = ira_class_hard_regs[rclass][i];
938 bitmap_clear (&spill_pseudos_bitmap);
939 for (j = hard_regno_nregs[hard_regno][mode] - 1; j >= 0; j--)
941 if (try_hard_reg_pseudos_check[hard_regno + j] != curr_pseudo_check)
942 continue;
943 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos[hard_regno + j]));
944 bitmap_ior_into (&spill_pseudos_bitmap,
945 &try_hard_reg_pseudos[hard_regno + j]);
947 /* Spill pseudos. */
948 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
949 if ((pic_offset_table_rtx != NULL
950 && spill_regno == REGNO (pic_offset_table_rtx))
951 || ((int) spill_regno >= lra_constraint_new_regno_start
952 && ! bitmap_bit_p (&lra_inheritance_pseudos, spill_regno)
953 && ! bitmap_bit_p (&lra_split_regs, spill_regno)
954 && ! bitmap_bit_p (&lra_subreg_reload_pseudos, spill_regno)
955 && ! bitmap_bit_p (&lra_optional_reload_pseudos, spill_regno)))
956 goto fail;
957 insn_pseudos_num = 0;
958 bad_spills_num = 0;
959 if (lra_dump_file != NULL)
960 fprintf (lra_dump_file, " Trying %d:", hard_regno);
961 sparseset_clear (live_range_reload_inheritance_pseudos);
962 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
964 if (bitmap_bit_p (&insn_conflict_pseudos, spill_regno))
965 insn_pseudos_num++;
966 if (spill_regno >= (unsigned int) lra_bad_spill_regno_start)
967 bad_spills_num++;
968 for (r = lra_reg_info[spill_regno].live_ranges;
969 r != NULL;
970 r = r->next)
972 for (p = r->start; p <= r->finish; p++)
974 lra_live_range_t r2;
976 for (r2 = start_point_ranges[p];
977 r2 != NULL;
978 r2 = r2->start_next)
979 if (r2->regno >= lra_constraint_new_regno_start)
980 sparseset_set_bit (live_range_reload_inheritance_pseudos,
981 r2->regno);
985 n = 0;
986 if (sparseset_cardinality (live_range_reload_inheritance_pseudos)
987 <= (unsigned)LRA_MAX_CONSIDERED_RELOAD_PSEUDOS)
988 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos,
989 reload_regno)
990 if ((int) reload_regno != regno
991 && (ira_reg_classes_intersect_p
992 [rclass][regno_allocno_class_array[reload_regno]])
993 && live_pseudos_reg_renumber[reload_regno] < 0
994 && find_hard_regno_for (reload_regno, &cost, -1, first_p) < 0)
995 sorted_reload_pseudos[n++] = reload_regno;
996 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
998 update_lives (spill_regno, true);
999 if (lra_dump_file != NULL)
1000 fprintf (lra_dump_file, " spill %d(freq=%d)",
1001 spill_regno, lra_reg_info[spill_regno].freq);
1003 hard_regno = find_hard_regno_for (regno, &cost, -1, first_p);
1004 if (hard_regno >= 0)
1006 assign_temporarily (regno, hard_regno);
1007 qsort (sorted_reload_pseudos, n, sizeof (int),
1008 reload_pseudo_compare_func);
1009 for (j = 0; j < n; j++)
1011 reload_regno = sorted_reload_pseudos[j];
1012 lra_assert (live_pseudos_reg_renumber[reload_regno] < 0);
1013 if ((reload_hard_regno
1014 = find_hard_regno_for (reload_regno,
1015 &reload_cost, -1, first_p)) >= 0)
1017 if (lra_dump_file != NULL)
1018 fprintf (lra_dump_file, " assign %d(cost=%d)",
1019 reload_regno, reload_cost);
1020 assign_temporarily (reload_regno, reload_hard_regno);
1021 cost += reload_cost;
1024 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1026 rtx_insn_list *x;
1028 cost += lra_reg_info[spill_regno].freq;
1029 if (ira_reg_equiv[spill_regno].memory != NULL
1030 || ira_reg_equiv[spill_regno].constant != NULL)
1031 for (x = ira_reg_equiv[spill_regno].init_insns;
1032 x != NULL;
1033 x = x->next ())
1034 cost -= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (x->insn ()));
1036 if (best_insn_pseudos_num > insn_pseudos_num
1037 || (best_insn_pseudos_num == insn_pseudos_num
1038 && (bad_spills_num < smallest_bad_spills_num
1039 || (bad_spills_num == smallest_bad_spills_num
1040 && best_cost > cost))))
1042 best_insn_pseudos_num = insn_pseudos_num;
1043 smallest_bad_spills_num = bad_spills_num;
1044 best_cost = cost;
1045 best_hard_regno = hard_regno;
1046 bitmap_copy (&best_spill_pseudos_bitmap, &spill_pseudos_bitmap);
1047 if (lra_dump_file != NULL)
1048 fprintf (lra_dump_file,
1049 " Now best %d(cost=%d, bad_spills=%d, insn_pseudos=%d)\n",
1050 hard_regno, cost, bad_spills_num, insn_pseudos_num);
1052 assign_temporarily (regno, -1);
1053 for (j = 0; j < n; j++)
1055 reload_regno = sorted_reload_pseudos[j];
1056 if (live_pseudos_reg_renumber[reload_regno] >= 0)
1057 assign_temporarily (reload_regno, -1);
1060 if (lra_dump_file != NULL)
1061 fprintf (lra_dump_file, "\n");
1062 /* Restore the live hard reg pseudo info for spilled pseudos. */
1063 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1064 update_lives (spill_regno, false);
1065 fail:
1068 /* Spill: */
1069 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap, 0, spill_regno, bi)
1071 if ((int) spill_regno >= lra_constraint_new_regno_start)
1072 former_reload_pseudo_spill_p = true;
1073 if (lra_dump_file != NULL)
1074 fprintf (lra_dump_file, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
1075 pseudo_prefix_title (spill_regno),
1076 spill_regno, reg_renumber[spill_regno],
1077 lra_reg_info[spill_regno].freq, regno);
1078 update_lives (spill_regno, true);
1079 lra_setup_reg_renumber (spill_regno, -1, false);
1081 bitmap_ior_into (spilled_pseudo_bitmap, &best_spill_pseudos_bitmap);
1082 return best_hard_regno;
1085 /* Assign HARD_REGNO to REGNO. */
1086 static void
1087 assign_hard_regno (int hard_regno, int regno)
1089 int i;
1091 lra_assert (hard_regno >= 0);
1092 lra_setup_reg_renumber (regno, hard_regno, true);
1093 update_lives (regno, false);
1094 for (i = 0;
1095 i < hard_regno_nregs[hard_regno][lra_reg_info[regno].biggest_mode];
1096 i++)
1097 df_set_regs_ever_live (hard_regno + i, true);
1100 /* Array used for sorting different pseudos. */
1101 static int *sorted_pseudos;
1103 /* The constraints pass is allowed to create equivalences between
1104 pseudos that make the current allocation "incorrect" (in the sense
1105 that pseudos are assigned to hard registers from their own conflict
1106 sets). The global variable lra_risky_transformations_p says
1107 whether this might have happened.
1109 Process pseudos assigned to hard registers (less frequently used
1110 first), spill if a conflict is found, and mark the spilled pseudos
1111 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1112 pseudos, assigned to hard registers. */
1113 static void
1114 setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1115 spilled_pseudo_bitmap)
1117 int p, i, j, n, regno, hard_regno;
1118 unsigned int k, conflict_regno;
1119 int val, offset;
1120 HARD_REG_SET conflict_set;
1121 machine_mode mode;
1122 lra_live_range_t r;
1123 bitmap_iterator bi;
1124 int max_regno = max_reg_num ();
1126 if (! lra_risky_transformations_p)
1128 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1129 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1130 update_lives (i, false);
1131 return;
1133 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1134 if ((pic_offset_table_rtx == NULL_RTX
1135 || i != (int) REGNO (pic_offset_table_rtx))
1136 && reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1137 sorted_pseudos[n++] = i;
1138 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1139 if (pic_offset_table_rtx != NULL_RTX
1140 && (regno = REGNO (pic_offset_table_rtx)) >= FIRST_PSEUDO_REGISTER
1141 && reg_renumber[regno] >= 0 && lra_reg_info[regno].nrefs > 0)
1142 sorted_pseudos[n++] = regno;
1143 for (i = n - 1; i >= 0; i--)
1145 regno = sorted_pseudos[i];
1146 hard_regno = reg_renumber[regno];
1147 lra_assert (hard_regno >= 0);
1148 mode = lra_reg_info[regno].biggest_mode;
1149 sparseset_clear (live_range_hard_reg_pseudos);
1150 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1152 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1153 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1154 for (p = r->start + 1; p <= r->finish; p++)
1156 lra_live_range_t r2;
1158 for (r2 = start_point_ranges[p];
1159 r2 != NULL;
1160 r2 = r2->start_next)
1161 if (live_pseudos_reg_renumber[r2->regno] >= 0)
1162 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1165 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
1166 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
1167 val = lra_reg_info[regno].val;
1168 offset = lra_reg_info[regno].offset;
1169 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1170 if (!lra_reg_val_equal_p (conflict_regno, val, offset)
1171 /* If it is multi-register pseudos they should start on
1172 the same hard register. */
1173 || hard_regno != reg_renumber[conflict_regno])
1174 add_to_hard_reg_set (&conflict_set,
1175 lra_reg_info[conflict_regno].biggest_mode,
1176 reg_renumber[conflict_regno]);
1177 if (! overlaps_hard_reg_set_p (conflict_set, mode, hard_regno))
1179 update_lives (regno, false);
1180 continue;
1182 bitmap_set_bit (spilled_pseudo_bitmap, regno);
1183 for (j = 0;
1184 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
1185 j++)
1186 lra_hard_reg_usage[hard_regno + j] -= lra_reg_info[regno].freq;
1187 reg_renumber[regno] = -1;
1188 if (regno >= lra_constraint_new_regno_start)
1189 former_reload_pseudo_spill_p = true;
1190 if (lra_dump_file != NULL)
1191 fprintf (lra_dump_file, " Spill r%d after risky transformations\n",
1192 regno);
1196 /* Improve allocation by assigning the same hard regno of inheritance
1197 pseudos to the connected pseudos. We need this because inheritance
1198 pseudos are allocated after reload pseudos in the thread and when
1199 we assign a hard register to a reload pseudo we don't know yet that
1200 the connected inheritance pseudos can get the same hard register.
1201 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1202 static void
1203 improve_inheritance (bitmap changed_pseudos)
1205 unsigned int k;
1206 int regno, another_regno, hard_regno, another_hard_regno, cost, i, n;
1207 lra_copy_t cp, next_cp;
1208 bitmap_iterator bi;
1210 if (lra_inheritance_iter > LRA_MAX_INHERITANCE_PASSES)
1211 return;
1212 n = 0;
1213 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, k, bi)
1214 if (reg_renumber[k] >= 0 && lra_reg_info[k].nrefs != 0)
1215 sorted_pseudos[n++] = k;
1216 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1217 for (i = 0; i < n; i++)
1219 regno = sorted_pseudos[i];
1220 hard_regno = reg_renumber[regno];
1221 lra_assert (hard_regno >= 0);
1222 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
1224 if (cp->regno1 == regno)
1226 next_cp = cp->regno1_next;
1227 another_regno = cp->regno2;
1229 else if (cp->regno2 == regno)
1231 next_cp = cp->regno2_next;
1232 another_regno = cp->regno1;
1234 else
1235 gcc_unreachable ();
1236 /* Don't change reload pseudo allocation. It might have
1237 this allocation for a purpose and changing it can result
1238 in LRA cycling. */
1239 if ((another_regno < lra_constraint_new_regno_start
1240 || bitmap_bit_p (&lra_inheritance_pseudos, another_regno))
1241 && (another_hard_regno = reg_renumber[another_regno]) >= 0
1242 && another_hard_regno != hard_regno)
1244 if (lra_dump_file != NULL)
1245 fprintf
1246 (lra_dump_file,
1247 " Improving inheritance for %d(%d) and %d(%d)...\n",
1248 regno, hard_regno, another_regno, another_hard_regno);
1249 update_lives (another_regno, true);
1250 lra_setup_reg_renumber (another_regno, -1, false);
1251 if (hard_regno == find_hard_regno_for (another_regno, &cost,
1252 hard_regno, false))
1253 assign_hard_regno (hard_regno, another_regno);
1254 else
1255 assign_hard_regno (another_hard_regno, another_regno);
1256 bitmap_set_bit (changed_pseudos, another_regno);
1263 /* Bitmap finally containing all pseudos spilled on this assignment
1264 pass. */
1265 static bitmap_head all_spilled_pseudos;
1266 /* All pseudos whose allocation was changed. */
1267 static bitmap_head changed_pseudo_bitmap;
1270 /* Add to LIVE_RANGE_HARD_REG_PSEUDOS all pseudos conflicting with
1271 REGNO and whose hard regs can be assigned to REGNO. */
1272 static void
1273 find_all_spills_for (int regno)
1275 int p;
1276 lra_live_range_t r;
1277 unsigned int k;
1278 bitmap_iterator bi;
1279 enum reg_class rclass;
1280 bool *rclass_intersect_p;
1282 rclass = regno_allocno_class_array[regno];
1283 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
1284 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1286 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1287 if (rclass_intersect_p[regno_allocno_class_array[k]])
1288 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1289 for (p = r->start + 1; p <= r->finish; p++)
1291 lra_live_range_t r2;
1293 for (r2 = start_point_ranges[p];
1294 r2 != NULL;
1295 r2 = r2->start_next)
1297 if (live_pseudos_reg_renumber[r2->regno] >= 0
1298 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
1299 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1305 /* Assign hard registers to reload pseudos and other pseudos. */
1306 static void
1307 assign_by_spills (void)
1309 int i, n, nfails, iter, regno, hard_regno, cost, restore_regno;
1310 rtx_insn *insn;
1311 bitmap_head changed_insns, do_not_assign_nonreload_pseudos;
1312 unsigned int u, conflict_regno;
1313 bitmap_iterator bi;
1314 bool reload_p;
1315 int max_regno = max_reg_num ();
1317 for (n = 0, i = lra_constraint_new_regno_start; i < max_regno; i++)
1318 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1319 && regno_allocno_class_array[i] != NO_REGS)
1320 sorted_pseudos[n++] = i;
1321 bitmap_initialize (&insn_conflict_pseudos, &reg_obstack);
1322 bitmap_initialize (&spill_pseudos_bitmap, &reg_obstack);
1323 bitmap_initialize (&best_spill_pseudos_bitmap, &reg_obstack);
1324 update_hard_regno_preference_check = XCNEWVEC (int, max_regno);
1325 curr_update_hard_regno_preference_check = 0;
1326 memset (try_hard_reg_pseudos_check, 0, sizeof (try_hard_reg_pseudos_check));
1327 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1328 bitmap_initialize (&try_hard_reg_pseudos[i], &reg_obstack);
1329 curr_pseudo_check = 0;
1330 bitmap_initialize (&changed_insns, &reg_obstack);
1331 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1332 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
1333 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
1334 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
1335 for (iter = 0; iter <= 1; iter++)
1337 qsort (sorted_pseudos, n, sizeof (int), reload_pseudo_compare_func);
1338 nfails = 0;
1339 for (i = 0; i < n; i++)
1341 regno = sorted_pseudos[i];
1342 if (lra_dump_file != NULL)
1343 fprintf (lra_dump_file, " Assigning to %d "
1344 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1345 regno, reg_class_names[regno_allocno_class_array[regno]],
1346 ORIGINAL_REGNO (regno_reg_rtx[regno]),
1347 lra_reg_info[regno].freq, regno_assign_info[regno].first,
1348 regno_assign_info[regno_assign_info[regno].first].freq);
1349 hard_regno = find_hard_regno_for (regno, &cost, -1, iter == 1);
1350 reload_p = ! bitmap_bit_p (&non_reload_pseudos, regno);
1351 if (hard_regno < 0 && reload_p)
1352 hard_regno = spill_for (regno, &all_spilled_pseudos, iter == 1);
1353 if (hard_regno < 0)
1355 if (reload_p)
1356 sorted_pseudos[nfails++] = regno;
1358 else
1360 /* This register might have been spilled by the previous
1361 pass. Indicate that it is no longer spilled. */
1362 bitmap_clear_bit (&all_spilled_pseudos, regno);
1363 assign_hard_regno (hard_regno, regno);
1364 if (! reload_p)
1365 /* As non-reload pseudo assignment is changed we
1366 should reconsider insns referring for the
1367 pseudo. */
1368 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1371 if (nfails == 0)
1372 break;
1373 if (iter > 0)
1375 /* We did not assign hard regs to reload pseudos after two iterations.
1376 Either it's an asm and something is wrong with the constraints, or
1377 we have run out of spill registers; error out in either case. */
1378 bool asm_p = false;
1379 bitmap_head failed_reload_insns;
1381 bitmap_initialize (&failed_reload_insns, &reg_obstack);
1382 for (i = 0; i < nfails; i++)
1384 regno = sorted_pseudos[i];
1385 bitmap_ior_into (&failed_reload_insns,
1386 &lra_reg_info[regno].insn_bitmap);
1387 /* Assign an arbitrary hard register of regno class to
1388 avoid further trouble with this insn. */
1389 bitmap_clear_bit (&all_spilled_pseudos, regno);
1390 assign_hard_regno
1391 (ira_class_hard_regs[regno_allocno_class_array[regno]][0],
1392 regno);
1394 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns, 0, u, bi)
1396 insn = lra_insn_recog_data[u]->insn;
1397 if (asm_noperands (PATTERN (insn)) >= 0)
1399 asm_p = true;
1400 error_for_asm (insn,
1401 "%<asm%> operand has impossible constraints");
1402 /* Avoid further trouble with this insn.
1403 For asm goto, instead of fixing up all the edges
1404 just clear the template and clear input operands
1405 (asm goto doesn't have any output operands). */
1406 if (JUMP_P (insn))
1408 rtx asm_op = extract_asm_operands (PATTERN (insn));
1409 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1410 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1411 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1412 lra_update_insn_regno_info (insn);
1414 else
1416 PATTERN (insn) = gen_rtx_USE (VOIDmode, const0_rtx);
1417 lra_set_insn_deleted (insn);
1420 else if (!asm_p)
1422 error ("unable to find a register to spill");
1423 fatal_insn ("this is the insn:", insn);
1426 break;
1428 /* This is a very rare event. We can not assign a hard register
1429 to reload pseudo because the hard register was assigned to
1430 another reload pseudo on a previous assignment pass. For x86
1431 example, on the 1st pass we assigned CX (although another
1432 hard register could be used for this) to reload pseudo in an
1433 insn, on the 2nd pass we need CX (and only this) hard
1434 register for a new reload pseudo in the same insn. Another
1435 possible situation may occur in assigning to multi-regs
1436 reload pseudos when hard regs pool is too fragmented even
1437 after spilling non-reload pseudos.
1439 We should do something radical here to succeed. Here we
1440 spill *all* conflicting pseudos and reassign them. */
1441 if (lra_dump_file != NULL)
1442 fprintf (lra_dump_file, " 2nd iter for reload pseudo assignments:\n");
1443 sparseset_clear (live_range_hard_reg_pseudos);
1444 for (i = 0; i < nfails; i++)
1446 if (lra_dump_file != NULL)
1447 fprintf (lra_dump_file, " Reload r%d assignment failure\n",
1448 sorted_pseudos[i]);
1449 find_all_spills_for (sorted_pseudos[i]);
1451 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1453 if ((int) conflict_regno >= lra_constraint_new_regno_start)
1455 sorted_pseudos[nfails++] = conflict_regno;
1456 former_reload_pseudo_spill_p = true;
1458 if (lra_dump_file != NULL)
1459 fprintf (lra_dump_file, " Spill %s r%d(hr=%d, freq=%d)\n",
1460 pseudo_prefix_title (conflict_regno), conflict_regno,
1461 reg_renumber[conflict_regno],
1462 lra_reg_info[conflict_regno].freq);
1463 update_lives (conflict_regno, true);
1464 lra_setup_reg_renumber (conflict_regno, -1, false);
1466 n = nfails;
1468 improve_inheritance (&changed_pseudo_bitmap);
1469 bitmap_clear (&non_reload_pseudos);
1470 bitmap_clear (&changed_insns);
1471 if (! lra_simple_p)
1473 /* We should not assign to original pseudos of inheritance
1474 pseudos or split pseudos if any its inheritance pseudo did
1475 not get hard register or any its split pseudo was not split
1476 because undo inheritance/split pass will extend live range of
1477 such inheritance or split pseudos. */
1478 bitmap_initialize (&do_not_assign_nonreload_pseudos, &reg_obstack);
1479 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, u, bi)
1480 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1481 && reg_renumber[u] < 0
1482 && bitmap_bit_p (&lra_inheritance_pseudos, u))
1483 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1484 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs, 0, u, bi)
1485 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1486 && reg_renumber[u] >= 0)
1487 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1488 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1489 if (((i < lra_constraint_new_regno_start
1490 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos, i))
1491 || (bitmap_bit_p (&lra_inheritance_pseudos, i)
1492 && lra_reg_info[i].restore_regno >= 0)
1493 || (bitmap_bit_p (&lra_split_regs, i)
1494 && lra_reg_info[i].restore_regno >= 0)
1495 || bitmap_bit_p (&lra_subreg_reload_pseudos, i)
1496 || bitmap_bit_p (&lra_optional_reload_pseudos, i))
1497 && reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1498 && regno_allocno_class_array[i] != NO_REGS)
1499 sorted_pseudos[n++] = i;
1500 bitmap_clear (&do_not_assign_nonreload_pseudos);
1501 if (n != 0 && lra_dump_file != NULL)
1502 fprintf (lra_dump_file, " Reassigning non-reload pseudos\n");
1503 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1504 for (i = 0; i < n; i++)
1506 regno = sorted_pseudos[i];
1507 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1508 if (hard_regno >= 0)
1510 assign_hard_regno (hard_regno, regno);
1511 /* We change allocation for non-reload pseudo on this
1512 iteration -- mark the pseudo for invalidation of used
1513 alternatives of insns containing the pseudo. */
1514 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1516 else
1518 enum reg_class rclass = lra_get_allocno_class (regno);
1519 enum reg_class spill_class;
1521 if (targetm.spill_class == NULL
1522 || lra_reg_info[regno].restore_regno < 0
1523 || ! bitmap_bit_p (&lra_inheritance_pseudos, regno)
1524 || (spill_class
1525 = ((enum reg_class)
1526 targetm.spill_class
1527 ((reg_class_t) rclass,
1528 PSEUDO_REGNO_MODE (regno)))) == NO_REGS)
1529 continue;
1530 regno_allocno_class_array[regno] = spill_class;
1531 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1532 if (hard_regno < 0)
1533 regno_allocno_class_array[regno] = rclass;
1534 else
1536 setup_reg_classes
1537 (regno, spill_class, spill_class, spill_class);
1538 assign_hard_regno (hard_regno, regno);
1539 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1544 free (update_hard_regno_preference_check);
1545 bitmap_clear (&best_spill_pseudos_bitmap);
1546 bitmap_clear (&spill_pseudos_bitmap);
1547 bitmap_clear (&insn_conflict_pseudos);
1551 /* Entry function to assign hard registers to new reload pseudos
1552 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1553 of old pseudos) and possibly to the old pseudos. The function adds
1554 what insns to process for the next constraint pass. Those are all
1555 insns who contains non-reload and non-inheritance pseudos with
1556 changed allocation.
1558 Return true if we did not spill any non-reload and non-inheritance
1559 pseudos. */
1560 bool
1561 lra_assign (void)
1563 int i;
1564 unsigned int u;
1565 bitmap_iterator bi;
1566 bitmap_head insns_to_process;
1567 bool no_spills_p;
1568 int max_regno = max_reg_num ();
1570 timevar_push (TV_LRA_ASSIGN);
1571 lra_assignment_iter++;
1572 if (lra_dump_file != NULL)
1573 fprintf (lra_dump_file, "\n********** Assignment #%d: **********\n\n",
1574 lra_assignment_iter);
1575 init_lives ();
1576 sorted_pseudos = XNEWVEC (int, max_regno);
1577 sorted_reload_pseudos = XNEWVEC (int, max_regno);
1578 regno_allocno_class_array = XNEWVEC (enum reg_class, max_regno);
1579 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1580 regno_allocno_class_array[i] = lra_get_allocno_class (i);
1581 former_reload_pseudo_spill_p = false;
1582 init_regno_assign_info ();
1583 bitmap_initialize (&all_spilled_pseudos, &reg_obstack);
1584 create_live_range_start_chains ();
1585 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos);
1586 #ifdef ENABLE_CHECKING
1587 if (!flag_ipa_ra)
1588 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1589 if (lra_reg_info[i].nrefs != 0 && reg_renumber[i] >= 0
1590 && lra_reg_info[i].call_p
1591 && overlaps_hard_reg_set_p (call_used_reg_set,
1592 PSEUDO_REGNO_MODE (i), reg_renumber[i]))
1593 gcc_unreachable ();
1594 #endif
1595 /* Setup insns to process on the next constraint pass. */
1596 bitmap_initialize (&changed_pseudo_bitmap, &reg_obstack);
1597 init_live_reload_and_inheritance_pseudos ();
1598 assign_by_spills ();
1599 finish_live_reload_and_inheritance_pseudos ();
1600 bitmap_ior_into (&changed_pseudo_bitmap, &all_spilled_pseudos);
1601 no_spills_p = true;
1602 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos, 0, u, bi)
1603 /* We ignore spilled pseudos created on last inheritance pass
1604 because they will be removed. */
1605 if (lra_reg_info[u].restore_regno < 0)
1607 no_spills_p = false;
1608 break;
1610 finish_live_range_start_chains ();
1611 bitmap_clear (&all_spilled_pseudos);
1612 bitmap_initialize (&insns_to_process, &reg_obstack);
1613 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap, 0, u, bi)
1614 bitmap_ior_into (&insns_to_process, &lra_reg_info[u].insn_bitmap);
1615 bitmap_clear (&changed_pseudo_bitmap);
1616 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process, 0, u, bi)
1618 lra_push_insn_by_uid (u);
1619 /* Invalidate alternatives for insn should be processed. */
1620 lra_set_used_insn_alternative_by_uid (u, -1);
1622 bitmap_clear (&insns_to_process);
1623 finish_regno_assign_info ();
1624 free (regno_allocno_class_array);
1625 free (sorted_pseudos);
1626 free (sorted_reload_pseudos);
1627 finish_lives ();
1628 timevar_pop (TV_LRA_ASSIGN);
1629 if (former_reload_pseudo_spill_p)
1630 lra_assignment_iter_after_spill++;
1631 if (lra_assignment_iter_after_spill > LRA_MAX_ASSIGNMENT_ITERATION_NUMBER)
1632 internal_error
1633 ("Maximum number of LRA assignment passes is achieved (%d)\n",
1634 LRA_MAX_ASSIGNMENT_ITERATION_NUMBER);
1635 return no_spills_p;