2015-06-11 Paul Thomas <pault@gcc.gnu.org>
[official-gcc.git] / gcc / lra-assigns.c
blob8bbede0b3b484c37bf86d0e06e3ddbcf27b7c8e7
1 /* Assign reload pseudos.
2 Copyright (C) 2010-2015 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
22 /* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
36 and spill registers.
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
50 copies.
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
64 Only insns with changed allocation pseudos are processed on the
65 next constraint pass.
67 The pseudo live-ranges are used to find conflicting pseudos.
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
75 restore_regno. */
77 #include "config.h"
78 #include "system.h"
79 #include "coretypes.h"
80 #include "tm.h"
81 #include "hard-reg-set.h"
82 #include "rtl.h"
83 #include "rtl-error.h"
84 #include "tm_p.h"
85 #include "target.h"
86 #include "insn-config.h"
87 #include "recog.h"
88 #include "output.h"
89 #include "regs.h"
90 #include "input.h"
91 #include "function.h"
92 #include "symtab.h"
93 #include "flags.h"
94 #include "alias.h"
95 #include "tree.h"
96 #include "expmed.h"
97 #include "dojump.h"
98 #include "explow.h"
99 #include "calls.h"
100 #include "emit-rtl.h"
101 #include "varasm.h"
102 #include "stmt.h"
103 #include "expr.h"
104 #include "predict.h"
105 #include "dominance.h"
106 #include "cfg.h"
107 #include "basic-block.h"
108 #include "except.h"
109 #include "df.h"
110 #include "ira.h"
111 #include "sparseset.h"
112 #include "params.h"
113 #include "lra-int.h"
115 /* Current iteration number of the pass and current iteration number
116 of the pass after the latest spill pass when any former reload
117 pseudo was spilled. */
118 int lra_assignment_iter;
119 int lra_assignment_iter_after_spill;
121 /* Flag of spilling former reload pseudos on this pass. */
122 static bool former_reload_pseudo_spill_p;
124 /* Array containing corresponding values of function
125 lra_get_allocno_class. It is used to speed up the code. */
126 static enum reg_class *regno_allocno_class_array;
128 /* Information about the thread to which a pseudo belongs. Threads are
129 a set of connected reload and inheritance pseudos with the same set of
130 available hard registers. Lone registers belong to their own threads. */
131 struct regno_assign_info
133 /* First/next pseudo of the same thread. */
134 int first, next;
135 /* Frequency of the thread (execution frequency of only reload
136 pseudos in the thread when the thread contains a reload pseudo).
137 Defined only for the first thread pseudo. */
138 int freq;
141 /* Map regno to the corresponding regno assignment info. */
142 static struct regno_assign_info *regno_assign_info;
144 /* All inherited, subreg or optional pseudos created before last spill
145 sub-pass. Such pseudos are permitted to get memory instead of hard
146 regs. */
147 static bitmap_head non_reload_pseudos;
149 /* Process a pseudo copy with execution frequency COPY_FREQ connecting
150 REGNO1 and REGNO2 to form threads. */
151 static void
152 process_copy_to_form_thread (int regno1, int regno2, int copy_freq)
154 int last, regno1_first, regno2_first;
156 lra_assert (regno1 >= lra_constraint_new_regno_start
157 && regno2 >= lra_constraint_new_regno_start);
158 regno1_first = regno_assign_info[regno1].first;
159 regno2_first = regno_assign_info[regno2].first;
160 if (regno1_first != regno2_first)
162 for (last = regno2_first;
163 regno_assign_info[last].next >= 0;
164 last = regno_assign_info[last].next)
165 regno_assign_info[last].first = regno1_first;
166 regno_assign_info[last].first = regno1_first;
167 regno_assign_info[last].next = regno_assign_info[regno1_first].next;
168 regno_assign_info[regno1_first].next = regno2_first;
169 regno_assign_info[regno1_first].freq
170 += regno_assign_info[regno2_first].freq;
172 regno_assign_info[regno1_first].freq -= 2 * copy_freq;
173 lra_assert (regno_assign_info[regno1_first].freq >= 0);
176 /* Initialize REGNO_ASSIGN_INFO and form threads. */
177 static void
178 init_regno_assign_info (void)
180 int i, regno1, regno2, max_regno = max_reg_num ();
181 lra_copy_t cp;
183 regno_assign_info = XNEWVEC (struct regno_assign_info, max_regno);
184 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
186 regno_assign_info[i].first = i;
187 regno_assign_info[i].next = -1;
188 regno_assign_info[i].freq = lra_reg_info[i].freq;
190 /* Form the threads. */
191 for (i = 0; (cp = lra_get_copy (i)) != NULL; i++)
192 if ((regno1 = cp->regno1) >= lra_constraint_new_regno_start
193 && (regno2 = cp->regno2) >= lra_constraint_new_regno_start
194 && reg_renumber[regno1] < 0 && lra_reg_info[regno1].nrefs != 0
195 && reg_renumber[regno2] < 0 && lra_reg_info[regno2].nrefs != 0
196 && (ira_class_hard_regs_num[regno_allocno_class_array[regno1]]
197 == ira_class_hard_regs_num[regno_allocno_class_array[regno2]]))
198 process_copy_to_form_thread (regno1, regno2, cp->freq);
201 /* Free REGNO_ASSIGN_INFO. */
202 static void
203 finish_regno_assign_info (void)
205 free (regno_assign_info);
208 /* The function is used to sort *reload* and *inheritance* pseudos to
209 try to assign them hard registers. We put pseudos from the same
210 thread always nearby. */
211 static int
212 reload_pseudo_compare_func (const void *v1p, const void *v2p)
214 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
215 enum reg_class cl1 = regno_allocno_class_array[r1];
216 enum reg_class cl2 = regno_allocno_class_array[r2];
217 int diff;
219 lra_assert (r1 >= lra_constraint_new_regno_start
220 && r2 >= lra_constraint_new_regno_start);
222 /* Prefer to assign reload registers with smaller classes first to
223 guarantee assignment to all reload registers. */
224 if ((diff = (ira_class_hard_regs_num[cl1]
225 - ira_class_hard_regs_num[cl2])) != 0)
226 return diff;
227 if ((diff
228 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
229 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0
230 /* The code below executes rarely as nregs == 1 in most cases.
231 So we should not worry about using faster data structures to
232 check reload pseudos. */
233 && ! bitmap_bit_p (&non_reload_pseudos, r1)
234 && ! bitmap_bit_p (&non_reload_pseudos, r2))
235 return diff;
236 if ((diff = (regno_assign_info[regno_assign_info[r2].first].freq
237 - regno_assign_info[regno_assign_info[r1].first].freq)) != 0)
238 return diff;
239 /* Allocate bigger pseudos first to avoid register file
240 fragmentation. */
241 if ((diff
242 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
243 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0)
244 return diff;
245 /* Put pseudos from the thread nearby. */
246 if ((diff = regno_assign_info[r1].first - regno_assign_info[r2].first) != 0)
247 return diff;
248 /* If regs are equally good, sort by their numbers, so that the
249 results of qsort leave nothing to chance. */
250 return r1 - r2;
253 /* The function is used to sort *non-reload* pseudos to try to assign
254 them hard registers. The order calculation is simpler than in the
255 previous function and based on the pseudo frequency usage. */
256 static int
257 pseudo_compare_func (const void *v1p, const void *v2p)
259 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
260 int diff;
262 /* Prefer to assign more frequently used registers first. */
263 if ((diff = lra_reg_info[r2].freq - lra_reg_info[r1].freq) != 0)
264 return diff;
266 /* If regs are equally good, sort by their numbers, so that the
267 results of qsort leave nothing to chance. */
268 return r1 - r2;
271 /* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
272 pseudo live ranges with given start point. We insert only live
273 ranges of pseudos interesting for assignment purposes. They are
274 reload pseudos and pseudos assigned to hard registers. */
275 static lra_live_range_t *start_point_ranges;
277 /* Used as a flag that a live range is not inserted in the start point
278 chain. */
279 static struct lra_live_range not_in_chain_mark;
281 /* Create and set up START_POINT_RANGES. */
282 static void
283 create_live_range_start_chains (void)
285 int i, max_regno;
286 lra_live_range_t r;
288 start_point_ranges = XCNEWVEC (lra_live_range_t, lra_live_max_point);
289 max_regno = max_reg_num ();
290 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
291 if (i >= lra_constraint_new_regno_start || reg_renumber[i] >= 0)
293 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
295 r->start_next = start_point_ranges[r->start];
296 start_point_ranges[r->start] = r;
299 else
301 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
302 r->start_next = &not_in_chain_mark;
306 /* Insert live ranges of pseudo REGNO into start chains if they are
307 not there yet. */
308 static void
309 insert_in_live_range_start_chain (int regno)
311 lra_live_range_t r = lra_reg_info[regno].live_ranges;
313 if (r->start_next != &not_in_chain_mark)
314 return;
315 for (; r != NULL; r = r->next)
317 r->start_next = start_point_ranges[r->start];
318 start_point_ranges[r->start] = r;
322 /* Free START_POINT_RANGES. */
323 static void
324 finish_live_range_start_chains (void)
326 gcc_assert (start_point_ranges != NULL);
327 free (start_point_ranges);
328 start_point_ranges = NULL;
331 /* Map: program point -> bitmap of all pseudos living at the point and
332 assigned to hard registers. */
333 static bitmap_head *live_hard_reg_pseudos;
334 static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack;
336 /* reg_renumber corresponding to pseudos marked in
337 live_hard_reg_pseudos. reg_renumber might be not matched to
338 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
339 live_hard_reg_pseudos. */
340 static int *live_pseudos_reg_renumber;
342 /* Sparseset used to calculate living hard reg pseudos for some program
343 point range. */
344 static sparseset live_range_hard_reg_pseudos;
346 /* Sparseset used to calculate living reload/inheritance pseudos for
347 some program point range. */
348 static sparseset live_range_reload_inheritance_pseudos;
350 /* Allocate and initialize the data about living pseudos at program
351 points. */
352 static void
353 init_lives (void)
355 int i, max_regno = max_reg_num ();
357 live_range_hard_reg_pseudos = sparseset_alloc (max_regno);
358 live_range_reload_inheritance_pseudos = sparseset_alloc (max_regno);
359 live_hard_reg_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
360 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack);
361 for (i = 0; i < lra_live_max_point; i++)
362 bitmap_initialize (&live_hard_reg_pseudos[i],
363 &live_hard_reg_pseudos_bitmap_obstack);
364 live_pseudos_reg_renumber = XNEWVEC (int, max_regno);
365 for (i = 0; i < max_regno; i++)
366 live_pseudos_reg_renumber[i] = -1;
369 /* Free the data about living pseudos at program points. */
370 static void
371 finish_lives (void)
373 sparseset_free (live_range_hard_reg_pseudos);
374 sparseset_free (live_range_reload_inheritance_pseudos);
375 free (live_hard_reg_pseudos);
376 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack);
377 free (live_pseudos_reg_renumber);
380 /* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
381 entries for pseudo REGNO. Assume that the register has been
382 spilled if FREE_P, otherwise assume that it has been assigned
383 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
384 ranges in the start chains when it is assumed to be assigned to a
385 hard register because we use the chains of pseudos assigned to hard
386 registers during allocation. */
387 static void
388 update_lives (int regno, bool free_p)
390 int p;
391 lra_live_range_t r;
393 if (reg_renumber[regno] < 0)
394 return;
395 live_pseudos_reg_renumber[regno] = free_p ? -1 : reg_renumber[regno];
396 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
398 for (p = r->start; p <= r->finish; p++)
399 if (free_p)
400 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
401 else
403 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
404 insert_in_live_range_start_chain (regno);
409 /* Sparseset used to calculate reload pseudos conflicting with a given
410 pseudo when we are trying to find a hard register for the given
411 pseudo. */
412 static sparseset conflict_reload_and_inheritance_pseudos;
414 /* Map: program point -> bitmap of all reload and inheritance pseudos
415 living at the point. */
416 static bitmap_head *live_reload_and_inheritance_pseudos;
417 static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack;
419 /* Allocate and initialize data about living reload pseudos at any
420 given program point. */
421 static void
422 init_live_reload_and_inheritance_pseudos (void)
424 int i, p, max_regno = max_reg_num ();
425 lra_live_range_t r;
427 conflict_reload_and_inheritance_pseudos = sparseset_alloc (max_regno);
428 live_reload_and_inheritance_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
429 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack);
430 for (p = 0; p < lra_live_max_point; p++)
431 bitmap_initialize (&live_reload_and_inheritance_pseudos[p],
432 &live_reload_and_inheritance_pseudos_bitmap_obstack);
433 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
435 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
436 for (p = r->start; p <= r->finish; p++)
437 bitmap_set_bit (&live_reload_and_inheritance_pseudos[p], i);
441 /* Finalize data about living reload pseudos at any given program
442 point. */
443 static void
444 finish_live_reload_and_inheritance_pseudos (void)
446 sparseset_free (conflict_reload_and_inheritance_pseudos);
447 free (live_reload_and_inheritance_pseudos);
448 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack);
451 /* The value used to check that cost of given hard reg is really
452 defined currently. */
453 static int curr_hard_regno_costs_check = 0;
454 /* Array used to check that cost of the corresponding hard reg (the
455 array element index) is really defined currently. */
456 static int hard_regno_costs_check[FIRST_PSEUDO_REGISTER];
457 /* The current costs of allocation of hard regs. Defined only if the
458 value of the corresponding element of the previous array is equal to
459 CURR_HARD_REGNO_COSTS_CHECK. */
460 static int hard_regno_costs[FIRST_PSEUDO_REGISTER];
462 /* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
463 not defined yet. */
464 static inline void
465 adjust_hard_regno_cost (int hard_regno, int incr)
467 if (hard_regno_costs_check[hard_regno] != curr_hard_regno_costs_check)
468 hard_regno_costs[hard_regno] = 0;
469 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
470 hard_regno_costs[hard_regno] += incr;
473 /* Try to find a free hard register for pseudo REGNO. Return the
474 hard register on success and set *COST to the cost of using
475 that register. (If several registers have equal cost, the one with
476 the highest priority wins.) Return -1 on failure.
478 If FIRST_P, return the first available hard reg ignoring other
479 criteria, e.g. allocation cost. This approach results in less hard
480 reg pool fragmentation and permit to allocate hard regs to reload
481 pseudos in complicated situations where pseudo sizes are different.
483 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
484 otherwise consider all hard registers in REGNO's class.
486 If REGNO_SET is not empty, only hard registers from the set are
487 considered. */
488 static int
489 find_hard_regno_for_1 (int regno, int *cost, int try_only_hard_regno,
490 bool first_p, HARD_REG_SET regno_set)
492 HARD_REG_SET conflict_set;
493 int best_cost = INT_MAX, best_priority = INT_MIN, best_usage = INT_MAX;
494 lra_live_range_t r;
495 int p, i, j, rclass_size, best_hard_regno, priority, hard_regno;
496 int hr, conflict_hr, nregs;
497 machine_mode biggest_mode;
498 unsigned int k, conflict_regno;
499 int offset, val, biggest_nregs, nregs_diff;
500 enum reg_class rclass;
501 bitmap_iterator bi;
502 bool *rclass_intersect_p;
503 HARD_REG_SET impossible_start_hard_regs, available_regs;
505 if (hard_reg_set_empty_p (regno_set))
506 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
507 else
509 COMPL_HARD_REG_SET (conflict_set, regno_set);
510 IOR_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
512 rclass = regno_allocno_class_array[regno];
513 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
514 curr_hard_regno_costs_check++;
515 sparseset_clear (conflict_reload_and_inheritance_pseudos);
516 sparseset_clear (live_range_hard_reg_pseudos);
517 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
518 biggest_mode = lra_reg_info[regno].biggest_mode;
519 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
521 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
522 if (rclass_intersect_p[regno_allocno_class_array[k]])
523 sparseset_set_bit (live_range_hard_reg_pseudos, k);
524 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos[r->start],
525 0, k, bi)
526 if (lra_reg_info[k].preferred_hard_regno1 >= 0
527 && live_pseudos_reg_renumber[k] < 0
528 && rclass_intersect_p[regno_allocno_class_array[k]])
529 sparseset_set_bit (conflict_reload_and_inheritance_pseudos, k);
530 for (p = r->start + 1; p <= r->finish; p++)
532 lra_live_range_t r2;
534 for (r2 = start_point_ranges[p];
535 r2 != NULL;
536 r2 = r2->start_next)
538 if (r2->regno >= lra_constraint_new_regno_start
539 && lra_reg_info[r2->regno].preferred_hard_regno1 >= 0
540 && live_pseudos_reg_renumber[r2->regno] < 0
541 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
542 sparseset_set_bit (conflict_reload_and_inheritance_pseudos,
543 r2->regno);
544 if (live_pseudos_reg_renumber[r2->regno] >= 0
545 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
546 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
550 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno1) >= 0)
552 adjust_hard_regno_cost
553 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit1);
554 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno2) >= 0)
555 adjust_hard_regno_cost
556 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit2);
558 #ifdef STACK_REGS
559 if (lra_reg_info[regno].no_stack_p)
560 for (i = FIRST_STACK_REG; i <= LAST_STACK_REG; i++)
561 SET_HARD_REG_BIT (conflict_set, i);
562 #endif
563 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos, regno);
564 val = lra_reg_info[regno].val;
565 offset = lra_reg_info[regno].offset;
566 CLEAR_HARD_REG_SET (impossible_start_hard_regs);
567 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
568 if (lra_reg_val_equal_p (conflict_regno, val, offset))
570 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
571 nregs = (hard_regno_nregs[conflict_hr]
572 [lra_reg_info[conflict_regno].biggest_mode]);
573 /* Remember about multi-register pseudos. For example, 2 hard
574 register pseudos can start on the same hard register but can
575 not start on HR and HR+1/HR-1. */
576 for (hr = conflict_hr + 1;
577 hr < FIRST_PSEUDO_REGISTER && hr < conflict_hr + nregs;
578 hr++)
579 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
580 for (hr = conflict_hr - 1;
581 hr >= 0 && hr + hard_regno_nregs[hr][biggest_mode] > conflict_hr;
582 hr--)
583 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
585 else
587 add_to_hard_reg_set (&conflict_set,
588 lra_reg_info[conflict_regno].biggest_mode,
589 live_pseudos_reg_renumber[conflict_regno]);
590 if (hard_reg_set_subset_p (reg_class_contents[rclass],
591 conflict_set))
592 return -1;
594 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos,
595 conflict_regno)
596 if (!lra_reg_val_equal_p (conflict_regno, val, offset))
598 lra_assert (live_pseudos_reg_renumber[conflict_regno] < 0);
599 if ((hard_regno
600 = lra_reg_info[conflict_regno].preferred_hard_regno1) >= 0)
602 adjust_hard_regno_cost
603 (hard_regno,
604 lra_reg_info[conflict_regno].preferred_hard_regno_profit1);
605 if ((hard_regno
606 = lra_reg_info[conflict_regno].preferred_hard_regno2) >= 0)
607 adjust_hard_regno_cost
608 (hard_regno,
609 lra_reg_info[conflict_regno].preferred_hard_regno_profit2);
612 /* Make sure that all registers in a multi-word pseudo belong to the
613 required class. */
614 IOR_COMPL_HARD_REG_SET (conflict_set, reg_class_contents[rclass]);
615 lra_assert (rclass != NO_REGS);
616 rclass_size = ira_class_hard_regs_num[rclass];
617 best_hard_regno = -1;
618 hard_regno = ira_class_hard_regs[rclass][0];
619 biggest_nregs = hard_regno_nregs[hard_regno][biggest_mode];
620 nregs_diff = (biggest_nregs
621 - hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)]);
622 COPY_HARD_REG_SET (available_regs, reg_class_contents[rclass]);
623 AND_COMPL_HARD_REG_SET (available_regs, lra_no_alloc_regs);
624 for (i = 0; i < rclass_size; i++)
626 if (try_only_hard_regno >= 0)
627 hard_regno = try_only_hard_regno;
628 else
629 hard_regno = ira_class_hard_regs[rclass][i];
630 if (! overlaps_hard_reg_set_p (conflict_set,
631 PSEUDO_REGNO_MODE (regno), hard_regno)
632 /* We can not use prohibited_class_mode_regs because it is
633 not defined for all classes. */
634 && HARD_REGNO_MODE_OK (hard_regno, PSEUDO_REGNO_MODE (regno))
635 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
636 && (nregs_diff == 0
637 || (WORDS_BIG_ENDIAN
638 ? (hard_regno - nregs_diff >= 0
639 && TEST_HARD_REG_BIT (available_regs,
640 hard_regno - nregs_diff))
641 : TEST_HARD_REG_BIT (available_regs,
642 hard_regno + nregs_diff))))
644 if (hard_regno_costs_check[hard_regno]
645 != curr_hard_regno_costs_check)
647 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
648 hard_regno_costs[hard_regno] = 0;
650 for (j = 0;
651 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
652 j++)
653 if (! TEST_HARD_REG_BIT (call_used_reg_set, hard_regno + j)
654 && ! df_regs_ever_live_p (hard_regno + j))
655 /* It needs save restore. */
656 hard_regno_costs[hard_regno]
657 += (2
658 * REG_FREQ_FROM_BB (ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
659 + 1);
660 priority = targetm.register_priority (hard_regno);
661 if (best_hard_regno < 0 || hard_regno_costs[hard_regno] < best_cost
662 || (hard_regno_costs[hard_regno] == best_cost
663 && (priority > best_priority
664 || (targetm.register_usage_leveling_p ()
665 && priority == best_priority
666 && best_usage > lra_hard_reg_usage[hard_regno]))))
668 best_hard_regno = hard_regno;
669 best_cost = hard_regno_costs[hard_regno];
670 best_priority = priority;
671 best_usage = lra_hard_reg_usage[hard_regno];
674 if (try_only_hard_regno >= 0 || (first_p && best_hard_regno >= 0))
675 break;
677 if (best_hard_regno >= 0)
678 *cost = best_cost - lra_reg_info[regno].freq;
679 return best_hard_regno;
682 /* A wrapper for find_hard_regno_for_1 (see comments for that function
683 description). This function tries to find a hard register for
684 preferred class first if it is worth. */
685 static int
686 find_hard_regno_for (int regno, int *cost, int try_only_hard_regno, bool first_p)
688 int hard_regno;
689 HARD_REG_SET regno_set;
691 /* Only original pseudos can have a different preferred class. */
692 if (try_only_hard_regno < 0 && regno < lra_new_regno_start)
694 enum reg_class pref_class = reg_preferred_class (regno);
696 if (regno_allocno_class_array[regno] != pref_class)
698 hard_regno = find_hard_regno_for_1 (regno, cost, -1, first_p,
699 reg_class_contents[pref_class]);
700 if (hard_regno >= 0)
701 return hard_regno;
704 CLEAR_HARD_REG_SET (regno_set);
705 return find_hard_regno_for_1 (regno, cost, try_only_hard_regno, first_p,
706 regno_set);
709 /* Current value used for checking elements in
710 update_hard_regno_preference_check. */
711 static int curr_update_hard_regno_preference_check;
712 /* If an element value is equal to the above variable value, then the
713 corresponding regno has been processed for preference
714 propagation. */
715 static int *update_hard_regno_preference_check;
717 /* Update the preference for using HARD_REGNO for pseudos that are
718 connected directly or indirectly with REGNO. Apply divisor DIV
719 to any preference adjustments.
721 The more indirectly a pseudo is connected, the smaller its effect
722 should be. We therefore increase DIV on each "hop". */
723 static void
724 update_hard_regno_preference (int regno, int hard_regno, int div)
726 int another_regno, cost;
727 lra_copy_t cp, next_cp;
729 /* Search depth 5 seems to be enough. */
730 if (div > (1 << 5))
731 return;
732 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
734 if (cp->regno1 == regno)
736 next_cp = cp->regno1_next;
737 another_regno = cp->regno2;
739 else if (cp->regno2 == regno)
741 next_cp = cp->regno2_next;
742 another_regno = cp->regno1;
744 else
745 gcc_unreachable ();
746 if (reg_renumber[another_regno] < 0
747 && (update_hard_regno_preference_check[another_regno]
748 != curr_update_hard_regno_preference_check))
750 update_hard_regno_preference_check[another_regno]
751 = curr_update_hard_regno_preference_check;
752 cost = cp->freq < div ? 1 : cp->freq / div;
753 lra_setup_reload_pseudo_preferenced_hard_reg
754 (another_regno, hard_regno, cost);
755 update_hard_regno_preference (another_regno, hard_regno, div * 2);
760 /* Return prefix title for pseudo REGNO. */
761 static const char *
762 pseudo_prefix_title (int regno)
764 return
765 (regno < lra_constraint_new_regno_start ? ""
766 : bitmap_bit_p (&lra_inheritance_pseudos, regno) ? "inheritance "
767 : bitmap_bit_p (&lra_split_regs, regno) ? "split "
768 : bitmap_bit_p (&lra_optional_reload_pseudos, regno) ? "optional reload "
769 : bitmap_bit_p (&lra_subreg_reload_pseudos, regno) ? "subreg reload "
770 : "reload ");
773 /* Update REG_RENUMBER and other pseudo preferences by assignment of
774 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
775 void
776 lra_setup_reg_renumber (int regno, int hard_regno, bool print_p)
778 int i, hr;
780 /* We can not just reassign hard register. */
781 lra_assert (hard_regno < 0 || reg_renumber[regno] < 0);
782 if ((hr = hard_regno) < 0)
783 hr = reg_renumber[regno];
784 reg_renumber[regno] = hard_regno;
785 lra_assert (hr >= 0);
786 for (i = 0; i < hard_regno_nregs[hr][PSEUDO_REGNO_MODE (regno)]; i++)
787 if (hard_regno < 0)
788 lra_hard_reg_usage[hr + i] -= lra_reg_info[regno].freq;
789 else
790 lra_hard_reg_usage[hr + i] += lra_reg_info[regno].freq;
791 if (print_p && lra_dump_file != NULL)
792 fprintf (lra_dump_file, " Assign %d to %sr%d (freq=%d)\n",
793 reg_renumber[regno], pseudo_prefix_title (regno),
794 regno, lra_reg_info[regno].freq);
795 if (hard_regno >= 0)
797 curr_update_hard_regno_preference_check++;
798 update_hard_regno_preference (regno, hard_regno, 1);
802 /* Pseudos which occur in insns containing a particular pseudo. */
803 static bitmap_head insn_conflict_pseudos;
805 /* Bitmaps used to contain spill pseudos for given pseudo hard regno
806 and best spill pseudos for given pseudo (and best hard regno). */
807 static bitmap_head spill_pseudos_bitmap, best_spill_pseudos_bitmap;
809 /* Current pseudo check for validity of elements in
810 TRY_HARD_REG_PSEUDOS. */
811 static int curr_pseudo_check;
812 /* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
813 static int try_hard_reg_pseudos_check[FIRST_PSEUDO_REGISTER];
814 /* Pseudos who hold given hard register at the considered points. */
815 static bitmap_head try_hard_reg_pseudos[FIRST_PSEUDO_REGISTER];
817 /* Set up try_hard_reg_pseudos for given program point P and class
818 RCLASS. Those are pseudos living at P and assigned to a hard
819 register of RCLASS. In other words, those are pseudos which can be
820 spilled to assign a hard register of RCLASS to a pseudo living at
821 P. */
822 static void
823 setup_try_hard_regno_pseudos (int p, enum reg_class rclass)
825 int i, hard_regno;
826 machine_mode mode;
827 unsigned int spill_regno;
828 bitmap_iterator bi;
830 /* Find what pseudos could be spilled. */
831 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[p], 0, spill_regno, bi)
833 mode = PSEUDO_REGNO_MODE (spill_regno);
834 hard_regno = live_pseudos_reg_renumber[spill_regno];
835 if (overlaps_hard_reg_set_p (reg_class_contents[rclass],
836 mode, hard_regno))
838 for (i = hard_regno_nregs[hard_regno][mode] - 1; i >= 0; i--)
840 if (try_hard_reg_pseudos_check[hard_regno + i]
841 != curr_pseudo_check)
843 try_hard_reg_pseudos_check[hard_regno + i]
844 = curr_pseudo_check;
845 bitmap_clear (&try_hard_reg_pseudos[hard_regno + i]);
847 bitmap_set_bit (&try_hard_reg_pseudos[hard_regno + i],
848 spill_regno);
854 /* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
855 assignment means that we might undo the data change. */
856 static void
857 assign_temporarily (int regno, int hard_regno)
859 int p;
860 lra_live_range_t r;
862 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
864 for (p = r->start; p <= r->finish; p++)
865 if (hard_regno < 0)
866 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
867 else
869 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
870 insert_in_live_range_start_chain (regno);
873 live_pseudos_reg_renumber[regno] = hard_regno;
876 /* Array used for sorting reload pseudos for subsequent allocation
877 after spilling some pseudo. */
878 static int *sorted_reload_pseudos;
880 /* Spill some pseudos for a reload pseudo REGNO and return hard
881 register which should be used for pseudo after spilling. The
882 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
883 choose hard register (and pseudos occupying the hard registers and
884 to be spilled), we take into account not only how REGNO will
885 benefit from the spills but also how other reload pseudos not yet
886 assigned to hard registers benefit from the spills too. In very
887 rare cases, the function can fail and return -1.
889 If FIRST_P, return the first available hard reg ignoring other
890 criteria, e.g. allocation cost and cost of spilling non-reload
891 pseudos. This approach results in less hard reg pool fragmentation
892 and permit to allocate hard regs to reload pseudos in complicated
893 situations where pseudo sizes are different. */
894 static int
895 spill_for (int regno, bitmap spilled_pseudo_bitmap, bool first_p)
897 int i, j, n, p, hard_regno, best_hard_regno, cost, best_cost, rclass_size;
898 int reload_hard_regno, reload_cost;
899 machine_mode mode;
900 enum reg_class rclass;
901 unsigned int spill_regno, reload_regno, uid;
902 int insn_pseudos_num, best_insn_pseudos_num;
903 int bad_spills_num, smallest_bad_spills_num;
904 lra_live_range_t r;
905 bitmap_iterator bi;
907 rclass = regno_allocno_class_array[regno];
908 lra_assert (reg_renumber[regno] < 0 && rclass != NO_REGS);
909 bitmap_clear (&insn_conflict_pseudos);
910 bitmap_clear (&best_spill_pseudos_bitmap);
911 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
913 struct lra_insn_reg *ir;
915 for (ir = lra_get_insn_regs (uid); ir != NULL; ir = ir->next)
916 if (ir->regno >= FIRST_PSEUDO_REGISTER)
917 bitmap_set_bit (&insn_conflict_pseudos, ir->regno);
919 best_hard_regno = -1;
920 best_cost = INT_MAX;
921 best_insn_pseudos_num = INT_MAX;
922 smallest_bad_spills_num = INT_MAX;
923 rclass_size = ira_class_hard_regs_num[rclass];
924 mode = PSEUDO_REGNO_MODE (regno);
925 /* Invalidate try_hard_reg_pseudos elements. */
926 curr_pseudo_check++;
927 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
928 for (p = r->start; p <= r->finish; p++)
929 setup_try_hard_regno_pseudos (p, rclass);
930 for (i = 0; i < rclass_size; i++)
932 hard_regno = ira_class_hard_regs[rclass][i];
933 bitmap_clear (&spill_pseudos_bitmap);
934 for (j = hard_regno_nregs[hard_regno][mode] - 1; j >= 0; j--)
936 if (try_hard_reg_pseudos_check[hard_regno + j] != curr_pseudo_check)
937 continue;
938 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos[hard_regno + j]));
939 bitmap_ior_into (&spill_pseudos_bitmap,
940 &try_hard_reg_pseudos[hard_regno + j]);
942 /* Spill pseudos. */
943 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
944 if ((pic_offset_table_rtx != NULL
945 && spill_regno == REGNO (pic_offset_table_rtx))
946 || ((int) spill_regno >= lra_constraint_new_regno_start
947 && ! bitmap_bit_p (&lra_inheritance_pseudos, spill_regno)
948 && ! bitmap_bit_p (&lra_split_regs, spill_regno)
949 && ! bitmap_bit_p (&lra_subreg_reload_pseudos, spill_regno)
950 && ! bitmap_bit_p (&lra_optional_reload_pseudos, spill_regno)))
951 goto fail;
952 insn_pseudos_num = 0;
953 bad_spills_num = 0;
954 if (lra_dump_file != NULL)
955 fprintf (lra_dump_file, " Trying %d:", hard_regno);
956 sparseset_clear (live_range_reload_inheritance_pseudos);
957 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
959 if (bitmap_bit_p (&insn_conflict_pseudos, spill_regno))
960 insn_pseudos_num++;
961 if (spill_regno >= (unsigned int) lra_bad_spill_regno_start)
962 bad_spills_num++;
963 for (r = lra_reg_info[spill_regno].live_ranges;
964 r != NULL;
965 r = r->next)
967 for (p = r->start; p <= r->finish; p++)
969 lra_live_range_t r2;
971 for (r2 = start_point_ranges[p];
972 r2 != NULL;
973 r2 = r2->start_next)
974 if (r2->regno >= lra_constraint_new_regno_start)
975 sparseset_set_bit (live_range_reload_inheritance_pseudos,
976 r2->regno);
980 n = 0;
981 if (sparseset_cardinality (live_range_reload_inheritance_pseudos)
982 <= (unsigned)LRA_MAX_CONSIDERED_RELOAD_PSEUDOS)
983 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos,
984 reload_regno)
985 if ((int) reload_regno != regno
986 && (ira_reg_classes_intersect_p
987 [rclass][regno_allocno_class_array[reload_regno]])
988 && live_pseudos_reg_renumber[reload_regno] < 0
989 && find_hard_regno_for (reload_regno, &cost, -1, first_p) < 0)
990 sorted_reload_pseudos[n++] = reload_regno;
991 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
993 update_lives (spill_regno, true);
994 if (lra_dump_file != NULL)
995 fprintf (lra_dump_file, " spill %d(freq=%d)",
996 spill_regno, lra_reg_info[spill_regno].freq);
998 hard_regno = find_hard_regno_for (regno, &cost, -1, first_p);
999 if (hard_regno >= 0)
1001 assign_temporarily (regno, hard_regno);
1002 qsort (sorted_reload_pseudos, n, sizeof (int),
1003 reload_pseudo_compare_func);
1004 for (j = 0; j < n; j++)
1006 reload_regno = sorted_reload_pseudos[j];
1007 lra_assert (live_pseudos_reg_renumber[reload_regno] < 0);
1008 if ((reload_hard_regno
1009 = find_hard_regno_for (reload_regno,
1010 &reload_cost, -1, first_p)) >= 0)
1012 if (lra_dump_file != NULL)
1013 fprintf (lra_dump_file, " assign %d(cost=%d)",
1014 reload_regno, reload_cost);
1015 assign_temporarily (reload_regno, reload_hard_regno);
1016 cost += reload_cost;
1019 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1021 rtx_insn_list *x;
1023 cost += lra_reg_info[spill_regno].freq;
1024 if (ira_reg_equiv[spill_regno].memory != NULL
1025 || ira_reg_equiv[spill_regno].constant != NULL)
1026 for (x = ira_reg_equiv[spill_regno].init_insns;
1027 x != NULL;
1028 x = x->next ())
1029 cost -= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (x->insn ()));
1031 if (best_insn_pseudos_num > insn_pseudos_num
1032 || (best_insn_pseudos_num == insn_pseudos_num
1033 && (bad_spills_num < smallest_bad_spills_num
1034 || (bad_spills_num == smallest_bad_spills_num
1035 && best_cost > cost))))
1037 best_insn_pseudos_num = insn_pseudos_num;
1038 smallest_bad_spills_num = bad_spills_num;
1039 best_cost = cost;
1040 best_hard_regno = hard_regno;
1041 bitmap_copy (&best_spill_pseudos_bitmap, &spill_pseudos_bitmap);
1042 if (lra_dump_file != NULL)
1043 fprintf (lra_dump_file,
1044 " Now best %d(cost=%d, bad_spills=%d, insn_pseudos=%d)\n",
1045 hard_regno, cost, bad_spills_num, insn_pseudos_num);
1047 assign_temporarily (regno, -1);
1048 for (j = 0; j < n; j++)
1050 reload_regno = sorted_reload_pseudos[j];
1051 if (live_pseudos_reg_renumber[reload_regno] >= 0)
1052 assign_temporarily (reload_regno, -1);
1055 if (lra_dump_file != NULL)
1056 fprintf (lra_dump_file, "\n");
1057 /* Restore the live hard reg pseudo info for spilled pseudos. */
1058 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1059 update_lives (spill_regno, false);
1060 fail:
1063 /* Spill: */
1064 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap, 0, spill_regno, bi)
1066 if ((int) spill_regno >= lra_constraint_new_regno_start)
1067 former_reload_pseudo_spill_p = true;
1068 if (lra_dump_file != NULL)
1069 fprintf (lra_dump_file, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
1070 pseudo_prefix_title (spill_regno),
1071 spill_regno, reg_renumber[spill_regno],
1072 lra_reg_info[spill_regno].freq, regno);
1073 update_lives (spill_regno, true);
1074 lra_setup_reg_renumber (spill_regno, -1, false);
1076 bitmap_ior_into (spilled_pseudo_bitmap, &best_spill_pseudos_bitmap);
1077 return best_hard_regno;
1080 /* Assign HARD_REGNO to REGNO. */
1081 static void
1082 assign_hard_regno (int hard_regno, int regno)
1084 int i;
1086 lra_assert (hard_regno >= 0);
1087 lra_setup_reg_renumber (regno, hard_regno, true);
1088 update_lives (regno, false);
1089 for (i = 0;
1090 i < hard_regno_nregs[hard_regno][lra_reg_info[regno].biggest_mode];
1091 i++)
1092 df_set_regs_ever_live (hard_regno + i, true);
1095 /* Array used for sorting different pseudos. */
1096 static int *sorted_pseudos;
1098 /* The constraints pass is allowed to create equivalences between
1099 pseudos that make the current allocation "incorrect" (in the sense
1100 that pseudos are assigned to hard registers from their own conflict
1101 sets). The global variable lra_risky_transformations_p says
1102 whether this might have happened.
1104 Process pseudos assigned to hard registers (less frequently used
1105 first), spill if a conflict is found, and mark the spilled pseudos
1106 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1107 pseudos, assigned to hard registers. */
1108 static void
1109 setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1110 spilled_pseudo_bitmap)
1112 int p, i, j, n, regno, hard_regno;
1113 unsigned int k, conflict_regno;
1114 int val, offset;
1115 HARD_REG_SET conflict_set;
1116 machine_mode mode;
1117 lra_live_range_t r;
1118 bitmap_iterator bi;
1119 int max_regno = max_reg_num ();
1121 if (! lra_risky_transformations_p)
1123 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1124 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1125 update_lives (i, false);
1126 return;
1128 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1129 if ((pic_offset_table_rtx == NULL_RTX
1130 || i != (int) REGNO (pic_offset_table_rtx))
1131 && reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1132 sorted_pseudos[n++] = i;
1133 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1134 if (pic_offset_table_rtx != NULL_RTX
1135 && (regno = REGNO (pic_offset_table_rtx)) >= FIRST_PSEUDO_REGISTER
1136 && reg_renumber[regno] >= 0 && lra_reg_info[regno].nrefs > 0)
1137 sorted_pseudos[n++] = regno;
1138 for (i = n - 1; i >= 0; i--)
1140 regno = sorted_pseudos[i];
1141 hard_regno = reg_renumber[regno];
1142 lra_assert (hard_regno >= 0);
1143 mode = lra_reg_info[regno].biggest_mode;
1144 sparseset_clear (live_range_hard_reg_pseudos);
1145 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1147 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1148 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1149 for (p = r->start + 1; p <= r->finish; p++)
1151 lra_live_range_t r2;
1153 for (r2 = start_point_ranges[p];
1154 r2 != NULL;
1155 r2 = r2->start_next)
1156 if (live_pseudos_reg_renumber[r2->regno] >= 0)
1157 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1160 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
1161 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
1162 val = lra_reg_info[regno].val;
1163 offset = lra_reg_info[regno].offset;
1164 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1165 if (!lra_reg_val_equal_p (conflict_regno, val, offset)
1166 /* If it is multi-register pseudos they should start on
1167 the same hard register. */
1168 || hard_regno != reg_renumber[conflict_regno])
1169 add_to_hard_reg_set (&conflict_set,
1170 lra_reg_info[conflict_regno].biggest_mode,
1171 reg_renumber[conflict_regno]);
1172 if (! overlaps_hard_reg_set_p (conflict_set, mode, hard_regno))
1174 update_lives (regno, false);
1175 continue;
1177 bitmap_set_bit (spilled_pseudo_bitmap, regno);
1178 for (j = 0;
1179 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
1180 j++)
1181 lra_hard_reg_usage[hard_regno + j] -= lra_reg_info[regno].freq;
1182 reg_renumber[regno] = -1;
1183 if (regno >= lra_constraint_new_regno_start)
1184 former_reload_pseudo_spill_p = true;
1185 if (lra_dump_file != NULL)
1186 fprintf (lra_dump_file, " Spill r%d after risky transformations\n",
1187 regno);
1191 /* Improve allocation by assigning the same hard regno of inheritance
1192 pseudos to the connected pseudos. We need this because inheritance
1193 pseudos are allocated after reload pseudos in the thread and when
1194 we assign a hard register to a reload pseudo we don't know yet that
1195 the connected inheritance pseudos can get the same hard register.
1196 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1197 static void
1198 improve_inheritance (bitmap changed_pseudos)
1200 unsigned int k;
1201 int regno, another_regno, hard_regno, another_hard_regno, cost, i, n;
1202 lra_copy_t cp, next_cp;
1203 bitmap_iterator bi;
1205 if (lra_inheritance_iter > LRA_MAX_INHERITANCE_PASSES)
1206 return;
1207 n = 0;
1208 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, k, bi)
1209 if (reg_renumber[k] >= 0 && lra_reg_info[k].nrefs != 0)
1210 sorted_pseudos[n++] = k;
1211 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1212 for (i = 0; i < n; i++)
1214 regno = sorted_pseudos[i];
1215 hard_regno = reg_renumber[regno];
1216 lra_assert (hard_regno >= 0);
1217 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
1219 if (cp->regno1 == regno)
1221 next_cp = cp->regno1_next;
1222 another_regno = cp->regno2;
1224 else if (cp->regno2 == regno)
1226 next_cp = cp->regno2_next;
1227 another_regno = cp->regno1;
1229 else
1230 gcc_unreachable ();
1231 /* Don't change reload pseudo allocation. It might have
1232 this allocation for a purpose and changing it can result
1233 in LRA cycling. */
1234 if ((another_regno < lra_constraint_new_regno_start
1235 || bitmap_bit_p (&lra_inheritance_pseudos, another_regno))
1236 && (another_hard_regno = reg_renumber[another_regno]) >= 0
1237 && another_hard_regno != hard_regno)
1239 if (lra_dump_file != NULL)
1240 fprintf
1241 (lra_dump_file,
1242 " Improving inheritance for %d(%d) and %d(%d)...\n",
1243 regno, hard_regno, another_regno, another_hard_regno);
1244 update_lives (another_regno, true);
1245 lra_setup_reg_renumber (another_regno, -1, false);
1246 if (hard_regno == find_hard_regno_for (another_regno, &cost,
1247 hard_regno, false))
1248 assign_hard_regno (hard_regno, another_regno);
1249 else
1250 assign_hard_regno (another_hard_regno, another_regno);
1251 bitmap_set_bit (changed_pseudos, another_regno);
1258 /* Bitmap finally containing all pseudos spilled on this assignment
1259 pass. */
1260 static bitmap_head all_spilled_pseudos;
1261 /* All pseudos whose allocation was changed. */
1262 static bitmap_head changed_pseudo_bitmap;
1265 /* Add to LIVE_RANGE_HARD_REG_PSEUDOS all pseudos conflicting with
1266 REGNO and whose hard regs can be assigned to REGNO. */
1267 static void
1268 find_all_spills_for (int regno)
1270 int p;
1271 lra_live_range_t r;
1272 unsigned int k;
1273 bitmap_iterator bi;
1274 enum reg_class rclass;
1275 bool *rclass_intersect_p;
1277 rclass = regno_allocno_class_array[regno];
1278 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
1279 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1281 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1282 if (rclass_intersect_p[regno_allocno_class_array[k]])
1283 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1284 for (p = r->start + 1; p <= r->finish; p++)
1286 lra_live_range_t r2;
1288 for (r2 = start_point_ranges[p];
1289 r2 != NULL;
1290 r2 = r2->start_next)
1292 if (live_pseudos_reg_renumber[r2->regno] >= 0
1293 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
1294 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1300 /* Assign hard registers to reload pseudos and other pseudos. */
1301 static void
1302 assign_by_spills (void)
1304 int i, n, nfails, iter, regno, hard_regno, cost, restore_regno;
1305 rtx_insn *insn;
1306 bitmap_head changed_insns, do_not_assign_nonreload_pseudos;
1307 unsigned int u, conflict_regno;
1308 bitmap_iterator bi;
1309 bool reload_p;
1310 int max_regno = max_reg_num ();
1312 for (n = 0, i = lra_constraint_new_regno_start; i < max_regno; i++)
1313 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1314 && regno_allocno_class_array[i] != NO_REGS)
1315 sorted_pseudos[n++] = i;
1316 bitmap_initialize (&insn_conflict_pseudos, &reg_obstack);
1317 bitmap_initialize (&spill_pseudos_bitmap, &reg_obstack);
1318 bitmap_initialize (&best_spill_pseudos_bitmap, &reg_obstack);
1319 update_hard_regno_preference_check = XCNEWVEC (int, max_regno);
1320 curr_update_hard_regno_preference_check = 0;
1321 memset (try_hard_reg_pseudos_check, 0, sizeof (try_hard_reg_pseudos_check));
1322 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1323 bitmap_initialize (&try_hard_reg_pseudos[i], &reg_obstack);
1324 curr_pseudo_check = 0;
1325 bitmap_initialize (&changed_insns, &reg_obstack);
1326 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1327 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
1328 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
1329 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
1330 for (iter = 0; iter <= 1; iter++)
1332 qsort (sorted_pseudos, n, sizeof (int), reload_pseudo_compare_func);
1333 nfails = 0;
1334 for (i = 0; i < n; i++)
1336 regno = sorted_pseudos[i];
1337 if (lra_dump_file != NULL)
1338 fprintf (lra_dump_file, " Assigning to %d "
1339 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1340 regno, reg_class_names[regno_allocno_class_array[regno]],
1341 ORIGINAL_REGNO (regno_reg_rtx[regno]),
1342 lra_reg_info[regno].freq, regno_assign_info[regno].first,
1343 regno_assign_info[regno_assign_info[regno].first].freq);
1344 hard_regno = find_hard_regno_for (regno, &cost, -1, iter == 1);
1345 reload_p = ! bitmap_bit_p (&non_reload_pseudos, regno);
1346 if (hard_regno < 0 && reload_p)
1347 hard_regno = spill_for (regno, &all_spilled_pseudos, iter == 1);
1348 if (hard_regno < 0)
1350 if (reload_p)
1351 sorted_pseudos[nfails++] = regno;
1353 else
1355 /* This register might have been spilled by the previous
1356 pass. Indicate that it is no longer spilled. */
1357 bitmap_clear_bit (&all_spilled_pseudos, regno);
1358 assign_hard_regno (hard_regno, regno);
1359 if (! reload_p)
1360 /* As non-reload pseudo assignment is changed we
1361 should reconsider insns referring for the
1362 pseudo. */
1363 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1366 if (nfails == 0)
1367 break;
1368 if (iter > 0)
1370 /* We did not assign hard regs to reload pseudos after two iterations.
1371 Either it's an asm and something is wrong with the constraints, or
1372 we have run out of spill registers; error out in either case. */
1373 bool asm_p = false;
1374 bitmap_head failed_reload_insns;
1376 bitmap_initialize (&failed_reload_insns, &reg_obstack);
1377 for (i = 0; i < nfails; i++)
1379 regno = sorted_pseudos[i];
1380 bitmap_ior_into (&failed_reload_insns,
1381 &lra_reg_info[regno].insn_bitmap);
1382 /* Assign an arbitrary hard register of regno class to
1383 avoid further trouble with this insn. */
1384 bitmap_clear_bit (&all_spilled_pseudos, regno);
1385 assign_hard_regno
1386 (ira_class_hard_regs[regno_allocno_class_array[regno]][0],
1387 regno);
1389 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns, 0, u, bi)
1391 insn = lra_insn_recog_data[u]->insn;
1392 if (asm_noperands (PATTERN (insn)) >= 0)
1394 asm_p = true;
1395 error_for_asm (insn,
1396 "%<asm%> operand has impossible constraints");
1397 /* Avoid further trouble with this insn.
1398 For asm goto, instead of fixing up all the edges
1399 just clear the template and clear input operands
1400 (asm goto doesn't have any output operands). */
1401 if (JUMP_P (insn))
1403 rtx asm_op = extract_asm_operands (PATTERN (insn));
1404 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1405 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1406 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1407 lra_update_insn_regno_info (insn);
1409 else
1411 PATTERN (insn) = gen_rtx_USE (VOIDmode, const0_rtx);
1412 lra_set_insn_deleted (insn);
1415 else if (!asm_p)
1417 error ("unable to find a register to spill");
1418 fatal_insn ("this is the insn:", insn);
1421 break;
1423 /* This is a very rare event. We can not assign a hard register
1424 to reload pseudo because the hard register was assigned to
1425 another reload pseudo on a previous assignment pass. For x86
1426 example, on the 1st pass we assigned CX (although another
1427 hard register could be used for this) to reload pseudo in an
1428 insn, on the 2nd pass we need CX (and only this) hard
1429 register for a new reload pseudo in the same insn. Another
1430 possible situation may occur in assigning to multi-regs
1431 reload pseudos when hard regs pool is too fragmented even
1432 after spilling non-reload pseudos.
1434 We should do something radical here to succeed. Here we
1435 spill *all* conflicting pseudos and reassign them. */
1436 if (lra_dump_file != NULL)
1437 fprintf (lra_dump_file, " 2nd iter for reload pseudo assignments:\n");
1438 sparseset_clear (live_range_hard_reg_pseudos);
1439 for (i = 0; i < nfails; i++)
1441 if (lra_dump_file != NULL)
1442 fprintf (lra_dump_file, " Reload r%d assignment failure\n",
1443 sorted_pseudos[i]);
1444 find_all_spills_for (sorted_pseudos[i]);
1446 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1448 if ((int) conflict_regno >= lra_constraint_new_regno_start)
1450 sorted_pseudos[nfails++] = conflict_regno;
1451 former_reload_pseudo_spill_p = true;
1453 if (lra_dump_file != NULL)
1454 fprintf (lra_dump_file, " Spill %s r%d(hr=%d, freq=%d)\n",
1455 pseudo_prefix_title (conflict_regno), conflict_regno,
1456 reg_renumber[conflict_regno],
1457 lra_reg_info[conflict_regno].freq);
1458 update_lives (conflict_regno, true);
1459 lra_setup_reg_renumber (conflict_regno, -1, false);
1461 n = nfails;
1463 improve_inheritance (&changed_pseudo_bitmap);
1464 bitmap_clear (&non_reload_pseudos);
1465 bitmap_clear (&changed_insns);
1466 if (! lra_simple_p)
1468 /* We should not assign to original pseudos of inheritance
1469 pseudos or split pseudos if any its inheritance pseudo did
1470 not get hard register or any its split pseudo was not split
1471 because undo inheritance/split pass will extend live range of
1472 such inheritance or split pseudos. */
1473 bitmap_initialize (&do_not_assign_nonreload_pseudos, &reg_obstack);
1474 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, u, bi)
1475 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1476 && reg_renumber[u] < 0
1477 && bitmap_bit_p (&lra_inheritance_pseudos, u))
1478 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1479 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs, 0, u, bi)
1480 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1481 && reg_renumber[u] >= 0)
1482 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1483 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1484 if (((i < lra_constraint_new_regno_start
1485 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos, i))
1486 || (bitmap_bit_p (&lra_inheritance_pseudos, i)
1487 && lra_reg_info[i].restore_regno >= 0)
1488 || (bitmap_bit_p (&lra_split_regs, i)
1489 && lra_reg_info[i].restore_regno >= 0)
1490 || bitmap_bit_p (&lra_subreg_reload_pseudos, i)
1491 || bitmap_bit_p (&lra_optional_reload_pseudos, i))
1492 && reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1493 && regno_allocno_class_array[i] != NO_REGS)
1494 sorted_pseudos[n++] = i;
1495 bitmap_clear (&do_not_assign_nonreload_pseudos);
1496 if (n != 0 && lra_dump_file != NULL)
1497 fprintf (lra_dump_file, " Reassigning non-reload pseudos\n");
1498 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1499 for (i = 0; i < n; i++)
1501 regno = sorted_pseudos[i];
1502 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1503 if (hard_regno >= 0)
1505 assign_hard_regno (hard_regno, regno);
1506 /* We change allocation for non-reload pseudo on this
1507 iteration -- mark the pseudo for invalidation of used
1508 alternatives of insns containing the pseudo. */
1509 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1511 else
1513 enum reg_class rclass = lra_get_allocno_class (regno);
1514 enum reg_class spill_class;
1516 if (targetm.spill_class == NULL
1517 || lra_reg_info[regno].restore_regno < 0
1518 || ! bitmap_bit_p (&lra_inheritance_pseudos, regno)
1519 || (spill_class
1520 = ((enum reg_class)
1521 targetm.spill_class
1522 ((reg_class_t) rclass,
1523 PSEUDO_REGNO_MODE (regno)))) == NO_REGS)
1524 continue;
1525 regno_allocno_class_array[regno] = spill_class;
1526 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1527 if (hard_regno < 0)
1528 regno_allocno_class_array[regno] = rclass;
1529 else
1531 setup_reg_classes
1532 (regno, spill_class, spill_class, spill_class);
1533 assign_hard_regno (hard_regno, regno);
1534 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1539 free (update_hard_regno_preference_check);
1540 bitmap_clear (&best_spill_pseudos_bitmap);
1541 bitmap_clear (&spill_pseudos_bitmap);
1542 bitmap_clear (&insn_conflict_pseudos);
1546 /* Entry function to assign hard registers to new reload pseudos
1547 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1548 of old pseudos) and possibly to the old pseudos. The function adds
1549 what insns to process for the next constraint pass. Those are all
1550 insns who contains non-reload and non-inheritance pseudos with
1551 changed allocation.
1553 Return true if we did not spill any non-reload and non-inheritance
1554 pseudos. */
1555 bool
1556 lra_assign (void)
1558 int i;
1559 unsigned int u;
1560 bitmap_iterator bi;
1561 bitmap_head insns_to_process;
1562 bool no_spills_p;
1563 int max_regno = max_reg_num ();
1565 timevar_push (TV_LRA_ASSIGN);
1566 lra_assignment_iter++;
1567 if (lra_dump_file != NULL)
1568 fprintf (lra_dump_file, "\n********** Assignment #%d: **********\n\n",
1569 lra_assignment_iter);
1570 init_lives ();
1571 sorted_pseudos = XNEWVEC (int, max_regno);
1572 sorted_reload_pseudos = XNEWVEC (int, max_regno);
1573 regno_allocno_class_array = XNEWVEC (enum reg_class, max_regno);
1574 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1575 regno_allocno_class_array[i] = lra_get_allocno_class (i);
1576 former_reload_pseudo_spill_p = false;
1577 init_regno_assign_info ();
1578 bitmap_initialize (&all_spilled_pseudos, &reg_obstack);
1579 create_live_range_start_chains ();
1580 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos);
1581 #ifdef ENABLE_CHECKING
1582 if (!flag_ipa_ra)
1583 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1584 if (lra_reg_info[i].nrefs != 0 && reg_renumber[i] >= 0
1585 && lra_reg_info[i].call_p
1586 && overlaps_hard_reg_set_p (call_used_reg_set,
1587 PSEUDO_REGNO_MODE (i), reg_renumber[i]))
1588 gcc_unreachable ();
1589 #endif
1590 /* Setup insns to process on the next constraint pass. */
1591 bitmap_initialize (&changed_pseudo_bitmap, &reg_obstack);
1592 init_live_reload_and_inheritance_pseudos ();
1593 assign_by_spills ();
1594 finish_live_reload_and_inheritance_pseudos ();
1595 bitmap_ior_into (&changed_pseudo_bitmap, &all_spilled_pseudos);
1596 no_spills_p = true;
1597 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos, 0, u, bi)
1598 /* We ignore spilled pseudos created on last inheritance pass
1599 because they will be removed. */
1600 if (lra_reg_info[u].restore_regno < 0)
1602 no_spills_p = false;
1603 break;
1605 finish_live_range_start_chains ();
1606 bitmap_clear (&all_spilled_pseudos);
1607 bitmap_initialize (&insns_to_process, &reg_obstack);
1608 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap, 0, u, bi)
1609 bitmap_ior_into (&insns_to_process, &lra_reg_info[u].insn_bitmap);
1610 bitmap_clear (&changed_pseudo_bitmap);
1611 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process, 0, u, bi)
1613 lra_push_insn_by_uid (u);
1614 /* Invalidate alternatives for insn should be processed. */
1615 lra_set_used_insn_alternative_by_uid (u, -1);
1617 bitmap_clear (&insns_to_process);
1618 finish_regno_assign_info ();
1619 free (regno_allocno_class_array);
1620 free (sorted_pseudos);
1621 free (sorted_reload_pseudos);
1622 finish_lives ();
1623 timevar_pop (TV_LRA_ASSIGN);
1624 if (former_reload_pseudo_spill_p)
1625 lra_assignment_iter_after_spill++;
1626 if (lra_assignment_iter_after_spill > LRA_MAX_ASSIGNMENT_ITERATION_NUMBER)
1627 internal_error
1628 ("Maximum number of LRA assignment passes is achieved (%d)\n",
1629 LRA_MAX_ASSIGNMENT_ITERATION_NUMBER);
1630 return no_spills_p;