make recog () take a rtx_insn *
[official-gcc.git] / gcc / lra-assigns.c
blob936a16990ef243e268569d9d084d65f0e168a1d4
1 /* Assign reload pseudos.
2 Copyright (C) 2010-2016 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
22 /* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
36 and spill registers.
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
50 copies.
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
64 Only insns with changed allocation pseudos are processed on the
65 next constraint pass.
67 The pseudo live-ranges are used to find conflicting pseudos.
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
75 restore_regno. */
77 #include "config.h"
78 #include "system.h"
79 #include "coretypes.h"
80 #include "backend.h"
81 #include "target.h"
82 #include "rtl.h"
83 #include "tree.h"
84 #include "predict.h"
85 #include "df.h"
86 #include "memmodel.h"
87 #include "tm_p.h"
88 #include "insn-config.h"
89 #include "regs.h"
90 #include "ira.h"
91 #include "recog.h"
92 #include "rtl-error.h"
93 #include "sparseset.h"
94 #include "params.h"
95 #include "lra.h"
96 #include "lra-int.h"
98 /* Current iteration number of the pass and current iteration number
99 of the pass after the latest spill pass when any former reload
100 pseudo was spilled. */
101 int lra_assignment_iter;
102 int lra_assignment_iter_after_spill;
104 /* Flag of spilling former reload pseudos on this pass. */
105 static bool former_reload_pseudo_spill_p;
107 /* Array containing corresponding values of function
108 lra_get_allocno_class. It is used to speed up the code. */
109 static enum reg_class *regno_allocno_class_array;
111 /* Array containing lengths of pseudo live ranges. It is used to
112 speed up the code. */
113 static int *regno_live_length;
115 /* Information about the thread to which a pseudo belongs. Threads are
116 a set of connected reload and inheritance pseudos with the same set of
117 available hard registers. Lone registers belong to their own threads. */
118 struct regno_assign_info
120 /* First/next pseudo of the same thread. */
121 int first, next;
122 /* Frequency of the thread (execution frequency of only reload
123 pseudos in the thread when the thread contains a reload pseudo).
124 Defined only for the first thread pseudo. */
125 int freq;
128 /* Map regno to the corresponding regno assignment info. */
129 static struct regno_assign_info *regno_assign_info;
131 /* All inherited, subreg or optional pseudos created before last spill
132 sub-pass. Such pseudos are permitted to get memory instead of hard
133 regs. */
134 static bitmap_head non_reload_pseudos;
136 /* Process a pseudo copy with execution frequency COPY_FREQ connecting
137 REGNO1 and REGNO2 to form threads. */
138 static void
139 process_copy_to_form_thread (int regno1, int regno2, int copy_freq)
141 int last, regno1_first, regno2_first;
143 lra_assert (regno1 >= lra_constraint_new_regno_start
144 && regno2 >= lra_constraint_new_regno_start);
145 regno1_first = regno_assign_info[regno1].first;
146 regno2_first = regno_assign_info[regno2].first;
147 if (regno1_first != regno2_first)
149 for (last = regno2_first;
150 regno_assign_info[last].next >= 0;
151 last = regno_assign_info[last].next)
152 regno_assign_info[last].first = regno1_first;
153 regno_assign_info[last].first = regno1_first;
154 regno_assign_info[last].next = regno_assign_info[regno1_first].next;
155 regno_assign_info[regno1_first].next = regno2_first;
156 regno_assign_info[regno1_first].freq
157 += regno_assign_info[regno2_first].freq;
159 regno_assign_info[regno1_first].freq -= 2 * copy_freq;
160 lra_assert (regno_assign_info[regno1_first].freq >= 0);
163 /* Initialize REGNO_ASSIGN_INFO and form threads. */
164 static void
165 init_regno_assign_info (void)
167 int i, regno1, regno2, max_regno = max_reg_num ();
168 lra_copy_t cp;
170 regno_assign_info = XNEWVEC (struct regno_assign_info, max_regno);
171 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
173 regno_assign_info[i].first = i;
174 regno_assign_info[i].next = -1;
175 regno_assign_info[i].freq = lra_reg_info[i].freq;
177 /* Form the threads. */
178 for (i = 0; (cp = lra_get_copy (i)) != NULL; i++)
179 if ((regno1 = cp->regno1) >= lra_constraint_new_regno_start
180 && (regno2 = cp->regno2) >= lra_constraint_new_regno_start
181 && reg_renumber[regno1] < 0 && lra_reg_info[regno1].nrefs != 0
182 && reg_renumber[regno2] < 0 && lra_reg_info[regno2].nrefs != 0
183 && (ira_class_hard_regs_num[regno_allocno_class_array[regno1]]
184 == ira_class_hard_regs_num[regno_allocno_class_array[regno2]]))
185 process_copy_to_form_thread (regno1, regno2, cp->freq);
188 /* Free REGNO_ASSIGN_INFO. */
189 static void
190 finish_regno_assign_info (void)
192 free (regno_assign_info);
195 /* The function is used to sort *reload* and *inheritance* pseudos to
196 try to assign them hard registers. We put pseudos from the same
197 thread always nearby. */
198 static int
199 reload_pseudo_compare_func (const void *v1p, const void *v2p)
201 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
202 enum reg_class cl1 = regno_allocno_class_array[r1];
203 enum reg_class cl2 = regno_allocno_class_array[r2];
204 int diff;
206 lra_assert (r1 >= lra_constraint_new_regno_start
207 && r2 >= lra_constraint_new_regno_start);
209 /* Prefer to assign reload registers with smaller classes first to
210 guarantee assignment to all reload registers. */
211 if ((diff = (ira_class_hard_regs_num[cl1]
212 - ira_class_hard_regs_num[cl2])) != 0)
213 return diff;
214 if ((diff
215 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
216 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0
217 /* The code below executes rarely as nregs == 1 in most cases.
218 So we should not worry about using faster data structures to
219 check reload pseudos. */
220 && ! bitmap_bit_p (&non_reload_pseudos, r1)
221 && ! bitmap_bit_p (&non_reload_pseudos, r2))
222 return diff;
223 if ((diff = (regno_assign_info[regno_assign_info[r2].first].freq
224 - regno_assign_info[regno_assign_info[r1].first].freq)) != 0)
225 return diff;
226 /* Allocate bigger pseudos first to avoid register file
227 fragmentation. */
228 if ((diff
229 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
230 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0)
231 return diff;
232 /* Put pseudos from the thread nearby. */
233 if ((diff = regno_assign_info[r1].first - regno_assign_info[r2].first) != 0)
234 return diff;
235 /* Prefer pseudos with longer live ranges. It sets up better
236 prefered hard registers for the thread pseudos and decreases
237 register-register moves between the thread pseudos. */
238 if ((diff = regno_live_length[r2] - regno_live_length[r1]) != 0)
239 return diff;
240 /* If regs are equally good, sort by their numbers, so that the
241 results of qsort leave nothing to chance. */
242 return r1 - r2;
245 /* The function is used to sort *non-reload* pseudos to try to assign
246 them hard registers. The order calculation is simpler than in the
247 previous function and based on the pseudo frequency usage. */
248 static int
249 pseudo_compare_func (const void *v1p, const void *v2p)
251 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
252 int diff;
254 /* Assign hard reg to static chain pointer first pseudo when
255 non-local goto is used. */
256 if (non_spilled_static_chain_regno_p (r1))
257 return -1;
258 else if (non_spilled_static_chain_regno_p (r2))
259 return 1;
261 /* Prefer to assign more frequently used registers first. */
262 if ((diff = lra_reg_info[r2].freq - lra_reg_info[r1].freq) != 0)
263 return diff;
265 /* If regs are equally good, sort by their numbers, so that the
266 results of qsort leave nothing to chance. */
267 return r1 - r2;
270 /* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
271 pseudo live ranges with given start point. We insert only live
272 ranges of pseudos interesting for assignment purposes. They are
273 reload pseudos and pseudos assigned to hard registers. */
274 static lra_live_range_t *start_point_ranges;
276 /* Used as a flag that a live range is not inserted in the start point
277 chain. */
278 static struct lra_live_range not_in_chain_mark;
280 /* Create and set up START_POINT_RANGES. */
281 static void
282 create_live_range_start_chains (void)
284 int i, max_regno;
285 lra_live_range_t r;
287 start_point_ranges = XCNEWVEC (lra_live_range_t, lra_live_max_point);
288 max_regno = max_reg_num ();
289 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
290 if (i >= lra_constraint_new_regno_start || reg_renumber[i] >= 0)
292 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
294 r->start_next = start_point_ranges[r->start];
295 start_point_ranges[r->start] = r;
298 else
300 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
301 r->start_next = &not_in_chain_mark;
305 /* Insert live ranges of pseudo REGNO into start chains if they are
306 not there yet. */
307 static void
308 insert_in_live_range_start_chain (int regno)
310 lra_live_range_t r = lra_reg_info[regno].live_ranges;
312 if (r->start_next != &not_in_chain_mark)
313 return;
314 for (; r != NULL; r = r->next)
316 r->start_next = start_point_ranges[r->start];
317 start_point_ranges[r->start] = r;
321 /* Free START_POINT_RANGES. */
322 static void
323 finish_live_range_start_chains (void)
325 gcc_assert (start_point_ranges != NULL);
326 free (start_point_ranges);
327 start_point_ranges = NULL;
330 /* Map: program point -> bitmap of all pseudos living at the point and
331 assigned to hard registers. */
332 static bitmap_head *live_hard_reg_pseudos;
333 static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack;
335 /* reg_renumber corresponding to pseudos marked in
336 live_hard_reg_pseudos. reg_renumber might be not matched to
337 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
338 live_hard_reg_pseudos. */
339 static int *live_pseudos_reg_renumber;
341 /* Sparseset used to calculate living hard reg pseudos for some program
342 point range. */
343 static sparseset live_range_hard_reg_pseudos;
345 /* Sparseset used to calculate living reload/inheritance pseudos for
346 some program point range. */
347 static sparseset live_range_reload_inheritance_pseudos;
349 /* Allocate and initialize the data about living pseudos at program
350 points. */
351 static void
352 init_lives (void)
354 int i, max_regno = max_reg_num ();
356 live_range_hard_reg_pseudos = sparseset_alloc (max_regno);
357 live_range_reload_inheritance_pseudos = sparseset_alloc (max_regno);
358 live_hard_reg_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
359 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack);
360 for (i = 0; i < lra_live_max_point; i++)
361 bitmap_initialize (&live_hard_reg_pseudos[i],
362 &live_hard_reg_pseudos_bitmap_obstack);
363 live_pseudos_reg_renumber = XNEWVEC (int, max_regno);
364 for (i = 0; i < max_regno; i++)
365 live_pseudos_reg_renumber[i] = -1;
368 /* Free the data about living pseudos at program points. */
369 static void
370 finish_lives (void)
372 sparseset_free (live_range_hard_reg_pseudos);
373 sparseset_free (live_range_reload_inheritance_pseudos);
374 free (live_hard_reg_pseudos);
375 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack);
376 free (live_pseudos_reg_renumber);
379 /* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
380 entries for pseudo REGNO. Assume that the register has been
381 spilled if FREE_P, otherwise assume that it has been assigned
382 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
383 ranges in the start chains when it is assumed to be assigned to a
384 hard register because we use the chains of pseudos assigned to hard
385 registers during allocation. */
386 static void
387 update_lives (int regno, bool free_p)
389 int p;
390 lra_live_range_t r;
392 if (reg_renumber[regno] < 0)
393 return;
394 live_pseudos_reg_renumber[regno] = free_p ? -1 : reg_renumber[regno];
395 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
397 for (p = r->start; p <= r->finish; p++)
398 if (free_p)
399 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
400 else
402 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
403 insert_in_live_range_start_chain (regno);
408 /* Sparseset used to calculate reload pseudos conflicting with a given
409 pseudo when we are trying to find a hard register for the given
410 pseudo. */
411 static sparseset conflict_reload_and_inheritance_pseudos;
413 /* Map: program point -> bitmap of all reload and inheritance pseudos
414 living at the point. */
415 static bitmap_head *live_reload_and_inheritance_pseudos;
416 static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack;
418 /* Allocate and initialize data about living reload pseudos at any
419 given program point. */
420 static void
421 init_live_reload_and_inheritance_pseudos (void)
423 int i, p, max_regno = max_reg_num ();
424 lra_live_range_t r;
426 conflict_reload_and_inheritance_pseudos = sparseset_alloc (max_regno);
427 live_reload_and_inheritance_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
428 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack);
429 for (p = 0; p < lra_live_max_point; p++)
430 bitmap_initialize (&live_reload_and_inheritance_pseudos[p],
431 &live_reload_and_inheritance_pseudos_bitmap_obstack);
432 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
434 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
435 for (p = r->start; p <= r->finish; p++)
436 bitmap_set_bit (&live_reload_and_inheritance_pseudos[p], i);
440 /* Finalize data about living reload pseudos at any given program
441 point. */
442 static void
443 finish_live_reload_and_inheritance_pseudos (void)
445 sparseset_free (conflict_reload_and_inheritance_pseudos);
446 free (live_reload_and_inheritance_pseudos);
447 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack);
450 /* The value used to check that cost of given hard reg is really
451 defined currently. */
452 static int curr_hard_regno_costs_check = 0;
453 /* Array used to check that cost of the corresponding hard reg (the
454 array element index) is really defined currently. */
455 static int hard_regno_costs_check[FIRST_PSEUDO_REGISTER];
456 /* The current costs of allocation of hard regs. Defined only if the
457 value of the corresponding element of the previous array is equal to
458 CURR_HARD_REGNO_COSTS_CHECK. */
459 static int hard_regno_costs[FIRST_PSEUDO_REGISTER];
461 /* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
462 not defined yet. */
463 static inline void
464 adjust_hard_regno_cost (int hard_regno, int incr)
466 if (hard_regno_costs_check[hard_regno] != curr_hard_regno_costs_check)
467 hard_regno_costs[hard_regno] = 0;
468 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
469 hard_regno_costs[hard_regno] += incr;
472 /* Try to find a free hard register for pseudo REGNO. Return the
473 hard register on success and set *COST to the cost of using
474 that register. (If several registers have equal cost, the one with
475 the highest priority wins.) Return -1 on failure.
477 If FIRST_P, return the first available hard reg ignoring other
478 criteria, e.g. allocation cost. This approach results in less hard
479 reg pool fragmentation and permit to allocate hard regs to reload
480 pseudos in complicated situations where pseudo sizes are different.
482 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
483 otherwise consider all hard registers in REGNO's class.
485 If REGNO_SET is not empty, only hard registers from the set are
486 considered. */
487 static int
488 find_hard_regno_for_1 (int regno, int *cost, int try_only_hard_regno,
489 bool first_p, HARD_REG_SET regno_set)
491 HARD_REG_SET conflict_set;
492 int best_cost = INT_MAX, best_priority = INT_MIN, best_usage = INT_MAX;
493 lra_live_range_t r;
494 int p, i, j, rclass_size, best_hard_regno, priority, hard_regno;
495 int hr, conflict_hr, nregs;
496 machine_mode biggest_mode;
497 unsigned int k, conflict_regno;
498 int offset, val, biggest_nregs, nregs_diff;
499 enum reg_class rclass;
500 bitmap_iterator bi;
501 bool *rclass_intersect_p;
502 HARD_REG_SET impossible_start_hard_regs, available_regs;
504 if (hard_reg_set_empty_p (regno_set))
505 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
506 else
508 COMPL_HARD_REG_SET (conflict_set, regno_set);
509 IOR_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
511 rclass = regno_allocno_class_array[regno];
512 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
513 curr_hard_regno_costs_check++;
514 sparseset_clear (conflict_reload_and_inheritance_pseudos);
515 sparseset_clear (live_range_hard_reg_pseudos);
516 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
517 biggest_mode = lra_reg_info[regno].biggest_mode;
518 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
520 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
521 if (rclass_intersect_p[regno_allocno_class_array[k]])
522 sparseset_set_bit (live_range_hard_reg_pseudos, k);
523 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos[r->start],
524 0, k, bi)
525 if (lra_reg_info[k].preferred_hard_regno1 >= 0
526 && live_pseudos_reg_renumber[k] < 0
527 && rclass_intersect_p[regno_allocno_class_array[k]])
528 sparseset_set_bit (conflict_reload_and_inheritance_pseudos, k);
529 for (p = r->start + 1; p <= r->finish; p++)
531 lra_live_range_t r2;
533 for (r2 = start_point_ranges[p];
534 r2 != NULL;
535 r2 = r2->start_next)
537 if (r2->regno >= lra_constraint_new_regno_start
538 && lra_reg_info[r2->regno].preferred_hard_regno1 >= 0
539 && live_pseudos_reg_renumber[r2->regno] < 0
540 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
541 sparseset_set_bit (conflict_reload_and_inheritance_pseudos,
542 r2->regno);
543 if (live_pseudos_reg_renumber[r2->regno] >= 0
544 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
545 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
549 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno1) >= 0)
551 adjust_hard_regno_cost
552 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit1);
553 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno2) >= 0)
554 adjust_hard_regno_cost
555 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit2);
557 #ifdef STACK_REGS
558 if (lra_reg_info[regno].no_stack_p)
559 for (i = FIRST_STACK_REG; i <= LAST_STACK_REG; i++)
560 SET_HARD_REG_BIT (conflict_set, i);
561 #endif
562 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos, regno);
563 val = lra_reg_info[regno].val;
564 offset = lra_reg_info[regno].offset;
565 CLEAR_HARD_REG_SET (impossible_start_hard_regs);
566 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
567 if (lra_reg_val_equal_p (conflict_regno, val, offset))
569 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
570 nregs = (hard_regno_nregs[conflict_hr]
571 [lra_reg_info[conflict_regno].biggest_mode]);
572 /* Remember about multi-register pseudos. For example, 2 hard
573 register pseudos can start on the same hard register but can
574 not start on HR and HR+1/HR-1. */
575 for (hr = conflict_hr + 1;
576 hr < FIRST_PSEUDO_REGISTER && hr < conflict_hr + nregs;
577 hr++)
578 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
579 for (hr = conflict_hr - 1;
580 hr >= 0 && hr + hard_regno_nregs[hr][biggest_mode] > conflict_hr;
581 hr--)
582 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
584 else
586 add_to_hard_reg_set (&conflict_set,
587 lra_reg_info[conflict_regno].biggest_mode,
588 live_pseudos_reg_renumber[conflict_regno]);
589 if (hard_reg_set_subset_p (reg_class_contents[rclass],
590 conflict_set))
591 return -1;
593 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos,
594 conflict_regno)
595 if (!lra_reg_val_equal_p (conflict_regno, val, offset))
597 lra_assert (live_pseudos_reg_renumber[conflict_regno] < 0);
598 if ((hard_regno
599 = lra_reg_info[conflict_regno].preferred_hard_regno1) >= 0)
601 adjust_hard_regno_cost
602 (hard_regno,
603 lra_reg_info[conflict_regno].preferred_hard_regno_profit1);
604 if ((hard_regno
605 = lra_reg_info[conflict_regno].preferred_hard_regno2) >= 0)
606 adjust_hard_regno_cost
607 (hard_regno,
608 lra_reg_info[conflict_regno].preferred_hard_regno_profit2);
611 /* Make sure that all registers in a multi-word pseudo belong to the
612 required class. */
613 IOR_COMPL_HARD_REG_SET (conflict_set, reg_class_contents[rclass]);
614 lra_assert (rclass != NO_REGS);
615 rclass_size = ira_class_hard_regs_num[rclass];
616 best_hard_regno = -1;
617 hard_regno = ira_class_hard_regs[rclass][0];
618 biggest_nregs = hard_regno_nregs[hard_regno][biggest_mode];
619 nregs_diff = (biggest_nregs
620 - hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)]);
621 COPY_HARD_REG_SET (available_regs, reg_class_contents[rclass]);
622 AND_COMPL_HARD_REG_SET (available_regs, lra_no_alloc_regs);
623 for (i = 0; i < rclass_size; i++)
625 if (try_only_hard_regno >= 0)
626 hard_regno = try_only_hard_regno;
627 else
628 hard_regno = ira_class_hard_regs[rclass][i];
629 if (! overlaps_hard_reg_set_p (conflict_set,
630 PSEUDO_REGNO_MODE (regno), hard_regno)
631 /* We can not use prohibited_class_mode_regs because it is
632 not defined for all classes. */
633 && HARD_REGNO_MODE_OK (hard_regno, PSEUDO_REGNO_MODE (regno))
634 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
635 && (nregs_diff == 0
636 || (WORDS_BIG_ENDIAN
637 ? (hard_regno - nregs_diff >= 0
638 && TEST_HARD_REG_BIT (available_regs,
639 hard_regno - nregs_diff))
640 : TEST_HARD_REG_BIT (available_regs,
641 hard_regno + nregs_diff))))
643 if (hard_regno_costs_check[hard_regno]
644 != curr_hard_regno_costs_check)
646 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
647 hard_regno_costs[hard_regno] = 0;
649 for (j = 0;
650 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
651 j++)
652 if (! TEST_HARD_REG_BIT (call_used_reg_set, hard_regno + j)
653 && ! df_regs_ever_live_p (hard_regno + j))
654 /* It needs save restore. */
655 hard_regno_costs[hard_regno]
656 += (2
657 * REG_FREQ_FROM_BB (ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
658 + 1);
659 priority = targetm.register_priority (hard_regno);
660 if (best_hard_regno < 0 || hard_regno_costs[hard_regno] < best_cost
661 || (hard_regno_costs[hard_regno] == best_cost
662 && (priority > best_priority
663 || (targetm.register_usage_leveling_p ()
664 && priority == best_priority
665 && best_usage > lra_hard_reg_usage[hard_regno]))))
667 best_hard_regno = hard_regno;
668 best_cost = hard_regno_costs[hard_regno];
669 best_priority = priority;
670 best_usage = lra_hard_reg_usage[hard_regno];
673 if (try_only_hard_regno >= 0 || (first_p && best_hard_regno >= 0))
674 break;
676 if (best_hard_regno >= 0)
677 *cost = best_cost - lra_reg_info[regno].freq;
678 return best_hard_regno;
681 /* A wrapper for find_hard_regno_for_1 (see comments for that function
682 description). This function tries to find a hard register for
683 preferred class first if it is worth. */
684 static int
685 find_hard_regno_for (int regno, int *cost, int try_only_hard_regno, bool first_p)
687 int hard_regno;
688 HARD_REG_SET regno_set;
690 /* Only original pseudos can have a different preferred class. */
691 if (try_only_hard_regno < 0 && regno < lra_new_regno_start)
693 enum reg_class pref_class = reg_preferred_class (regno);
695 if (regno_allocno_class_array[regno] != pref_class)
697 hard_regno = find_hard_regno_for_1 (regno, cost, -1, first_p,
698 reg_class_contents[pref_class]);
699 if (hard_regno >= 0)
700 return hard_regno;
703 CLEAR_HARD_REG_SET (regno_set);
704 return find_hard_regno_for_1 (regno, cost, try_only_hard_regno, first_p,
705 regno_set);
708 /* Current value used for checking elements in
709 update_hard_regno_preference_check. */
710 static int curr_update_hard_regno_preference_check;
711 /* If an element value is equal to the above variable value, then the
712 corresponding regno has been processed for preference
713 propagation. */
714 static int *update_hard_regno_preference_check;
716 /* Update the preference for using HARD_REGNO for pseudos that are
717 connected directly or indirectly with REGNO. Apply divisor DIV
718 to any preference adjustments.
720 The more indirectly a pseudo is connected, the smaller its effect
721 should be. We therefore increase DIV on each "hop". */
722 static void
723 update_hard_regno_preference (int regno, int hard_regno, int div)
725 int another_regno, cost;
726 lra_copy_t cp, next_cp;
728 /* Search depth 5 seems to be enough. */
729 if (div > (1 << 5))
730 return;
731 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
733 if (cp->regno1 == regno)
735 next_cp = cp->regno1_next;
736 another_regno = cp->regno2;
738 else if (cp->regno2 == regno)
740 next_cp = cp->regno2_next;
741 another_regno = cp->regno1;
743 else
744 gcc_unreachable ();
745 if (reg_renumber[another_regno] < 0
746 && (update_hard_regno_preference_check[another_regno]
747 != curr_update_hard_regno_preference_check))
749 update_hard_regno_preference_check[another_regno]
750 = curr_update_hard_regno_preference_check;
751 cost = cp->freq < div ? 1 : cp->freq / div;
752 lra_setup_reload_pseudo_preferenced_hard_reg
753 (another_regno, hard_regno, cost);
754 update_hard_regno_preference (another_regno, hard_regno, div * 2);
759 /* Return prefix title for pseudo REGNO. */
760 static const char *
761 pseudo_prefix_title (int regno)
763 return
764 (regno < lra_constraint_new_regno_start ? ""
765 : bitmap_bit_p (&lra_inheritance_pseudos, regno) ? "inheritance "
766 : bitmap_bit_p (&lra_split_regs, regno) ? "split "
767 : bitmap_bit_p (&lra_optional_reload_pseudos, regno) ? "optional reload "
768 : bitmap_bit_p (&lra_subreg_reload_pseudos, regno) ? "subreg reload "
769 : "reload ");
772 /* Update REG_RENUMBER and other pseudo preferences by assignment of
773 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
774 void
775 lra_setup_reg_renumber (int regno, int hard_regno, bool print_p)
777 int i, hr;
779 /* We can not just reassign hard register. */
780 lra_assert (hard_regno < 0 || reg_renumber[regno] < 0);
781 if ((hr = hard_regno) < 0)
782 hr = reg_renumber[regno];
783 reg_renumber[regno] = hard_regno;
784 lra_assert (hr >= 0);
785 for (i = 0; i < hard_regno_nregs[hr][PSEUDO_REGNO_MODE (regno)]; i++)
786 if (hard_regno < 0)
787 lra_hard_reg_usage[hr + i] -= lra_reg_info[regno].freq;
788 else
789 lra_hard_reg_usage[hr + i] += lra_reg_info[regno].freq;
790 if (print_p && lra_dump_file != NULL)
791 fprintf (lra_dump_file, " Assign %d to %sr%d (freq=%d)\n",
792 reg_renumber[regno], pseudo_prefix_title (regno),
793 regno, lra_reg_info[regno].freq);
794 if (hard_regno >= 0)
796 curr_update_hard_regno_preference_check++;
797 update_hard_regno_preference (regno, hard_regno, 1);
801 /* Pseudos which occur in insns containing a particular pseudo. */
802 static bitmap_head insn_conflict_pseudos;
804 /* Bitmaps used to contain spill pseudos for given pseudo hard regno
805 and best spill pseudos for given pseudo (and best hard regno). */
806 static bitmap_head spill_pseudos_bitmap, best_spill_pseudos_bitmap;
808 /* Current pseudo check for validity of elements in
809 TRY_HARD_REG_PSEUDOS. */
810 static int curr_pseudo_check;
811 /* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
812 static int try_hard_reg_pseudos_check[FIRST_PSEUDO_REGISTER];
813 /* Pseudos who hold given hard register at the considered points. */
814 static bitmap_head try_hard_reg_pseudos[FIRST_PSEUDO_REGISTER];
816 /* Set up try_hard_reg_pseudos for given program point P and class
817 RCLASS. Those are pseudos living at P and assigned to a hard
818 register of RCLASS. In other words, those are pseudos which can be
819 spilled to assign a hard register of RCLASS to a pseudo living at
820 P. */
821 static void
822 setup_try_hard_regno_pseudos (int p, enum reg_class rclass)
824 int i, hard_regno;
825 machine_mode mode;
826 unsigned int spill_regno;
827 bitmap_iterator bi;
829 /* Find what pseudos could be spilled. */
830 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[p], 0, spill_regno, bi)
832 mode = PSEUDO_REGNO_MODE (spill_regno);
833 hard_regno = live_pseudos_reg_renumber[spill_regno];
834 if (overlaps_hard_reg_set_p (reg_class_contents[rclass],
835 mode, hard_regno))
837 for (i = hard_regno_nregs[hard_regno][mode] - 1; i >= 0; i--)
839 if (try_hard_reg_pseudos_check[hard_regno + i]
840 != curr_pseudo_check)
842 try_hard_reg_pseudos_check[hard_regno + i]
843 = curr_pseudo_check;
844 bitmap_clear (&try_hard_reg_pseudos[hard_regno + i]);
846 bitmap_set_bit (&try_hard_reg_pseudos[hard_regno + i],
847 spill_regno);
853 /* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
854 assignment means that we might undo the data change. */
855 static void
856 assign_temporarily (int regno, int hard_regno)
858 int p;
859 lra_live_range_t r;
861 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
863 for (p = r->start; p <= r->finish; p++)
864 if (hard_regno < 0)
865 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
866 else
868 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
869 insert_in_live_range_start_chain (regno);
872 live_pseudos_reg_renumber[regno] = hard_regno;
875 /* Array used for sorting reload pseudos for subsequent allocation
876 after spilling some pseudo. */
877 static int *sorted_reload_pseudos;
879 /* Spill some pseudos for a reload pseudo REGNO and return hard
880 register which should be used for pseudo after spilling. The
881 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
882 choose hard register (and pseudos occupying the hard registers and
883 to be spilled), we take into account not only how REGNO will
884 benefit from the spills but also how other reload pseudos not yet
885 assigned to hard registers benefit from the spills too. In very
886 rare cases, the function can fail and return -1.
888 If FIRST_P, return the first available hard reg ignoring other
889 criteria, e.g. allocation cost and cost of spilling non-reload
890 pseudos. This approach results in less hard reg pool fragmentation
891 and permit to allocate hard regs to reload pseudos in complicated
892 situations where pseudo sizes are different. */
893 static int
894 spill_for (int regno, bitmap spilled_pseudo_bitmap, bool first_p)
896 int i, j, n, p, hard_regno, best_hard_regno, cost, best_cost, rclass_size;
897 int reload_hard_regno, reload_cost;
898 bool static_p, best_static_p;
899 machine_mode mode;
900 enum reg_class rclass;
901 unsigned int spill_regno, reload_regno, uid;
902 int insn_pseudos_num, best_insn_pseudos_num;
903 int bad_spills_num, smallest_bad_spills_num;
904 lra_live_range_t r;
905 bitmap_iterator bi;
907 rclass = regno_allocno_class_array[regno];
908 lra_assert (reg_renumber[regno] < 0 && rclass != NO_REGS);
909 bitmap_clear (&insn_conflict_pseudos);
910 bitmap_clear (&best_spill_pseudos_bitmap);
911 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
913 struct lra_insn_reg *ir;
915 for (ir = lra_get_insn_regs (uid); ir != NULL; ir = ir->next)
916 if (ir->regno >= FIRST_PSEUDO_REGISTER)
917 bitmap_set_bit (&insn_conflict_pseudos, ir->regno);
919 best_hard_regno = -1;
920 best_cost = INT_MAX;
921 best_static_p = TRUE;
922 best_insn_pseudos_num = INT_MAX;
923 smallest_bad_spills_num = INT_MAX;
924 rclass_size = ira_class_hard_regs_num[rclass];
925 mode = PSEUDO_REGNO_MODE (regno);
926 /* Invalidate try_hard_reg_pseudos elements. */
927 curr_pseudo_check++;
928 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
929 for (p = r->start; p <= r->finish; p++)
930 setup_try_hard_regno_pseudos (p, rclass);
931 for (i = 0; i < rclass_size; i++)
933 hard_regno = ira_class_hard_regs[rclass][i];
934 bitmap_clear (&spill_pseudos_bitmap);
935 for (j = hard_regno_nregs[hard_regno][mode] - 1; j >= 0; j--)
937 if (try_hard_reg_pseudos_check[hard_regno + j] != curr_pseudo_check)
938 continue;
939 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos[hard_regno + j]));
940 bitmap_ior_into (&spill_pseudos_bitmap,
941 &try_hard_reg_pseudos[hard_regno + j]);
943 /* Spill pseudos. */
944 static_p = false;
945 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
946 if ((pic_offset_table_rtx != NULL
947 && spill_regno == REGNO (pic_offset_table_rtx))
948 || ((int) spill_regno >= lra_constraint_new_regno_start
949 && ! bitmap_bit_p (&lra_inheritance_pseudos, spill_regno)
950 && ! bitmap_bit_p (&lra_split_regs, spill_regno)
951 && ! bitmap_bit_p (&lra_subreg_reload_pseudos, spill_regno)
952 && ! bitmap_bit_p (&lra_optional_reload_pseudos, spill_regno)))
953 goto fail;
954 else if (non_spilled_static_chain_regno_p (spill_regno))
955 static_p = true;
956 insn_pseudos_num = 0;
957 bad_spills_num = 0;
958 if (lra_dump_file != NULL)
959 fprintf (lra_dump_file, " Trying %d:", hard_regno);
960 sparseset_clear (live_range_reload_inheritance_pseudos);
961 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
963 if (bitmap_bit_p (&insn_conflict_pseudos, spill_regno))
964 insn_pseudos_num++;
965 if (spill_regno >= (unsigned int) lra_bad_spill_regno_start)
966 bad_spills_num++;
967 for (r = lra_reg_info[spill_regno].live_ranges;
968 r != NULL;
969 r = r->next)
971 for (p = r->start; p <= r->finish; p++)
973 lra_live_range_t r2;
975 for (r2 = start_point_ranges[p];
976 r2 != NULL;
977 r2 = r2->start_next)
978 if (r2->regno >= lra_constraint_new_regno_start)
979 sparseset_set_bit (live_range_reload_inheritance_pseudos,
980 r2->regno);
984 n = 0;
985 if (sparseset_cardinality (live_range_reload_inheritance_pseudos)
986 <= (unsigned)LRA_MAX_CONSIDERED_RELOAD_PSEUDOS)
987 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos,
988 reload_regno)
989 if ((int) reload_regno != regno
990 && (ira_reg_classes_intersect_p
991 [rclass][regno_allocno_class_array[reload_regno]])
992 && live_pseudos_reg_renumber[reload_regno] < 0
993 && find_hard_regno_for (reload_regno, &cost, -1, first_p) < 0)
994 sorted_reload_pseudos[n++] = reload_regno;
995 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
997 update_lives (spill_regno, true);
998 if (lra_dump_file != NULL)
999 fprintf (lra_dump_file, " spill %d(freq=%d)",
1000 spill_regno, lra_reg_info[spill_regno].freq);
1002 hard_regno = find_hard_regno_for (regno, &cost, -1, first_p);
1003 if (hard_regno >= 0)
1005 assign_temporarily (regno, hard_regno);
1006 qsort (sorted_reload_pseudos, n, sizeof (int),
1007 reload_pseudo_compare_func);
1008 for (j = 0; j < n; j++)
1010 reload_regno = sorted_reload_pseudos[j];
1011 lra_assert (live_pseudos_reg_renumber[reload_regno] < 0);
1012 if ((reload_hard_regno
1013 = find_hard_regno_for (reload_regno,
1014 &reload_cost, -1, first_p)) >= 0)
1016 if (lra_dump_file != NULL)
1017 fprintf (lra_dump_file, " assign %d(cost=%d)",
1018 reload_regno, reload_cost);
1019 assign_temporarily (reload_regno, reload_hard_regno);
1020 cost += reload_cost;
1023 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1025 rtx_insn_list *x;
1027 cost += lra_reg_info[spill_regno].freq;
1028 if (ira_reg_equiv[spill_regno].memory != NULL
1029 || ira_reg_equiv[spill_regno].constant != NULL)
1030 for (x = ira_reg_equiv[spill_regno].init_insns;
1031 x != NULL;
1032 x = x->next ())
1033 cost -= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (x->insn ()));
1035 /* Avoid spilling static chain pointer pseudo when non-local
1036 goto is used. */
1037 if ((! static_p && best_static_p)
1038 || (static_p == best_static_p
1039 && (best_insn_pseudos_num > insn_pseudos_num
1040 || (best_insn_pseudos_num == insn_pseudos_num
1041 && (bad_spills_num < smallest_bad_spills_num
1042 || (bad_spills_num == smallest_bad_spills_num
1043 && best_cost > cost))))))
1045 best_insn_pseudos_num = insn_pseudos_num;
1046 smallest_bad_spills_num = bad_spills_num;
1047 best_static_p = static_p;
1048 best_cost = cost;
1049 best_hard_regno = hard_regno;
1050 bitmap_copy (&best_spill_pseudos_bitmap, &spill_pseudos_bitmap);
1051 if (lra_dump_file != NULL)
1052 fprintf (lra_dump_file,
1053 " Now best %d(cost=%d, bad_spills=%d, insn_pseudos=%d)\n",
1054 hard_regno, cost, bad_spills_num, insn_pseudos_num);
1056 assign_temporarily (regno, -1);
1057 for (j = 0; j < n; j++)
1059 reload_regno = sorted_reload_pseudos[j];
1060 if (live_pseudos_reg_renumber[reload_regno] >= 0)
1061 assign_temporarily (reload_regno, -1);
1064 if (lra_dump_file != NULL)
1065 fprintf (lra_dump_file, "\n");
1066 /* Restore the live hard reg pseudo info for spilled pseudos. */
1067 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1068 update_lives (spill_regno, false);
1069 fail:
1072 /* Spill: */
1073 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap, 0, spill_regno, bi)
1075 if ((int) spill_regno >= lra_constraint_new_regno_start)
1076 former_reload_pseudo_spill_p = true;
1077 if (lra_dump_file != NULL)
1078 fprintf (lra_dump_file, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
1079 pseudo_prefix_title (spill_regno),
1080 spill_regno, reg_renumber[spill_regno],
1081 lra_reg_info[spill_regno].freq, regno);
1082 update_lives (spill_regno, true);
1083 lra_setup_reg_renumber (spill_regno, -1, false);
1085 bitmap_ior_into (spilled_pseudo_bitmap, &best_spill_pseudos_bitmap);
1086 return best_hard_regno;
1089 /* Assign HARD_REGNO to REGNO. */
1090 static void
1091 assign_hard_regno (int hard_regno, int regno)
1093 int i;
1095 lra_assert (hard_regno >= 0);
1096 lra_setup_reg_renumber (regno, hard_regno, true);
1097 update_lives (regno, false);
1098 for (i = 0;
1099 i < hard_regno_nregs[hard_regno][lra_reg_info[regno].biggest_mode];
1100 i++)
1101 df_set_regs_ever_live (hard_regno + i, true);
1104 /* Array used for sorting different pseudos. */
1105 static int *sorted_pseudos;
1107 /* The constraints pass is allowed to create equivalences between
1108 pseudos that make the current allocation "incorrect" (in the sense
1109 that pseudos are assigned to hard registers from their own conflict
1110 sets). The global variable lra_risky_transformations_p says
1111 whether this might have happened.
1113 Process pseudos assigned to hard registers (less frequently used
1114 first), spill if a conflict is found, and mark the spilled pseudos
1115 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1116 pseudos, assigned to hard registers. */
1117 static void
1118 setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1119 spilled_pseudo_bitmap)
1121 int p, i, j, n, regno, hard_regno;
1122 unsigned int k, conflict_regno;
1123 int val, offset;
1124 HARD_REG_SET conflict_set;
1125 machine_mode mode;
1126 lra_live_range_t r;
1127 bitmap_iterator bi;
1128 int max_regno = max_reg_num ();
1130 if (! lra_risky_transformations_p)
1132 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1133 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1134 update_lives (i, false);
1135 return;
1137 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1138 if ((pic_offset_table_rtx == NULL_RTX
1139 || i != (int) REGNO (pic_offset_table_rtx))
1140 && reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1141 sorted_pseudos[n++] = i;
1142 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1143 if (pic_offset_table_rtx != NULL_RTX
1144 && (regno = REGNO (pic_offset_table_rtx)) >= FIRST_PSEUDO_REGISTER
1145 && reg_renumber[regno] >= 0 && lra_reg_info[regno].nrefs > 0)
1146 sorted_pseudos[n++] = regno;
1147 for (i = n - 1; i >= 0; i--)
1149 regno = sorted_pseudos[i];
1150 hard_regno = reg_renumber[regno];
1151 lra_assert (hard_regno >= 0);
1152 mode = lra_reg_info[regno].biggest_mode;
1153 sparseset_clear (live_range_hard_reg_pseudos);
1154 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1156 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1157 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1158 for (p = r->start + 1; p <= r->finish; p++)
1160 lra_live_range_t r2;
1162 for (r2 = start_point_ranges[p];
1163 r2 != NULL;
1164 r2 = r2->start_next)
1165 if (live_pseudos_reg_renumber[r2->regno] >= 0)
1166 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1169 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
1170 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
1171 val = lra_reg_info[regno].val;
1172 offset = lra_reg_info[regno].offset;
1173 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1174 if (!lra_reg_val_equal_p (conflict_regno, val, offset)
1175 /* If it is multi-register pseudos they should start on
1176 the same hard register. */
1177 || hard_regno != reg_renumber[conflict_regno])
1178 add_to_hard_reg_set (&conflict_set,
1179 lra_reg_info[conflict_regno].biggest_mode,
1180 reg_renumber[conflict_regno]);
1181 if (! overlaps_hard_reg_set_p (conflict_set, mode, hard_regno))
1183 update_lives (regno, false);
1184 continue;
1186 bitmap_set_bit (spilled_pseudo_bitmap, regno);
1187 for (j = 0;
1188 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
1189 j++)
1190 lra_hard_reg_usage[hard_regno + j] -= lra_reg_info[regno].freq;
1191 reg_renumber[regno] = -1;
1192 if (regno >= lra_constraint_new_regno_start)
1193 former_reload_pseudo_spill_p = true;
1194 if (lra_dump_file != NULL)
1195 fprintf (lra_dump_file, " Spill r%d after risky transformations\n",
1196 regno);
1200 /* Improve allocation by assigning the same hard regno of inheritance
1201 pseudos to the connected pseudos. We need this because inheritance
1202 pseudos are allocated after reload pseudos in the thread and when
1203 we assign a hard register to a reload pseudo we don't know yet that
1204 the connected inheritance pseudos can get the same hard register.
1205 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1206 static void
1207 improve_inheritance (bitmap changed_pseudos)
1209 unsigned int k;
1210 int regno, another_regno, hard_regno, another_hard_regno, cost, i, n;
1211 lra_copy_t cp, next_cp;
1212 bitmap_iterator bi;
1214 if (lra_inheritance_iter > LRA_MAX_INHERITANCE_PASSES)
1215 return;
1216 n = 0;
1217 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, k, bi)
1218 if (reg_renumber[k] >= 0 && lra_reg_info[k].nrefs != 0)
1219 sorted_pseudos[n++] = k;
1220 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1221 for (i = 0; i < n; i++)
1223 regno = sorted_pseudos[i];
1224 hard_regno = reg_renumber[regno];
1225 lra_assert (hard_regno >= 0);
1226 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
1228 if (cp->regno1 == regno)
1230 next_cp = cp->regno1_next;
1231 another_regno = cp->regno2;
1233 else if (cp->regno2 == regno)
1235 next_cp = cp->regno2_next;
1236 another_regno = cp->regno1;
1238 else
1239 gcc_unreachable ();
1240 /* Don't change reload pseudo allocation. It might have
1241 this allocation for a purpose and changing it can result
1242 in LRA cycling. */
1243 if ((another_regno < lra_constraint_new_regno_start
1244 || bitmap_bit_p (&lra_inheritance_pseudos, another_regno))
1245 && (another_hard_regno = reg_renumber[another_regno]) >= 0
1246 && another_hard_regno != hard_regno)
1248 if (lra_dump_file != NULL)
1249 fprintf
1250 (lra_dump_file,
1251 " Improving inheritance for %d(%d) and %d(%d)...\n",
1252 regno, hard_regno, another_regno, another_hard_regno);
1253 update_lives (another_regno, true);
1254 lra_setup_reg_renumber (another_regno, -1, false);
1255 if (hard_regno == find_hard_regno_for (another_regno, &cost,
1256 hard_regno, false))
1257 assign_hard_regno (hard_regno, another_regno);
1258 else
1259 assign_hard_regno (another_hard_regno, another_regno);
1260 bitmap_set_bit (changed_pseudos, another_regno);
1267 /* Bitmap finally containing all pseudos spilled on this assignment
1268 pass. */
1269 static bitmap_head all_spilled_pseudos;
1270 /* All pseudos whose allocation was changed. */
1271 static bitmap_head changed_pseudo_bitmap;
1274 /* Add to LIVE_RANGE_HARD_REG_PSEUDOS all pseudos conflicting with
1275 REGNO and whose hard regs can be assigned to REGNO. */
1276 static void
1277 find_all_spills_for (int regno)
1279 int p;
1280 lra_live_range_t r;
1281 unsigned int k;
1282 bitmap_iterator bi;
1283 enum reg_class rclass;
1284 bool *rclass_intersect_p;
1286 rclass = regno_allocno_class_array[regno];
1287 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
1288 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1290 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1291 if (rclass_intersect_p[regno_allocno_class_array[k]])
1292 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1293 for (p = r->start + 1; p <= r->finish; p++)
1295 lra_live_range_t r2;
1297 for (r2 = start_point_ranges[p];
1298 r2 != NULL;
1299 r2 = r2->start_next)
1301 if (live_pseudos_reg_renumber[r2->regno] >= 0
1302 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
1303 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1309 /* Assign hard registers to reload pseudos and other pseudos. */
1310 static void
1311 assign_by_spills (void)
1313 int i, n, nfails, iter, regno, hard_regno, cost;
1314 rtx restore_rtx;
1315 rtx_insn *insn;
1316 bitmap_head changed_insns, do_not_assign_nonreload_pseudos;
1317 unsigned int u, conflict_regno;
1318 bitmap_iterator bi;
1319 bool reload_p;
1320 int max_regno = max_reg_num ();
1322 for (n = 0, i = lra_constraint_new_regno_start; i < max_regno; i++)
1323 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1324 && regno_allocno_class_array[i] != NO_REGS)
1325 sorted_pseudos[n++] = i;
1326 bitmap_initialize (&insn_conflict_pseudos, &reg_obstack);
1327 bitmap_initialize (&spill_pseudos_bitmap, &reg_obstack);
1328 bitmap_initialize (&best_spill_pseudos_bitmap, &reg_obstack);
1329 update_hard_regno_preference_check = XCNEWVEC (int, max_regno);
1330 curr_update_hard_regno_preference_check = 0;
1331 memset (try_hard_reg_pseudos_check, 0, sizeof (try_hard_reg_pseudos_check));
1332 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1333 bitmap_initialize (&try_hard_reg_pseudos[i], &reg_obstack);
1334 curr_pseudo_check = 0;
1335 bitmap_initialize (&changed_insns, &reg_obstack);
1336 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1337 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
1338 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
1339 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
1340 for (iter = 0; iter <= 1; iter++)
1342 qsort (sorted_pseudos, n, sizeof (int), reload_pseudo_compare_func);
1343 nfails = 0;
1344 for (i = 0; i < n; i++)
1346 regno = sorted_pseudos[i];
1347 if (reg_renumber[regno] >= 0)
1348 continue;
1349 if (lra_dump_file != NULL)
1350 fprintf (lra_dump_file, " Assigning to %d "
1351 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1352 regno, reg_class_names[regno_allocno_class_array[regno]],
1353 ORIGINAL_REGNO (regno_reg_rtx[regno]),
1354 lra_reg_info[regno].freq, regno_assign_info[regno].first,
1355 regno_assign_info[regno_assign_info[regno].first].freq);
1356 hard_regno = find_hard_regno_for (regno, &cost, -1, iter == 1);
1357 reload_p = ! bitmap_bit_p (&non_reload_pseudos, regno);
1358 if (hard_regno < 0 && reload_p)
1359 hard_regno = spill_for (regno, &all_spilled_pseudos, iter == 1);
1360 if (hard_regno < 0)
1362 if (reload_p)
1363 sorted_pseudos[nfails++] = regno;
1365 else
1367 /* This register might have been spilled by the previous
1368 pass. Indicate that it is no longer spilled. */
1369 bitmap_clear_bit (&all_spilled_pseudos, regno);
1370 assign_hard_regno (hard_regno, regno);
1371 if (! reload_p)
1372 /* As non-reload pseudo assignment is changed we
1373 should reconsider insns referring for the
1374 pseudo. */
1375 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1378 if (nfails == 0)
1379 break;
1380 if (iter > 0)
1382 /* We did not assign hard regs to reload pseudos after two iterations.
1383 Either it's an asm and something is wrong with the constraints, or
1384 we have run out of spill registers; error out in either case. */
1385 bool asm_p = false;
1386 bitmap_head failed_reload_insns;
1388 bitmap_initialize (&failed_reload_insns, &reg_obstack);
1389 for (i = 0; i < nfails; i++)
1391 regno = sorted_pseudos[i];
1392 bitmap_ior_into (&failed_reload_insns,
1393 &lra_reg_info[regno].insn_bitmap);
1394 /* Assign an arbitrary hard register of regno class to
1395 avoid further trouble with this insn. */
1396 bitmap_clear_bit (&all_spilled_pseudos, regno);
1397 assign_hard_regno
1398 (ira_class_hard_regs[regno_allocno_class_array[regno]][0],
1399 regno);
1401 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns, 0, u, bi)
1403 insn = lra_insn_recog_data[u]->insn;
1404 if (asm_noperands (PATTERN (insn)) >= 0)
1406 asm_p = true;
1407 error_for_asm (insn,
1408 "%<asm%> operand has impossible constraints");
1409 /* Avoid further trouble with this insn.
1410 For asm goto, instead of fixing up all the edges
1411 just clear the template and clear input operands
1412 (asm goto doesn't have any output operands). */
1413 if (JUMP_P (insn))
1415 rtx asm_op = extract_asm_operands (PATTERN (insn));
1416 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1417 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1418 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1419 lra_update_insn_regno_info (insn);
1421 else
1423 PATTERN (insn) = gen_rtx_USE (VOIDmode, const0_rtx);
1424 lra_set_insn_deleted (insn);
1427 else if (!asm_p)
1429 error ("unable to find a register to spill");
1430 fatal_insn ("this is the insn:", insn);
1433 break;
1435 /* This is a very rare event. We can not assign a hard register
1436 to reload pseudo because the hard register was assigned to
1437 another reload pseudo on a previous assignment pass. For x86
1438 example, on the 1st pass we assigned CX (although another
1439 hard register could be used for this) to reload pseudo in an
1440 insn, on the 2nd pass we need CX (and only this) hard
1441 register for a new reload pseudo in the same insn. Another
1442 possible situation may occur in assigning to multi-regs
1443 reload pseudos when hard regs pool is too fragmented even
1444 after spilling non-reload pseudos.
1446 We should do something radical here to succeed. Here we
1447 spill *all* conflicting pseudos and reassign them. */
1448 if (lra_dump_file != NULL)
1449 fprintf (lra_dump_file, " 2nd iter for reload pseudo assignments:\n");
1450 sparseset_clear (live_range_hard_reg_pseudos);
1451 for (i = 0; i < nfails; i++)
1453 if (lra_dump_file != NULL)
1454 fprintf (lra_dump_file, " Reload r%d assignment failure\n",
1455 sorted_pseudos[i]);
1456 find_all_spills_for (sorted_pseudos[i]);
1458 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1460 if ((int) conflict_regno >= lra_constraint_new_regno_start)
1462 sorted_pseudos[nfails++] = conflict_regno;
1463 former_reload_pseudo_spill_p = true;
1465 if (lra_dump_file != NULL)
1466 fprintf (lra_dump_file, " Spill %s r%d(hr=%d, freq=%d)\n",
1467 pseudo_prefix_title (conflict_regno), conflict_regno,
1468 reg_renumber[conflict_regno],
1469 lra_reg_info[conflict_regno].freq);
1470 update_lives (conflict_regno, true);
1471 lra_setup_reg_renumber (conflict_regno, -1, false);
1473 n = nfails;
1475 improve_inheritance (&changed_pseudo_bitmap);
1476 bitmap_clear (&non_reload_pseudos);
1477 bitmap_clear (&changed_insns);
1478 if (! lra_simple_p)
1480 /* We should not assign to original pseudos of inheritance
1481 pseudos or split pseudos if any its inheritance pseudo did
1482 not get hard register or any its split pseudo was not split
1483 because undo inheritance/split pass will extend live range of
1484 such inheritance or split pseudos. */
1485 bitmap_initialize (&do_not_assign_nonreload_pseudos, &reg_obstack);
1486 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, u, bi)
1487 if ((restore_rtx = lra_reg_info[u].restore_rtx) != NULL_RTX
1488 && REG_P (restore_rtx)
1489 && reg_renumber[u] < 0
1490 && bitmap_bit_p (&lra_inheritance_pseudos, u))
1491 bitmap_set_bit (&do_not_assign_nonreload_pseudos, REGNO (restore_rtx));
1492 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs, 0, u, bi)
1493 if ((restore_rtx = lra_reg_info[u].restore_rtx) != NULL_RTX
1494 && reg_renumber[u] >= 0)
1496 lra_assert (REG_P (restore_rtx));
1497 bitmap_set_bit (&do_not_assign_nonreload_pseudos, REGNO (restore_rtx));
1499 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1500 if (((i < lra_constraint_new_regno_start
1501 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos, i))
1502 || (bitmap_bit_p (&lra_inheritance_pseudos, i)
1503 && lra_reg_info[i].restore_rtx != NULL_RTX)
1504 || (bitmap_bit_p (&lra_split_regs, i)
1505 && lra_reg_info[i].restore_rtx != NULL_RTX)
1506 || bitmap_bit_p (&lra_subreg_reload_pseudos, i)
1507 || bitmap_bit_p (&lra_optional_reload_pseudos, i))
1508 && reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1509 && regno_allocno_class_array[i] != NO_REGS)
1510 sorted_pseudos[n++] = i;
1511 bitmap_clear (&do_not_assign_nonreload_pseudos);
1512 if (n != 0 && lra_dump_file != NULL)
1513 fprintf (lra_dump_file, " Reassigning non-reload pseudos\n");
1514 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1515 for (i = 0; i < n; i++)
1517 regno = sorted_pseudos[i];
1518 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1519 if (hard_regno >= 0)
1521 assign_hard_regno (hard_regno, regno);
1522 /* We change allocation for non-reload pseudo on this
1523 iteration -- mark the pseudo for invalidation of used
1524 alternatives of insns containing the pseudo. */
1525 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1527 else
1529 enum reg_class rclass = lra_get_allocno_class (regno);
1530 enum reg_class spill_class;
1532 if (targetm.spill_class == NULL
1533 || lra_reg_info[regno].restore_rtx == NULL_RTX
1534 || ! bitmap_bit_p (&lra_inheritance_pseudos, regno)
1535 || (spill_class
1536 = ((enum reg_class)
1537 targetm.spill_class
1538 ((reg_class_t) rclass,
1539 PSEUDO_REGNO_MODE (regno)))) == NO_REGS)
1540 continue;
1541 regno_allocno_class_array[regno] = spill_class;
1542 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1543 if (hard_regno < 0)
1544 regno_allocno_class_array[regno] = rclass;
1545 else
1547 setup_reg_classes
1548 (regno, spill_class, spill_class, spill_class);
1549 assign_hard_regno (hard_regno, regno);
1550 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1555 free (update_hard_regno_preference_check);
1556 bitmap_clear (&best_spill_pseudos_bitmap);
1557 bitmap_clear (&spill_pseudos_bitmap);
1558 bitmap_clear (&insn_conflict_pseudos);
1562 /* Entry function to assign hard registers to new reload pseudos
1563 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1564 of old pseudos) and possibly to the old pseudos. The function adds
1565 what insns to process for the next constraint pass. Those are all
1566 insns who contains non-reload and non-inheritance pseudos with
1567 changed allocation.
1569 Return true if we did not spill any non-reload and non-inheritance
1570 pseudos. */
1571 bool
1572 lra_assign (void)
1574 int i;
1575 unsigned int u;
1576 bitmap_iterator bi;
1577 bitmap_head insns_to_process;
1578 bool no_spills_p;
1579 int max_regno = max_reg_num ();
1581 timevar_push (TV_LRA_ASSIGN);
1582 lra_assignment_iter++;
1583 if (lra_dump_file != NULL)
1584 fprintf (lra_dump_file, "\n********** Assignment #%d: **********\n\n",
1585 lra_assignment_iter);
1586 init_lives ();
1587 sorted_pseudos = XNEWVEC (int, max_regno);
1588 sorted_reload_pseudos = XNEWVEC (int, max_regno);
1589 regno_allocno_class_array = XNEWVEC (enum reg_class, max_regno);
1590 regno_live_length = XNEWVEC (int, max_regno);
1591 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1593 int l;
1594 lra_live_range_t r;
1596 regno_allocno_class_array[i] = lra_get_allocno_class (i);
1597 for (l = 0, r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
1598 l += r->finish - r->start + 1;
1599 regno_live_length[i] = l;
1601 former_reload_pseudo_spill_p = false;
1602 init_regno_assign_info ();
1603 bitmap_initialize (&all_spilled_pseudos, &reg_obstack);
1604 create_live_range_start_chains ();
1605 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos);
1606 if (flag_checking && !flag_ipa_ra)
1607 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1608 if (lra_reg_info[i].nrefs != 0 && reg_renumber[i] >= 0
1609 && lra_reg_info[i].call_p
1610 && overlaps_hard_reg_set_p (call_used_reg_set,
1611 PSEUDO_REGNO_MODE (i), reg_renumber[i]))
1612 gcc_unreachable ();
1613 /* Setup insns to process on the next constraint pass. */
1614 bitmap_initialize (&changed_pseudo_bitmap, &reg_obstack);
1615 init_live_reload_and_inheritance_pseudos ();
1616 assign_by_spills ();
1617 finish_live_reload_and_inheritance_pseudos ();
1618 bitmap_ior_into (&changed_pseudo_bitmap, &all_spilled_pseudos);
1619 no_spills_p = true;
1620 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos, 0, u, bi)
1621 /* We ignore spilled pseudos created on last inheritance pass
1622 because they will be removed. */
1623 if (lra_reg_info[u].restore_rtx == NULL_RTX)
1625 no_spills_p = false;
1626 break;
1628 finish_live_range_start_chains ();
1629 bitmap_clear (&all_spilled_pseudos);
1630 bitmap_initialize (&insns_to_process, &reg_obstack);
1631 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap, 0, u, bi)
1632 bitmap_ior_into (&insns_to_process, &lra_reg_info[u].insn_bitmap);
1633 bitmap_clear (&changed_pseudo_bitmap);
1634 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process, 0, u, bi)
1636 lra_push_insn_by_uid (u);
1637 /* Invalidate alternatives for insn should be processed. */
1638 lra_set_used_insn_alternative_by_uid (u, -1);
1640 bitmap_clear (&insns_to_process);
1641 finish_regno_assign_info ();
1642 free (regno_live_length);
1643 free (regno_allocno_class_array);
1644 free (sorted_pseudos);
1645 free (sorted_reload_pseudos);
1646 finish_lives ();
1647 timevar_pop (TV_LRA_ASSIGN);
1648 if (former_reload_pseudo_spill_p)
1649 lra_assignment_iter_after_spill++;
1650 /* This is conditional on flag_checking because valid code can take
1651 more than this maximum number of iteration, but at the same time
1652 the test can uncover errors in machine descriptions. */
1653 if (flag_checking
1654 && (lra_assignment_iter_after_spill
1655 > LRA_MAX_ASSIGNMENT_ITERATION_NUMBER))
1656 internal_error
1657 ("Maximum number of LRA assignment passes is achieved (%d)\n",
1658 LRA_MAX_ASSIGNMENT_ITERATION_NUMBER);
1659 return no_spills_p;