2013-07-08 Andreas Krebbel <Andreas.Krebbel@de.ibm.com>
[official-gcc.git] / gcc / lra-assigns.c
blobb5736268e693464fb83176fd4605b9271e4b1109
1 /* Assign reload pseudos.
2 Copyright (C) 2010-2013 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
22 /* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
36 and spill registers.
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
50 copies.
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
64 Only insns with changed allocation pseudos are processed on the
65 next constraint pass.
67 The pseudo live-ranges are used to find conflicting pseudos.
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
75 restore_regno. */
77 #include "config.h"
78 #include "system.h"
79 #include "coretypes.h"
80 #include "tm.h"
81 #include "hard-reg-set.h"
82 #include "rtl.h"
83 #include "rtl-error.h"
84 #include "tm_p.h"
85 #include "target.h"
86 #include "insn-config.h"
87 #include "recog.h"
88 #include "output.h"
89 #include "regs.h"
90 #include "function.h"
91 #include "expr.h"
92 #include "basic-block.h"
93 #include "except.h"
94 #include "df.h"
95 #include "ira.h"
96 #include "sparseset.h"
97 #include "lra-int.h"
99 /* Array containing corresponding values of function
100 lra_get_allocno_class. It is used to speed up the code. */
101 static enum reg_class *regno_allocno_class_array;
103 /* Information about the thread to which a pseudo belongs. Threads are
104 a set of connected reload and inheritance pseudos with the same set of
105 available hard registers. Lone registers belong to their own threads. */
106 struct regno_assign_info
108 /* First/next pseudo of the same thread. */
109 int first, next;
110 /* Frequency of the thread (execution frequency of only reload
111 pseudos in the thread when the thread contains a reload pseudo).
112 Defined only for the first thread pseudo. */
113 int freq;
116 /* Map regno to the corresponding regno assignment info. */
117 static struct regno_assign_info *regno_assign_info;
119 /* Process a pseudo copy with execution frequency COPY_FREQ connecting
120 REGNO1 and REGNO2 to form threads. */
121 static void
122 process_copy_to_form_thread (int regno1, int regno2, int copy_freq)
124 int last, regno1_first, regno2_first;
126 lra_assert (regno1 >= lra_constraint_new_regno_start
127 && regno2 >= lra_constraint_new_regno_start);
128 regno1_first = regno_assign_info[regno1].first;
129 regno2_first = regno_assign_info[regno2].first;
130 if (regno1_first != regno2_first)
132 for (last = regno2_first;
133 regno_assign_info[last].next >= 0;
134 last = regno_assign_info[last].next)
135 regno_assign_info[last].first = regno1_first;
136 regno_assign_info[last].first = regno1_first;
137 regno_assign_info[last].next = regno_assign_info[regno1_first].next;
138 regno_assign_info[regno1_first].next = regno2_first;
139 regno_assign_info[regno1_first].freq
140 += regno_assign_info[regno2_first].freq;
142 regno_assign_info[regno1_first].freq -= 2 * copy_freq;
143 lra_assert (regno_assign_info[regno1_first].freq >= 0);
146 /* Initialize REGNO_ASSIGN_INFO and form threads. */
147 static void
148 init_regno_assign_info (void)
150 int i, regno1, regno2, max_regno = max_reg_num ();
151 lra_copy_t cp;
153 regno_assign_info = XNEWVEC (struct regno_assign_info, max_regno);
154 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
156 regno_assign_info[i].first = i;
157 regno_assign_info[i].next = -1;
158 regno_assign_info[i].freq = lra_reg_info[i].freq;
160 /* Form the threads. */
161 for (i = 0; (cp = lra_get_copy (i)) != NULL; i++)
162 if ((regno1 = cp->regno1) >= lra_constraint_new_regno_start
163 && (regno2 = cp->regno2) >= lra_constraint_new_regno_start
164 && reg_renumber[regno1] < 0 && lra_reg_info[regno1].nrefs != 0
165 && reg_renumber[regno2] < 0 && lra_reg_info[regno2].nrefs != 0
166 && (ira_class_hard_regs_num[regno_allocno_class_array[regno1]]
167 == ira_class_hard_regs_num[regno_allocno_class_array[regno2]]))
168 process_copy_to_form_thread (regno1, regno2, cp->freq);
171 /* Free REGNO_ASSIGN_INFO. */
172 static void
173 finish_regno_assign_info (void)
175 free (regno_assign_info);
178 /* The function is used to sort *reload* and *inheritance* pseudos to
179 try to assign them hard registers. We put pseudos from the same
180 thread always nearby. */
181 static int
182 reload_pseudo_compare_func (const void *v1p, const void *v2p)
184 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
185 enum reg_class cl1 = regno_allocno_class_array[r1];
186 enum reg_class cl2 = regno_allocno_class_array[r2];
187 int diff;
189 lra_assert (r1 >= lra_constraint_new_regno_start
190 && r2 >= lra_constraint_new_regno_start);
192 /* Prefer to assign reload registers with smaller classes first to
193 guarantee assignment to all reload registers. */
194 if ((diff = (ira_class_hard_regs_num[cl1]
195 - ira_class_hard_regs_num[cl2])) != 0)
196 return diff;
197 if ((diff = (regno_assign_info[regno_assign_info[r2].first].freq
198 - regno_assign_info[regno_assign_info[r1].first].freq)) != 0)
199 return diff;
200 /* Allocate bigger pseudos first to avoid register file
201 fragmentation. */
202 if ((diff
203 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
204 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0)
205 return diff;
206 /* Put pseudos from the thread nearby. */
207 if ((diff = regno_assign_info[r1].first - regno_assign_info[r2].first) != 0)
208 return diff;
209 /* If regs are equally good, sort by their numbers, so that the
210 results of qsort leave nothing to chance. */
211 return r1 - r2;
214 /* The function is used to sort *non-reload* pseudos to try to assign
215 them hard registers. The order calculation is simpler than in the
216 previous function and based on the pseudo frequency usage. */
217 static int
218 pseudo_compare_func (const void *v1p, const void *v2p)
220 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
221 int diff;
223 /* Prefer to assign more frequently used registers first. */
224 if ((diff = lra_reg_info[r2].freq - lra_reg_info[r1].freq) != 0)
225 return diff;
227 /* If regs are equally good, sort by their numbers, so that the
228 results of qsort leave nothing to chance. */
229 return r1 - r2;
232 /* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
233 pseudo live ranges with given start point. We insert only live
234 ranges of pseudos interesting for assignment purposes. They are
235 reload pseudos and pseudos assigned to hard registers. */
236 static lra_live_range_t *start_point_ranges;
238 /* Used as a flag that a live range is not inserted in the start point
239 chain. */
240 static struct lra_live_range not_in_chain_mark;
242 /* Create and set up START_POINT_RANGES. */
243 static void
244 create_live_range_start_chains (void)
246 int i, max_regno;
247 lra_live_range_t r;
249 start_point_ranges = XCNEWVEC (lra_live_range_t, lra_live_max_point);
250 max_regno = max_reg_num ();
251 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
252 if (i >= lra_constraint_new_regno_start || reg_renumber[i] >= 0)
254 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
256 r->start_next = start_point_ranges[r->start];
257 start_point_ranges[r->start] = r;
260 else
262 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
263 r->start_next = &not_in_chain_mark;
267 /* Insert live ranges of pseudo REGNO into start chains if they are
268 not there yet. */
269 static void
270 insert_in_live_range_start_chain (int regno)
272 lra_live_range_t r = lra_reg_info[regno].live_ranges;
274 if (r->start_next != &not_in_chain_mark)
275 return;
276 for (; r != NULL; r = r->next)
278 r->start_next = start_point_ranges[r->start];
279 start_point_ranges[r->start] = r;
283 /* Free START_POINT_RANGES. */
284 static void
285 finish_live_range_start_chains (void)
287 gcc_assert (start_point_ranges != NULL);
288 free (start_point_ranges);
289 start_point_ranges = NULL;
292 /* Map: program point -> bitmap of all pseudos living at the point and
293 assigned to hard registers. */
294 static bitmap_head *live_hard_reg_pseudos;
295 static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack;
297 /* reg_renumber corresponding to pseudos marked in
298 live_hard_reg_pseudos. reg_renumber might be not matched to
299 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
300 live_hard_reg_pseudos. */
301 static int *live_pseudos_reg_renumber;
303 /* Sparseset used to calculate living hard reg pseudos for some program
304 point range. */
305 static sparseset live_range_hard_reg_pseudos;
307 /* Sparseset used to calculate living reload/inheritance pseudos for
308 some program point range. */
309 static sparseset live_range_reload_inheritance_pseudos;
311 /* Allocate and initialize the data about living pseudos at program
312 points. */
313 static void
314 init_lives (void)
316 int i, max_regno = max_reg_num ();
318 live_range_hard_reg_pseudos = sparseset_alloc (max_regno);
319 live_range_reload_inheritance_pseudos = sparseset_alloc (max_regno);
320 live_hard_reg_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
321 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack);
322 for (i = 0; i < lra_live_max_point; i++)
323 bitmap_initialize (&live_hard_reg_pseudos[i],
324 &live_hard_reg_pseudos_bitmap_obstack);
325 live_pseudos_reg_renumber = XNEWVEC (int, max_regno);
326 for (i = 0; i < max_regno; i++)
327 live_pseudos_reg_renumber[i] = -1;
330 /* Free the data about living pseudos at program points. */
331 static void
332 finish_lives (void)
334 sparseset_free (live_range_hard_reg_pseudos);
335 sparseset_free (live_range_reload_inheritance_pseudos);
336 free (live_hard_reg_pseudos);
337 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack);
338 free (live_pseudos_reg_renumber);
341 /* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
342 entries for pseudo REGNO. Assume that the register has been
343 spilled if FREE_P, otherwise assume that it has been assigned
344 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
345 ranges in the start chains when it is assumed to be assigned to a
346 hard register because we use the chains of pseudos assigned to hard
347 registers during allocation. */
348 static void
349 update_lives (int regno, bool free_p)
351 int p;
352 lra_live_range_t r;
354 if (reg_renumber[regno] < 0)
355 return;
356 live_pseudos_reg_renumber[regno] = free_p ? -1 : reg_renumber[regno];
357 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
359 for (p = r->start; p <= r->finish; p++)
360 if (free_p)
361 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
362 else
364 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
365 insert_in_live_range_start_chain (regno);
370 /* Sparseset used to calculate reload pseudos conflicting with a given
371 pseudo when we are trying to find a hard register for the given
372 pseudo. */
373 static sparseset conflict_reload_and_inheritance_pseudos;
375 /* Map: program point -> bitmap of all reload and inheritance pseudos
376 living at the point. */
377 static bitmap_head *live_reload_and_inheritance_pseudos;
378 static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack;
380 /* Allocate and initialize data about living reload pseudos at any
381 given program point. */
382 static void
383 init_live_reload_and_inheritance_pseudos (void)
385 int i, p, max_regno = max_reg_num ();
386 lra_live_range_t r;
388 conflict_reload_and_inheritance_pseudos = sparseset_alloc (max_regno);
389 live_reload_and_inheritance_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
390 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack);
391 for (p = 0; p < lra_live_max_point; p++)
392 bitmap_initialize (&live_reload_and_inheritance_pseudos[p],
393 &live_reload_and_inheritance_pseudos_bitmap_obstack);
394 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
396 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
397 for (p = r->start; p <= r->finish; p++)
398 bitmap_set_bit (&live_reload_and_inheritance_pseudos[p], i);
402 /* Finalize data about living reload pseudos at any given program
403 point. */
404 static void
405 finish_live_reload_and_inheritance_pseudos (void)
407 sparseset_free (conflict_reload_and_inheritance_pseudos);
408 free (live_reload_and_inheritance_pseudos);
409 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack);
412 /* The value used to check that cost of given hard reg is really
413 defined currently. */
414 static int curr_hard_regno_costs_check = 0;
415 /* Array used to check that cost of the corresponding hard reg (the
416 array element index) is really defined currently. */
417 static int hard_regno_costs_check[FIRST_PSEUDO_REGISTER];
418 /* The current costs of allocation of hard regs. Defined only if the
419 value of the corresponding element of the previous array is equal to
420 CURR_HARD_REGNO_COSTS_CHECK. */
421 static int hard_regno_costs[FIRST_PSEUDO_REGISTER];
423 /* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
424 not defined yet. */
425 static inline void
426 adjust_hard_regno_cost (int hard_regno, int incr)
428 if (hard_regno_costs_check[hard_regno] != curr_hard_regno_costs_check)
429 hard_regno_costs[hard_regno] = 0;
430 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
431 hard_regno_costs[hard_regno] += incr;
434 /* Try to find a free hard register for pseudo REGNO. Return the
435 hard register on success and set *COST to the cost of using
436 that register. (If several registers have equal cost, the one with
437 the highest priority wins.) Return -1 on failure.
439 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
440 otherwise consider all hard registers in REGNO's class. */
441 static int
442 find_hard_regno_for (int regno, int *cost, int try_only_hard_regno)
444 HARD_REG_SET conflict_set;
445 int best_cost = INT_MAX, best_priority = INT_MIN, best_usage = INT_MAX;
446 lra_live_range_t r;
447 int p, i, j, rclass_size, best_hard_regno, priority, hard_regno;
448 int hr, conflict_hr, nregs;
449 enum machine_mode biggest_mode;
450 unsigned int k, conflict_regno;
451 int offset, val, biggest_nregs, nregs_diff;
452 enum reg_class rclass;
453 bitmap_iterator bi;
454 bool *rclass_intersect_p;
455 HARD_REG_SET impossible_start_hard_regs;
457 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
458 rclass = regno_allocno_class_array[regno];
459 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
460 curr_hard_regno_costs_check++;
461 sparseset_clear (conflict_reload_and_inheritance_pseudos);
462 sparseset_clear (live_range_hard_reg_pseudos);
463 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
464 biggest_mode = lra_reg_info[regno].biggest_mode;
465 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
467 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
468 if (rclass_intersect_p[regno_allocno_class_array[k]])
469 sparseset_set_bit (live_range_hard_reg_pseudos, k);
470 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos[r->start],
471 0, k, bi)
472 if (lra_reg_info[k].preferred_hard_regno1 >= 0
473 && live_pseudos_reg_renumber[k] < 0
474 && rclass_intersect_p[regno_allocno_class_array[k]])
475 sparseset_set_bit (conflict_reload_and_inheritance_pseudos, k);
476 for (p = r->start + 1; p <= r->finish; p++)
478 lra_live_range_t r2;
480 for (r2 = start_point_ranges[p];
481 r2 != NULL;
482 r2 = r2->start_next)
484 if (r2->regno >= lra_constraint_new_regno_start
485 && lra_reg_info[r2->regno].preferred_hard_regno1 >= 0
486 && live_pseudos_reg_renumber[r2->regno] < 0
487 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
488 sparseset_set_bit (conflict_reload_and_inheritance_pseudos,
489 r2->regno);
490 if (live_pseudos_reg_renumber[r2->regno] >= 0
491 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
492 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
496 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno1) >= 0)
498 adjust_hard_regno_cost
499 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit1);
500 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno2) >= 0)
501 adjust_hard_regno_cost
502 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit2);
504 #ifdef STACK_REGS
505 if (lra_reg_info[regno].no_stack_p)
506 for (i = FIRST_STACK_REG; i <= LAST_STACK_REG; i++)
507 SET_HARD_REG_BIT (conflict_set, i);
508 #endif
509 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos, regno);
510 val = lra_reg_info[regno].val;
511 offset = lra_reg_info[regno].offset;
512 CLEAR_HARD_REG_SET (impossible_start_hard_regs);
513 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
514 if (lra_reg_val_equal_p (conflict_regno, val, offset))
516 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
517 nregs = (hard_regno_nregs[conflict_hr]
518 [lra_reg_info[conflict_regno].biggest_mode]);
519 /* Remember about multi-register pseudos. For example, 2 hard
520 register pseudos can start on the same hard register but can
521 not start on HR and HR+1/HR-1. */
522 for (hr = conflict_hr + 1;
523 hr < FIRST_PSEUDO_REGISTER && hr < conflict_hr + nregs;
524 hr++)
525 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
526 for (hr = conflict_hr - 1;
527 hr >= 0 && hr + hard_regno_nregs[hr][biggest_mode] > conflict_hr;
528 hr--)
529 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
531 else
533 add_to_hard_reg_set (&conflict_set,
534 lra_reg_info[conflict_regno].biggest_mode,
535 live_pseudos_reg_renumber[conflict_regno]);
536 if (hard_reg_set_subset_p (reg_class_contents[rclass],
537 conflict_set))
538 return -1;
540 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos,
541 conflict_regno)
542 if (!lra_reg_val_equal_p (conflict_regno, val, offset))
544 lra_assert (live_pseudos_reg_renumber[conflict_regno] < 0);
545 if ((hard_regno
546 = lra_reg_info[conflict_regno].preferred_hard_regno1) >= 0)
548 adjust_hard_regno_cost
549 (hard_regno,
550 lra_reg_info[conflict_regno].preferred_hard_regno_profit1);
551 if ((hard_regno
552 = lra_reg_info[conflict_regno].preferred_hard_regno2) >= 0)
553 adjust_hard_regno_cost
554 (hard_regno,
555 lra_reg_info[conflict_regno].preferred_hard_regno_profit2);
558 /* Make sure that all registers in a multi-word pseudo belong to the
559 required class. */
560 IOR_COMPL_HARD_REG_SET (conflict_set, reg_class_contents[rclass]);
561 lra_assert (rclass != NO_REGS);
562 rclass_size = ira_class_hard_regs_num[rclass];
563 best_hard_regno = -1;
564 hard_regno = ira_class_hard_regs[rclass][0];
565 biggest_nregs = hard_regno_nregs[hard_regno][biggest_mode];
566 nregs_diff = (biggest_nregs
567 - hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)]);
568 for (i = 0; i < rclass_size; i++)
570 if (try_only_hard_regno >= 0)
571 hard_regno = try_only_hard_regno;
572 else
573 hard_regno = ira_class_hard_regs[rclass][i];
574 if (! overlaps_hard_reg_set_p (conflict_set,
575 PSEUDO_REGNO_MODE (regno), hard_regno)
576 /* We can not use prohibited_class_mode_regs because it is
577 not defined for all classes. */
578 && HARD_REGNO_MODE_OK (hard_regno, PSEUDO_REGNO_MODE (regno))
579 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
580 && (nregs_diff == 0
581 || (WORDS_BIG_ENDIAN
582 ? (hard_regno - nregs_diff >= 0
583 && TEST_HARD_REG_BIT (reg_class_contents[rclass],
584 hard_regno - nregs_diff))
585 : TEST_HARD_REG_BIT (reg_class_contents[rclass],
586 hard_regno + nregs_diff))))
588 if (hard_regno_costs_check[hard_regno]
589 != curr_hard_regno_costs_check)
591 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
592 hard_regno_costs[hard_regno] = 0;
594 for (j = 0;
595 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
596 j++)
597 if (! TEST_HARD_REG_BIT (call_used_reg_set, hard_regno + j)
598 && ! df_regs_ever_live_p (hard_regno + j))
599 /* It needs save restore. */
600 hard_regno_costs[hard_regno]
601 += 2 * ENTRY_BLOCK_PTR->next_bb->frequency + 1;
602 priority = targetm.register_priority (hard_regno);
603 if (best_hard_regno < 0 || hard_regno_costs[hard_regno] < best_cost
604 || (hard_regno_costs[hard_regno] == best_cost
605 && (priority > best_priority
606 || (targetm.register_usage_leveling_p ()
607 && priority == best_priority
608 && best_usage > lra_hard_reg_usage[hard_regno]))))
610 best_hard_regno = hard_regno;
611 best_cost = hard_regno_costs[hard_regno];
612 best_priority = priority;
613 best_usage = lra_hard_reg_usage[hard_regno];
616 if (try_only_hard_regno >= 0)
617 break;
619 if (best_hard_regno >= 0)
620 *cost = best_cost - lra_reg_info[regno].freq;
621 return best_hard_regno;
624 /* Current value used for checking elements in
625 update_hard_regno_preference_check. */
626 static int curr_update_hard_regno_preference_check;
627 /* If an element value is equal to the above variable value, then the
628 corresponding regno has been processed for preference
629 propagation. */
630 static int *update_hard_regno_preference_check;
632 /* Update the preference for using HARD_REGNO for pseudos that are
633 connected directly or indirectly with REGNO. Apply divisor DIV
634 to any preference adjustments.
636 The more indirectly a pseudo is connected, the smaller its effect
637 should be. We therefore increase DIV on each "hop". */
638 static void
639 update_hard_regno_preference (int regno, int hard_regno, int div)
641 int another_regno, cost;
642 lra_copy_t cp, next_cp;
644 /* Search depth 5 seems to be enough. */
645 if (div > (1 << 5))
646 return;
647 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
649 if (cp->regno1 == regno)
651 next_cp = cp->regno1_next;
652 another_regno = cp->regno2;
654 else if (cp->regno2 == regno)
656 next_cp = cp->regno2_next;
657 another_regno = cp->regno1;
659 else
660 gcc_unreachable ();
661 if (reg_renumber[another_regno] < 0
662 && (update_hard_regno_preference_check[another_regno]
663 != curr_update_hard_regno_preference_check))
665 update_hard_regno_preference_check[another_regno]
666 = curr_update_hard_regno_preference_check;
667 cost = cp->freq < div ? 1 : cp->freq / div;
668 lra_setup_reload_pseudo_preferenced_hard_reg
669 (another_regno, hard_regno, cost);
670 update_hard_regno_preference (another_regno, hard_regno, div * 2);
675 /* Return prefix title for pseudo REGNO. */
676 static const char *
677 pseudo_prefix_title (int regno)
679 return
680 (regno < lra_constraint_new_regno_start ? ""
681 : bitmap_bit_p (&lra_inheritance_pseudos, regno) ? "inheritance "
682 : bitmap_bit_p (&lra_split_regs, regno) ? "split "
683 : bitmap_bit_p (&lra_optional_reload_pseudos, regno) ? "optional reload "
684 : bitmap_bit_p (&lra_subreg_reload_pseudos, regno) ? "subreg reload "
685 : "reload ");
688 /* Update REG_RENUMBER and other pseudo preferences by assignment of
689 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
690 void
691 lra_setup_reg_renumber (int regno, int hard_regno, bool print_p)
693 int i, hr;
695 /* We can not just reassign hard register. */
696 lra_assert (hard_regno < 0 || reg_renumber[regno] < 0);
697 if ((hr = hard_regno) < 0)
698 hr = reg_renumber[regno];
699 reg_renumber[regno] = hard_regno;
700 lra_assert (hr >= 0);
701 for (i = 0; i < hard_regno_nregs[hr][PSEUDO_REGNO_MODE (regno)]; i++)
702 if (hard_regno < 0)
703 lra_hard_reg_usage[hr + i] -= lra_reg_info[regno].freq;
704 else
705 lra_hard_reg_usage[hr + i] += lra_reg_info[regno].freq;
706 if (print_p && lra_dump_file != NULL)
707 fprintf (lra_dump_file, " Assign %d to %sr%d (freq=%d)\n",
708 reg_renumber[regno], pseudo_prefix_title (regno),
709 regno, lra_reg_info[regno].freq);
710 if (hard_regno >= 0)
712 curr_update_hard_regno_preference_check++;
713 update_hard_regno_preference (regno, hard_regno, 1);
717 /* Pseudos which occur in insns containing a particular pseudo. */
718 static bitmap_head insn_conflict_pseudos;
720 /* Bitmaps used to contain spill pseudos for given pseudo hard regno
721 and best spill pseudos for given pseudo (and best hard regno). */
722 static bitmap_head spill_pseudos_bitmap, best_spill_pseudos_bitmap;
724 /* Current pseudo check for validity of elements in
725 TRY_HARD_REG_PSEUDOS. */
726 static int curr_pseudo_check;
727 /* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
728 static int try_hard_reg_pseudos_check[FIRST_PSEUDO_REGISTER];
729 /* Pseudos who hold given hard register at the considered points. */
730 static bitmap_head try_hard_reg_pseudos[FIRST_PSEUDO_REGISTER];
732 /* Set up try_hard_reg_pseudos for given program point P and class
733 RCLASS. Those are pseudos living at P and assigned to a hard
734 register of RCLASS. In other words, those are pseudos which can be
735 spilled to assign a hard register of RCLASS to a pseudo living at
736 P. */
737 static void
738 setup_try_hard_regno_pseudos (int p, enum reg_class rclass)
740 int i, hard_regno;
741 enum machine_mode mode;
742 unsigned int spill_regno;
743 bitmap_iterator bi;
745 /* Find what pseudos could be spilled. */
746 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[p], 0, spill_regno, bi)
748 mode = PSEUDO_REGNO_MODE (spill_regno);
749 hard_regno = live_pseudos_reg_renumber[spill_regno];
750 if (overlaps_hard_reg_set_p (reg_class_contents[rclass],
751 mode, hard_regno))
753 for (i = hard_regno_nregs[hard_regno][mode] - 1; i >= 0; i--)
755 if (try_hard_reg_pseudos_check[hard_regno + i]
756 != curr_pseudo_check)
758 try_hard_reg_pseudos_check[hard_regno + i]
759 = curr_pseudo_check;
760 bitmap_clear (&try_hard_reg_pseudos[hard_regno + i]);
762 bitmap_set_bit (&try_hard_reg_pseudos[hard_regno + i],
763 spill_regno);
769 /* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
770 assignment means that we might undo the data change. */
771 static void
772 assign_temporarily (int regno, int hard_regno)
774 int p;
775 lra_live_range_t r;
777 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
779 for (p = r->start; p <= r->finish; p++)
780 if (hard_regno < 0)
781 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
782 else
784 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
785 insert_in_live_range_start_chain (regno);
788 live_pseudos_reg_renumber[regno] = hard_regno;
791 /* Array used for sorting reload pseudos for subsequent allocation
792 after spilling some pseudo. */
793 static int *sorted_reload_pseudos;
795 /* Spill some pseudos for a reload pseudo REGNO and return hard
796 register which should be used for pseudo after spilling. The
797 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
798 choose hard register (and pseudos occupying the hard registers and
799 to be spilled), we take into account not only how REGNO will
800 benefit from the spills but also how other reload pseudos not yet
801 assigned to hard registers benefit from the spills too. In very
802 rare cases, the function can fail and return -1. */
803 static int
804 spill_for (int regno, bitmap spilled_pseudo_bitmap)
806 int i, j, n, p, hard_regno, best_hard_regno, cost, best_cost, rclass_size;
807 int reload_hard_regno, reload_cost;
808 enum machine_mode mode;
809 enum reg_class rclass;
810 unsigned int spill_regno, reload_regno, uid;
811 int insn_pseudos_num, best_insn_pseudos_num;
812 lra_live_range_t r;
813 bitmap_iterator bi;
815 rclass = regno_allocno_class_array[regno];
816 lra_assert (reg_renumber[regno] < 0 && rclass != NO_REGS);
817 bitmap_clear (&insn_conflict_pseudos);
818 bitmap_clear (&best_spill_pseudos_bitmap);
819 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
821 struct lra_insn_reg *ir;
823 for (ir = lra_get_insn_regs (uid); ir != NULL; ir = ir->next)
824 if (ir->regno >= FIRST_PSEUDO_REGISTER)
825 bitmap_set_bit (&insn_conflict_pseudos, ir->regno);
827 best_hard_regno = -1;
828 best_cost = INT_MAX;
829 best_insn_pseudos_num = INT_MAX;
830 rclass_size = ira_class_hard_regs_num[rclass];
831 mode = PSEUDO_REGNO_MODE (regno);
832 /* Invalidate try_hard_reg_pseudos elements. */
833 curr_pseudo_check++;
834 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
835 for (p = r->start; p <= r->finish; p++)
836 setup_try_hard_regno_pseudos (p, rclass);
837 for (i = 0; i < rclass_size; i++)
839 hard_regno = ira_class_hard_regs[rclass][i];
840 bitmap_clear (&spill_pseudos_bitmap);
841 for (j = hard_regno_nregs[hard_regno][mode] - 1; j >= 0; j--)
843 if (try_hard_reg_pseudos_check[hard_regno + j] != curr_pseudo_check)
844 continue;
845 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos[hard_regno + j]));
846 bitmap_ior_into (&spill_pseudos_bitmap,
847 &try_hard_reg_pseudos[hard_regno + j]);
849 /* Spill pseudos. */
850 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
851 if ((int) spill_regno >= lra_constraint_new_regno_start
852 && ! bitmap_bit_p (&lra_inheritance_pseudos, spill_regno)
853 && ! bitmap_bit_p (&lra_split_regs, spill_regno)
854 && ! bitmap_bit_p (&lra_subreg_reload_pseudos, spill_regno)
855 && ! bitmap_bit_p (&lra_optional_reload_pseudos, spill_regno))
856 goto fail;
857 insn_pseudos_num = 0;
858 if (lra_dump_file != NULL)
859 fprintf (lra_dump_file, " Trying %d:", hard_regno);
860 sparseset_clear (live_range_reload_inheritance_pseudos);
861 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
863 if (bitmap_bit_p (&insn_conflict_pseudos, spill_regno))
864 insn_pseudos_num++;
865 for (r = lra_reg_info[spill_regno].live_ranges;
866 r != NULL;
867 r = r->next)
869 for (p = r->start; p <= r->finish; p++)
871 lra_live_range_t r2;
873 for (r2 = start_point_ranges[p];
874 r2 != NULL;
875 r2 = r2->start_next)
876 if (r2->regno >= lra_constraint_new_regno_start)
877 sparseset_set_bit (live_range_reload_inheritance_pseudos,
878 r2->regno);
882 n = 0;
883 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos,
884 reload_regno)
885 if ((int) reload_regno != regno
886 && (ira_reg_classes_intersect_p
887 [rclass][regno_allocno_class_array[reload_regno]])
888 && live_pseudos_reg_renumber[reload_regno] < 0
889 && find_hard_regno_for (reload_regno, &cost, -1) < 0)
890 sorted_reload_pseudos[n++] = reload_regno;
891 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
893 update_lives (spill_regno, true);
894 if (lra_dump_file != NULL)
895 fprintf (lra_dump_file, " spill %d(freq=%d)",
896 spill_regno, lra_reg_info[spill_regno].freq);
898 hard_regno = find_hard_regno_for (regno, &cost, -1);
899 if (hard_regno >= 0)
901 assign_temporarily (regno, hard_regno);
902 qsort (sorted_reload_pseudos, n, sizeof (int),
903 reload_pseudo_compare_func);
904 for (j = 0; j < n; j++)
906 reload_regno = sorted_reload_pseudos[j];
907 lra_assert (live_pseudos_reg_renumber[reload_regno] < 0);
908 if ((reload_hard_regno
909 = find_hard_regno_for (reload_regno,
910 &reload_cost, -1)) >= 0)
912 if (lra_dump_file != NULL)
913 fprintf (lra_dump_file, " assign %d(cost=%d)",
914 reload_regno, reload_cost);
915 assign_temporarily (reload_regno, reload_hard_regno);
916 cost += reload_cost;
919 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
921 rtx x;
923 cost += lra_reg_info[spill_regno].freq;
924 if (ira_reg_equiv[spill_regno].memory != NULL
925 || ira_reg_equiv[spill_regno].constant != NULL)
926 for (x = ira_reg_equiv[spill_regno].init_insns;
927 x != NULL;
928 x = XEXP (x, 1))
929 cost -= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (XEXP (x, 0)));
931 if (best_insn_pseudos_num > insn_pseudos_num
932 || (best_insn_pseudos_num == insn_pseudos_num
933 && best_cost > cost))
935 best_insn_pseudos_num = insn_pseudos_num;
936 best_cost = cost;
937 best_hard_regno = hard_regno;
938 bitmap_copy (&best_spill_pseudos_bitmap, &spill_pseudos_bitmap);
939 if (lra_dump_file != NULL)
940 fprintf (lra_dump_file, " Now best %d(cost=%d)\n",
941 hard_regno, cost);
943 assign_temporarily (regno, -1);
944 for (j = 0; j < n; j++)
946 reload_regno = sorted_reload_pseudos[j];
947 if (live_pseudos_reg_renumber[reload_regno] >= 0)
948 assign_temporarily (reload_regno, -1);
951 if (lra_dump_file != NULL)
952 fprintf (lra_dump_file, "\n");
953 /* Restore the live hard reg pseudo info for spilled pseudos. */
954 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
955 update_lives (spill_regno, false);
956 fail:
959 /* Spill: */
960 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap, 0, spill_regno, bi)
962 if (lra_dump_file != NULL)
963 fprintf (lra_dump_file, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
964 pseudo_prefix_title (spill_regno),
965 spill_regno, reg_renumber[spill_regno],
966 lra_reg_info[spill_regno].freq, regno);
967 update_lives (spill_regno, true);
968 lra_setup_reg_renumber (spill_regno, -1, false);
970 bitmap_ior_into (spilled_pseudo_bitmap, &best_spill_pseudos_bitmap);
971 return best_hard_regno;
974 /* Assign HARD_REGNO to REGNO. */
975 static void
976 assign_hard_regno (int hard_regno, int regno)
978 int i;
980 lra_assert (hard_regno >= 0);
981 lra_setup_reg_renumber (regno, hard_regno, true);
982 update_lives (regno, false);
983 for (i = 0;
984 i < hard_regno_nregs[hard_regno][lra_reg_info[regno].biggest_mode];
985 i++)
986 df_set_regs_ever_live (hard_regno + i, true);
989 /* Array used for sorting different pseudos. */
990 static int *sorted_pseudos;
992 /* The constraints pass is allowed to create equivalences between
993 pseudos that make the current allocation "incorrect" (in the sense
994 that pseudos are assigned to hard registers from their own conflict
995 sets). The global variable lra_risky_transformations_p says
996 whether this might have happened.
998 Process pseudos assigned to hard registers (less frequently used
999 first), spill if a conflict is found, and mark the spilled pseudos
1000 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1001 pseudos, assigned to hard registers. */
1002 static void
1003 setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1004 spilled_pseudo_bitmap)
1006 int p, i, j, n, regno, hard_regno;
1007 unsigned int k, conflict_regno;
1008 int val, offset;
1009 HARD_REG_SET conflict_set;
1010 enum machine_mode mode;
1011 lra_live_range_t r;
1012 bitmap_iterator bi;
1013 int max_regno = max_reg_num ();
1015 if (! lra_risky_transformations_p)
1017 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1018 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1019 update_lives (i, false);
1020 return;
1022 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1023 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1024 sorted_pseudos[n++] = i;
1025 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1026 for (i = n - 1; i >= 0; i--)
1028 regno = sorted_pseudos[i];
1029 hard_regno = reg_renumber[regno];
1030 lra_assert (hard_regno >= 0);
1031 mode = lra_reg_info[regno].biggest_mode;
1032 sparseset_clear (live_range_hard_reg_pseudos);
1033 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1035 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1036 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1037 for (p = r->start + 1; p <= r->finish; p++)
1039 lra_live_range_t r2;
1041 for (r2 = start_point_ranges[p];
1042 r2 != NULL;
1043 r2 = r2->start_next)
1044 if (live_pseudos_reg_renumber[r2->regno] >= 0)
1045 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1048 COPY_HARD_REG_SET (conflict_set, lra_no_alloc_regs);
1049 IOR_HARD_REG_SET (conflict_set, lra_reg_info[regno].conflict_hard_regs);
1050 val = lra_reg_info[regno].val;
1051 offset = lra_reg_info[regno].offset;
1052 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1053 if (!lra_reg_val_equal_p (conflict_regno, val, offset)
1054 /* If it is multi-register pseudos they should start on
1055 the same hard register. */
1056 || hard_regno != reg_renumber[conflict_regno])
1057 add_to_hard_reg_set (&conflict_set,
1058 lra_reg_info[conflict_regno].biggest_mode,
1059 reg_renumber[conflict_regno]);
1060 if (! overlaps_hard_reg_set_p (conflict_set, mode, hard_regno))
1062 update_lives (regno, false);
1063 continue;
1065 bitmap_set_bit (spilled_pseudo_bitmap, regno);
1066 for (j = 0;
1067 j < hard_regno_nregs[hard_regno][PSEUDO_REGNO_MODE (regno)];
1068 j++)
1069 lra_hard_reg_usage[hard_regno + j] -= lra_reg_info[regno].freq;
1070 reg_renumber[regno] = -1;
1071 if (lra_dump_file != NULL)
1072 fprintf (lra_dump_file, " Spill r%d after risky transformations\n",
1073 regno);
1077 /* Improve allocation by assigning the same hard regno of inheritance
1078 pseudos to the connected pseudos. We need this because inheritance
1079 pseudos are allocated after reload pseudos in the thread and when
1080 we assign a hard register to a reload pseudo we don't know yet that
1081 the connected inheritance pseudos can get the same hard register.
1082 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1083 static void
1084 improve_inheritance (bitmap changed_pseudos)
1086 unsigned int k;
1087 int regno, another_regno, hard_regno, another_hard_regno, cost, i, n;
1088 lra_copy_t cp, next_cp;
1089 bitmap_iterator bi;
1091 if (lra_inheritance_iter > LRA_MAX_INHERITANCE_PASSES)
1092 return;
1093 n = 0;
1094 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, k, bi)
1095 if (reg_renumber[k] >= 0 && lra_reg_info[k].nrefs != 0)
1096 sorted_pseudos[n++] = k;
1097 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1098 for (i = 0; i < n; i++)
1100 regno = sorted_pseudos[i];
1101 hard_regno = reg_renumber[regno];
1102 lra_assert (hard_regno >= 0);
1103 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
1105 if (cp->regno1 == regno)
1107 next_cp = cp->regno1_next;
1108 another_regno = cp->regno2;
1110 else if (cp->regno2 == regno)
1112 next_cp = cp->regno2_next;
1113 another_regno = cp->regno1;
1115 else
1116 gcc_unreachable ();
1117 /* Don't change reload pseudo allocation. It might have
1118 this allocation for a purpose and changing it can result
1119 in LRA cycling. */
1120 if ((another_regno < lra_constraint_new_regno_start
1121 || bitmap_bit_p (&lra_inheritance_pseudos, another_regno))
1122 && (another_hard_regno = reg_renumber[another_regno]) >= 0
1123 && another_hard_regno != hard_regno)
1125 if (lra_dump_file != NULL)
1126 fprintf
1127 (lra_dump_file,
1128 " Improving inheritance for %d(%d) and %d(%d)...\n",
1129 regno, hard_regno, another_regno, another_hard_regno);
1130 update_lives (another_regno, true);
1131 lra_setup_reg_renumber (another_regno, -1, false);
1132 if (hard_regno
1133 == find_hard_regno_for (another_regno, &cost, hard_regno))
1134 assign_hard_regno (hard_regno, another_regno);
1135 else
1136 assign_hard_regno (another_hard_regno, another_regno);
1137 bitmap_set_bit (changed_pseudos, another_regno);
1144 /* Bitmap finally containing all pseudos spilled on this assignment
1145 pass. */
1146 static bitmap_head all_spilled_pseudos;
1147 /* All pseudos whose allocation was changed. */
1148 static bitmap_head changed_pseudo_bitmap;
1150 /* Assign hard registers to reload pseudos and other pseudos. */
1151 static void
1152 assign_by_spills (void)
1154 int i, n, nfails, iter, regno, hard_regno, cost, restore_regno;
1155 rtx insn;
1156 basic_block bb;
1157 bitmap_head changed_insns, do_not_assign_nonreload_pseudos;
1158 bitmap_head non_reload_pseudos;
1159 unsigned int u;
1160 bitmap_iterator bi;
1161 bool reload_p;
1162 int max_regno = max_reg_num ();
1164 for (n = 0, i = lra_constraint_new_regno_start; i < max_regno; i++)
1165 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1166 && regno_allocno_class_array[i] != NO_REGS)
1167 sorted_pseudos[n++] = i;
1168 bitmap_initialize (&insn_conflict_pseudos, &reg_obstack);
1169 bitmap_initialize (&spill_pseudos_bitmap, &reg_obstack);
1170 bitmap_initialize (&best_spill_pseudos_bitmap, &reg_obstack);
1171 update_hard_regno_preference_check = XCNEWVEC (int, max_regno);
1172 curr_update_hard_regno_preference_check = 0;
1173 memset (try_hard_reg_pseudos_check, 0, sizeof (try_hard_reg_pseudos_check));
1174 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1175 bitmap_initialize (&try_hard_reg_pseudos[i], &reg_obstack);
1176 curr_pseudo_check = 0;
1177 bitmap_initialize (&changed_insns, &reg_obstack);
1178 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1179 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
1180 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
1181 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
1182 for (iter = 0; iter <= 1; iter++)
1184 qsort (sorted_pseudos, n, sizeof (int), reload_pseudo_compare_func);
1185 nfails = 0;
1186 for (i = 0; i < n; i++)
1188 regno = sorted_pseudos[i];
1189 if (lra_dump_file != NULL)
1190 fprintf (lra_dump_file, " Assigning to %d "
1191 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1192 regno, reg_class_names[regno_allocno_class_array[regno]],
1193 ORIGINAL_REGNO (regno_reg_rtx[regno]),
1194 lra_reg_info[regno].freq, regno_assign_info[regno].first,
1195 regno_assign_info[regno_assign_info[regno].first].freq);
1196 hard_regno = find_hard_regno_for (regno, &cost, -1);
1197 reload_p = ! bitmap_bit_p (&non_reload_pseudos, regno);
1198 if (hard_regno < 0 && reload_p)
1199 hard_regno = spill_for (regno, &all_spilled_pseudos);
1200 if (hard_regno < 0)
1202 if (reload_p)
1203 sorted_pseudos[nfails++] = regno;
1205 else
1207 /* This register might have been spilled by the previous
1208 pass. Indicate that it is no longer spilled. */
1209 bitmap_clear_bit (&all_spilled_pseudos, regno);
1210 assign_hard_regno (hard_regno, regno);
1211 if (! reload_p)
1212 /* As non-reload pseudo assignment is changed we
1213 should reconsider insns referring for the
1214 pseudo. */
1215 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1218 if (nfails == 0)
1219 break;
1220 if (iter > 0)
1222 /* We did not assign hard regs to reload pseudos after two
1223 iteration. It means something is wrong with asm insn
1224 constraints. Report it. */
1225 bool asm_p = false;
1226 bitmap_head failed_reload_insns;
1228 bitmap_initialize (&failed_reload_insns, &reg_obstack);
1229 for (i = 0; i < nfails; i++)
1231 regno = sorted_pseudos[i];
1232 bitmap_ior_into (&failed_reload_insns,
1233 &lra_reg_info[regno].insn_bitmap);
1234 /* Assign an arbitrary hard register of regno class to
1235 avoid further trouble with the asm insns. */
1236 bitmap_clear_bit (&all_spilled_pseudos, regno);
1237 assign_hard_regno
1238 (ira_class_hard_regs[regno_allocno_class_array[regno]][0],
1239 regno);
1241 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns, 0, u, bi)
1243 insn = lra_insn_recog_data[u]->insn;
1244 if (asm_noperands (PATTERN (insn)) >= 0)
1246 asm_p = true;
1247 error_for_asm (insn,
1248 "%<asm%> operand has impossible constraints");
1249 /* Avoid further trouble with this insn.
1250 For asm goto, instead of fixing up all the edges
1251 just clear the template and clear input operands
1252 (asm goto doesn't have any output operands). */
1253 if (JUMP_P (insn))
1255 rtx asm_op = extract_asm_operands (PATTERN (insn));
1256 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1257 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1258 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1259 lra_update_insn_regno_info (insn);
1261 else
1263 PATTERN (insn) = gen_rtx_USE (VOIDmode, const0_rtx);
1264 lra_set_insn_deleted (insn);
1268 lra_assert (asm_p);
1269 break;
1271 /* This is a very rare event. We can not assign a hard
1272 register to reload pseudo because the hard register was
1273 assigned to another reload pseudo on a previous
1274 assignment pass. For x86 example, on the 1st pass we
1275 assigned CX (although another hard register could be used
1276 for this) to reload pseudo in an insn, on the 2nd pass we
1277 need CX (and only this) hard register for a new reload
1278 pseudo in the same insn. */
1279 if (lra_dump_file != NULL)
1280 fprintf (lra_dump_file, " 2nd iter for reload pseudo assignments:\n");
1281 for (i = 0; i < nfails; i++)
1283 if (lra_dump_file != NULL)
1284 fprintf (lra_dump_file, " Reload r%d assignment failure\n",
1285 sorted_pseudos[i]);
1286 bitmap_ior_into (&changed_insns,
1287 &lra_reg_info[sorted_pseudos[i]].insn_bitmap);
1290 /* FIXME: Look up the changed insns in the cached LRA insn data using
1291 an EXECUTE_IF_SET_IN_BITMAP over changed_insns. */
1292 FOR_EACH_BB (bb)
1293 FOR_BB_INSNS (bb, insn)
1294 if (bitmap_bit_p (&changed_insns, INSN_UID (insn)))
1296 lra_insn_recog_data_t data;
1297 struct lra_insn_reg *r;
1299 data = lra_get_insn_recog_data (insn);
1300 for (r = data->regs; r != NULL; r = r->next)
1302 regno = r->regno;
1303 /* A reload pseudo did not get a hard register on the
1304 first iteration because of the conflict with
1305 another reload pseudos in the same insn. So we
1306 consider only reload pseudos assigned to hard
1307 registers. We shall exclude inheritance pseudos as
1308 they can occur in original insns (not reload ones).
1309 We can omit the check for split pseudos because
1310 they occur only in move insns containing non-reload
1311 pseudos. */
1312 if (regno < lra_constraint_new_regno_start
1313 || bitmap_bit_p (&lra_inheritance_pseudos, regno)
1314 || reg_renumber[regno] < 0)
1315 continue;
1316 sorted_pseudos[nfails++] = regno;
1317 if (lra_dump_file != NULL)
1318 fprintf (lra_dump_file,
1319 " Spill reload r%d(hr=%d, freq=%d)\n",
1320 regno, reg_renumber[regno],
1321 lra_reg_info[regno].freq);
1322 update_lives (regno, true);
1323 lra_setup_reg_renumber (regno, -1, false);
1326 n = nfails;
1328 improve_inheritance (&changed_pseudo_bitmap);
1329 bitmap_clear (&non_reload_pseudos);
1330 bitmap_clear (&changed_insns);
1331 if (! lra_simple_p)
1333 /* We should not assign to original pseudos of inheritance
1334 pseudos or split pseudos if any its inheritance pseudo did
1335 not get hard register or any its split pseudo was not split
1336 because undo inheritance/split pass will extend live range of
1337 such inheritance or split pseudos. */
1338 bitmap_initialize (&do_not_assign_nonreload_pseudos, &reg_obstack);
1339 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, u, bi)
1340 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1341 && reg_renumber[u] < 0
1342 && bitmap_bit_p (&lra_inheritance_pseudos, u))
1343 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1344 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs, 0, u, bi)
1345 if ((restore_regno = lra_reg_info[u].restore_regno) >= 0
1346 && reg_renumber[u] >= 0)
1347 bitmap_set_bit (&do_not_assign_nonreload_pseudos, restore_regno);
1348 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1349 if (((i < lra_constraint_new_regno_start
1350 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos, i))
1351 || (bitmap_bit_p (&lra_inheritance_pseudos, i)
1352 && lra_reg_info[i].restore_regno >= 0)
1353 || (bitmap_bit_p (&lra_split_regs, i)
1354 && lra_reg_info[i].restore_regno >= 0)
1355 || bitmap_bit_p (&lra_subreg_reload_pseudos, i)
1356 || bitmap_bit_p (&lra_optional_reload_pseudos, i))
1357 && reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1358 && regno_allocno_class_array[i] != NO_REGS)
1359 sorted_pseudos[n++] = i;
1360 bitmap_clear (&do_not_assign_nonreload_pseudos);
1361 if (n != 0 && lra_dump_file != NULL)
1362 fprintf (lra_dump_file, " Reassigning non-reload pseudos\n");
1363 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1364 for (i = 0; i < n; i++)
1366 regno = sorted_pseudos[i];
1367 hard_regno = find_hard_regno_for (regno, &cost, -1);
1368 if (hard_regno >= 0)
1370 assign_hard_regno (hard_regno, regno);
1371 /* We change allocation for non-reload pseudo on this
1372 iteration -- mark the pseudo for invalidation of used
1373 alternatives of insns containing the pseudo. */
1374 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1378 free (update_hard_regno_preference_check);
1379 bitmap_clear (&best_spill_pseudos_bitmap);
1380 bitmap_clear (&spill_pseudos_bitmap);
1381 bitmap_clear (&insn_conflict_pseudos);
1385 /* Entry function to assign hard registers to new reload pseudos
1386 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1387 of old pseudos) and possibly to the old pseudos. The function adds
1388 what insns to process for the next constraint pass. Those are all
1389 insns who contains non-reload and non-inheritance pseudos with
1390 changed allocation.
1392 Return true if we did not spill any non-reload and non-inheritance
1393 pseudos. */
1394 bool
1395 lra_assign (void)
1397 int i;
1398 unsigned int u;
1399 bitmap_iterator bi;
1400 bitmap_head insns_to_process;
1401 bool no_spills_p;
1402 int max_regno = max_reg_num ();
1404 timevar_push (TV_LRA_ASSIGN);
1405 init_lives ();
1406 sorted_pseudos = XNEWVEC (int, max_regno);
1407 sorted_reload_pseudos = XNEWVEC (int, max_regno);
1408 regno_allocno_class_array = XNEWVEC (enum reg_class, max_regno);
1409 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1410 regno_allocno_class_array[i] = lra_get_allocno_class (i);
1411 init_regno_assign_info ();
1412 bitmap_initialize (&all_spilled_pseudos, &reg_obstack);
1413 create_live_range_start_chains ();
1414 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos);
1415 #ifdef ENABLE_CHECKING
1416 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1417 if (lra_reg_info[i].nrefs != 0 && reg_renumber[i] >= 0
1418 && lra_reg_info[i].call_p
1419 && overlaps_hard_reg_set_p (call_used_reg_set,
1420 PSEUDO_REGNO_MODE (i), reg_renumber[i]))
1421 gcc_unreachable ();
1422 #endif
1423 /* Setup insns to process on the next constraint pass. */
1424 bitmap_initialize (&changed_pseudo_bitmap, &reg_obstack);
1425 init_live_reload_and_inheritance_pseudos ();
1426 assign_by_spills ();
1427 finish_live_reload_and_inheritance_pseudos ();
1428 bitmap_ior_into (&changed_pseudo_bitmap, &all_spilled_pseudos);
1429 no_spills_p = true;
1430 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos, 0, u, bi)
1431 /* We ignore spilled pseudos created on last inheritance pass
1432 because they will be removed. */
1433 if (lra_reg_info[u].restore_regno < 0)
1435 no_spills_p = false;
1436 break;
1438 finish_live_range_start_chains ();
1439 bitmap_clear (&all_spilled_pseudos);
1440 bitmap_initialize (&insns_to_process, &reg_obstack);
1441 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap, 0, u, bi)
1442 bitmap_ior_into (&insns_to_process, &lra_reg_info[u].insn_bitmap);
1443 bitmap_clear (&changed_pseudo_bitmap);
1444 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process, 0, u, bi)
1446 lra_push_insn_by_uid (u);
1447 /* Invalidate alternatives for insn should be processed. */
1448 lra_set_used_insn_alternative_by_uid (u, -1);
1450 bitmap_clear (&insns_to_process);
1451 finish_regno_assign_info ();
1452 free (regno_allocno_class_array);
1453 free (sorted_pseudos);
1454 free (sorted_reload_pseudos);
1455 finish_lives ();
1456 timevar_pop (TV_LRA_ASSIGN);
1457 return no_spills_p;