1 /* Decompose multiword subregs.
2 Copyright (C) 2007-2013 Free Software Foundation, Inc.
3 Contributed by Richard Henderson <rth@redhat.com>
4 Ian Lance Taylor <iant@google.com>
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 3, or (at your option) any later
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
24 #include "coretypes.h"
30 #include "insn-config.h"
32 #include "basic-block.h"
39 #include "tree-pass.h"
41 #include "lower-subreg.h"
43 #ifdef STACK_GROWS_DOWNWARD
44 # undef STACK_GROWS_DOWNWARD
45 # define STACK_GROWS_DOWNWARD 1
47 # define STACK_GROWS_DOWNWARD 0
51 /* Decompose multi-word pseudo-registers into individual
52 pseudo-registers when possible and profitable. This is possible
53 when all the uses of a multi-word register are via SUBREG, or are
54 copies of the register to another location. Breaking apart the
55 register permits more CSE and permits better register allocation.
56 This is profitable if the machine does not have move instructions
59 This pass only splits moves with modes that are wider than
60 word_mode and ASHIFTs, LSHIFTRTs, ASHIFTRTs and ZERO_EXTENDs with
61 integer modes that are twice the width of word_mode. The latter
62 could be generalized if there was a need to do this, but the trend in
63 architectures is to not need this.
65 There are two useful preprocessor defines for use by maintainers:
69 if you wish to see the actual cost estimates that are being used
70 for each mode wider than word mode and the cost estimates for zero
71 extension and the shifts. This can be useful when port maintainers
72 are tuning insn rtx costs.
74 #define FORCE_LOWERING 1
76 if you wish to test the pass with all the transformation forced on.
77 This can be useful for finding bugs in the transformations. */
80 #define FORCE_LOWERING 0
82 /* Bit N in this bitmap is set if regno N is used in a context in
83 which we can decompose it. */
84 static bitmap decomposable_context
;
86 /* Bit N in this bitmap is set if regno N is used in a context in
87 which it can not be decomposed. */
88 static bitmap non_decomposable_context
;
90 /* Bit N in this bitmap is set if regno N is used in a subreg
91 which changes the mode but not the size. This typically happens
92 when the register is accessed as a floating-point value; we want to
93 avoid generating accesses to its subwords in integer modes. */
94 static bitmap subreg_context
;
96 /* Bit N in the bitmap in element M of this array is set if there is a
97 copy from reg M to reg N. */
98 static vec
<bitmap
> reg_copy_graph
;
100 struct target_lower_subreg default_target_lower_subreg
;
101 #if SWITCHABLE_TARGET
102 struct target_lower_subreg
*this_target_lower_subreg
103 = &default_target_lower_subreg
;
106 #define twice_word_mode \
107 this_target_lower_subreg->x_twice_word_mode
109 this_target_lower_subreg->x_choices
111 /* RTXes used while computing costs. */
113 /* Source and target registers. */
117 /* A twice_word_mode ZERO_EXTEND of SOURCE. */
120 /* A shift of SOURCE. */
123 /* A SET of TARGET. */
127 /* Return the cost of a CODE shift in mode MODE by OP1 bits, using the
128 rtxes in RTXES. SPEED_P selects between the speed and size cost. */
131 shift_cost (bool speed_p
, struct cost_rtxes
*rtxes
, enum rtx_code code
,
132 enum machine_mode mode
, int op1
)
134 PUT_CODE (rtxes
->shift
, code
);
135 PUT_MODE (rtxes
->shift
, mode
);
136 PUT_MODE (rtxes
->source
, mode
);
137 XEXP (rtxes
->shift
, 1) = GEN_INT (op1
);
138 return set_src_cost (rtxes
->shift
, speed_p
);
141 /* For each X in the range [0, BITS_PER_WORD), set SPLITTING[X]
142 to true if it is profitable to split a double-word CODE shift
143 of X + BITS_PER_WORD bits. SPEED_P says whether we are testing
144 for speed or size profitability.
146 Use the rtxes in RTXES to calculate costs. WORD_MOVE_ZERO_COST is
147 the cost of moving zero into a word-mode register. WORD_MOVE_COST
148 is the cost of moving between word registers. */
151 compute_splitting_shift (bool speed_p
, struct cost_rtxes
*rtxes
,
152 bool *splitting
, enum rtx_code code
,
153 int word_move_zero_cost
, int word_move_cost
)
155 int wide_cost
, narrow_cost
, upper_cost
, i
;
157 for (i
= 0; i
< BITS_PER_WORD
; i
++)
159 wide_cost
= shift_cost (speed_p
, rtxes
, code
, twice_word_mode
,
162 narrow_cost
= word_move_cost
;
164 narrow_cost
= shift_cost (speed_p
, rtxes
, code
, word_mode
, i
);
166 if (code
!= ASHIFTRT
)
167 upper_cost
= word_move_zero_cost
;
168 else if (i
== BITS_PER_WORD
- 1)
169 upper_cost
= word_move_cost
;
171 upper_cost
= shift_cost (speed_p
, rtxes
, code
, word_mode
,
175 fprintf (stderr
, "%s %s by %d: original cost %d, split cost %d + %d\n",
176 GET_MODE_NAME (twice_word_mode
), GET_RTX_NAME (code
),
177 i
+ BITS_PER_WORD
, wide_cost
, narrow_cost
, upper_cost
);
179 if (FORCE_LOWERING
|| wide_cost
>= narrow_cost
+ upper_cost
)
184 /* Compute what we should do when optimizing for speed or size; SPEED_P
185 selects which. Use RTXES for computing costs. */
188 compute_costs (bool speed_p
, struct cost_rtxes
*rtxes
)
191 int word_move_zero_cost
, word_move_cost
;
193 PUT_MODE (rtxes
->target
, word_mode
);
194 SET_SRC (rtxes
->set
) = CONST0_RTX (word_mode
);
195 word_move_zero_cost
= set_rtx_cost (rtxes
->set
, speed_p
);
197 SET_SRC (rtxes
->set
) = rtxes
->source
;
198 word_move_cost
= set_rtx_cost (rtxes
->set
, speed_p
);
201 fprintf (stderr
, "%s move: from zero cost %d, from reg cost %d\n",
202 GET_MODE_NAME (word_mode
), word_move_zero_cost
, word_move_cost
);
204 for (i
= 0; i
< MAX_MACHINE_MODE
; i
++)
206 enum machine_mode mode
= (enum machine_mode
) i
;
207 int factor
= GET_MODE_SIZE (mode
) / UNITS_PER_WORD
;
212 PUT_MODE (rtxes
->target
, mode
);
213 PUT_MODE (rtxes
->source
, mode
);
214 mode_move_cost
= set_rtx_cost (rtxes
->set
, speed_p
);
217 fprintf (stderr
, "%s move: original cost %d, split cost %d * %d\n",
218 GET_MODE_NAME (mode
), mode_move_cost
,
219 word_move_cost
, factor
);
221 if (FORCE_LOWERING
|| mode_move_cost
>= word_move_cost
* factor
)
223 choices
[speed_p
].move_modes_to_split
[i
] = true;
224 choices
[speed_p
].something_to_do
= true;
229 /* For the moves and shifts, the only case that is checked is one
230 where the mode of the target is an integer mode twice the width
233 If it is not profitable to split a double word move then do not
234 even consider the shifts or the zero extension. */
235 if (choices
[speed_p
].move_modes_to_split
[(int) twice_word_mode
])
239 /* The only case to check here is whether moving the upper part with a
240 zero is cheaper than doing the zext itself. */
241 PUT_MODE (rtxes
->source
, word_mode
);
242 zext_cost
= set_src_cost (rtxes
->zext
, speed_p
);
245 fprintf (stderr
, "%s %s: original cost %d, split cost %d + %d\n",
246 GET_MODE_NAME (twice_word_mode
), GET_RTX_NAME (ZERO_EXTEND
),
247 zext_cost
, word_move_cost
, word_move_zero_cost
);
249 if (FORCE_LOWERING
|| zext_cost
>= word_move_cost
+ word_move_zero_cost
)
250 choices
[speed_p
].splitting_zext
= true;
252 compute_splitting_shift (speed_p
, rtxes
,
253 choices
[speed_p
].splitting_ashift
, ASHIFT
,
254 word_move_zero_cost
, word_move_cost
);
255 compute_splitting_shift (speed_p
, rtxes
,
256 choices
[speed_p
].splitting_lshiftrt
, LSHIFTRT
,
257 word_move_zero_cost
, word_move_cost
);
258 compute_splitting_shift (speed_p
, rtxes
,
259 choices
[speed_p
].splitting_ashiftrt
, ASHIFTRT
,
260 word_move_zero_cost
, word_move_cost
);
264 /* Do once-per-target initialisation. This involves determining
265 which operations on the machine are profitable. If none are found,
266 then the pass just returns when called. */
269 init_lower_subreg (void)
271 struct cost_rtxes rtxes
;
273 memset (this_target_lower_subreg
, 0, sizeof (*this_target_lower_subreg
));
275 twice_word_mode
= GET_MODE_2XWIDER_MODE (word_mode
);
277 rtxes
.target
= gen_rtx_REG (word_mode
, FIRST_PSEUDO_REGISTER
);
278 rtxes
.source
= gen_rtx_REG (word_mode
, FIRST_PSEUDO_REGISTER
+ 1);
279 rtxes
.set
= gen_rtx_SET (VOIDmode
, rtxes
.target
, rtxes
.source
);
280 rtxes
.zext
= gen_rtx_ZERO_EXTEND (twice_word_mode
, rtxes
.source
);
281 rtxes
.shift
= gen_rtx_ASHIFT (twice_word_mode
, rtxes
.source
, const0_rtx
);
284 fprintf (stderr
, "\nSize costs\n==========\n\n");
285 compute_costs (false, &rtxes
);
288 fprintf (stderr
, "\nSpeed costs\n===========\n\n");
289 compute_costs (true, &rtxes
);
293 simple_move_operand (rtx x
)
295 if (GET_CODE (x
) == SUBREG
)
301 if (GET_CODE (x
) == LABEL_REF
302 || GET_CODE (x
) == SYMBOL_REF
303 || GET_CODE (x
) == HIGH
304 || GET_CODE (x
) == CONST
)
308 && (MEM_VOLATILE_P (x
)
309 || mode_dependent_address_p (XEXP (x
, 0), MEM_ADDR_SPACE (x
))))
315 /* If INSN is a single set between two objects that we want to split,
316 return the single set. SPEED_P says whether we are optimizing
317 INSN for speed or size.
319 INSN should have been passed to recog and extract_insn before this
323 simple_move (rtx insn
, bool speed_p
)
327 enum machine_mode mode
;
329 if (recog_data
.n_operands
!= 2)
332 set
= single_set (insn
);
337 if (x
!= recog_data
.operand
[0] && x
!= recog_data
.operand
[1])
339 if (!simple_move_operand (x
))
343 if (x
!= recog_data
.operand
[0] && x
!= recog_data
.operand
[1])
345 /* For the src we can handle ASM_OPERANDS, and it is beneficial for
346 things like x86 rdtsc which returns a DImode value. */
347 if (GET_CODE (x
) != ASM_OPERANDS
348 && !simple_move_operand (x
))
351 /* We try to decompose in integer modes, to avoid generating
352 inefficient code copying between integer and floating point
353 registers. That means that we can't decompose if this is a
354 non-integer mode for which there is no integer mode of the same
356 mode
= GET_MODE (SET_DEST (set
));
357 if (!SCALAR_INT_MODE_P (mode
)
358 && (mode_for_size (GET_MODE_SIZE (mode
) * BITS_PER_UNIT
, MODE_INT
, 0)
362 /* Reject PARTIAL_INT modes. They are used for processor specific
363 purposes and it's probably best not to tamper with them. */
364 if (GET_MODE_CLASS (mode
) == MODE_PARTIAL_INT
)
367 if (!choices
[speed_p
].move_modes_to_split
[(int) mode
])
373 /* If SET is a copy from one multi-word pseudo-register to another,
374 record that in reg_copy_graph. Return whether it is such a
378 find_pseudo_copy (rtx set
)
380 rtx dest
= SET_DEST (set
);
381 rtx src
= SET_SRC (set
);
385 if (!REG_P (dest
) || !REG_P (src
))
390 if (HARD_REGISTER_NUM_P (rd
) || HARD_REGISTER_NUM_P (rs
))
393 b
= reg_copy_graph
[rs
];
396 b
= BITMAP_ALLOC (NULL
);
397 reg_copy_graph
[rs
] = b
;
400 bitmap_set_bit (b
, rd
);
405 /* Look through the registers in DECOMPOSABLE_CONTEXT. For each case
406 where they are copied to another register, add the register to
407 which they are copied to DECOMPOSABLE_CONTEXT. Use
408 NON_DECOMPOSABLE_CONTEXT to limit this--we don't bother to track
409 copies of registers which are in NON_DECOMPOSABLE_CONTEXT. */
412 propagate_pseudo_copies (void)
414 bitmap queue
, propagate
;
416 queue
= BITMAP_ALLOC (NULL
);
417 propagate
= BITMAP_ALLOC (NULL
);
419 bitmap_copy (queue
, decomposable_context
);
422 bitmap_iterator iter
;
425 bitmap_clear (propagate
);
427 EXECUTE_IF_SET_IN_BITMAP (queue
, 0, i
, iter
)
429 bitmap b
= reg_copy_graph
[i
];
431 bitmap_ior_and_compl_into (propagate
, b
, non_decomposable_context
);
434 bitmap_and_compl (queue
, propagate
, decomposable_context
);
435 bitmap_ior_into (decomposable_context
, propagate
);
437 while (!bitmap_empty_p (queue
));
440 BITMAP_FREE (propagate
);
443 /* A pointer to one of these values is passed to
444 find_decomposable_subregs via for_each_rtx. */
446 enum classify_move_insn
448 /* Not a simple move from one location to another. */
450 /* A simple move we want to decompose. */
451 DECOMPOSABLE_SIMPLE_MOVE
,
452 /* Any other simple move. */
456 /* This is called via for_each_rtx. If we find a SUBREG which we
457 could use to decompose a pseudo-register, set a bit in
458 DECOMPOSABLE_CONTEXT. If we find an unadorned register which is
459 not a simple pseudo-register copy, DATA will point at the type of
460 move, and we set a bit in DECOMPOSABLE_CONTEXT or
461 NON_DECOMPOSABLE_CONTEXT as appropriate. */
464 find_decomposable_subregs (rtx
*px
, void *data
)
466 enum classify_move_insn
*pcmi
= (enum classify_move_insn
*) data
;
472 if (GET_CODE (x
) == SUBREG
)
474 rtx inner
= SUBREG_REG (x
);
475 unsigned int regno
, outer_size
, inner_size
, outer_words
, inner_words
;
480 regno
= REGNO (inner
);
481 if (HARD_REGISTER_NUM_P (regno
))
484 outer_size
= GET_MODE_SIZE (GET_MODE (x
));
485 inner_size
= GET_MODE_SIZE (GET_MODE (inner
));
486 outer_words
= (outer_size
+ UNITS_PER_WORD
- 1) / UNITS_PER_WORD
;
487 inner_words
= (inner_size
+ UNITS_PER_WORD
- 1) / UNITS_PER_WORD
;
489 /* We only try to decompose single word subregs of multi-word
490 registers. When we find one, we return -1 to avoid iterating
491 over the inner register.
493 ??? This doesn't allow, e.g., DImode subregs of TImode values
494 on 32-bit targets. We would need to record the way the
495 pseudo-register was used, and only decompose if all the uses
496 were the same number and size of pieces. Hopefully this
497 doesn't happen much. */
499 if (outer_words
== 1 && inner_words
> 1)
501 bitmap_set_bit (decomposable_context
, regno
);
505 /* If this is a cast from one mode to another, where the modes
506 have the same size, and they are not tieable, then mark this
507 register as non-decomposable. If we decompose it we are
508 likely to mess up whatever the backend is trying to do. */
510 && outer_size
== inner_size
511 && !MODES_TIEABLE_P (GET_MODE (x
), GET_MODE (inner
)))
513 bitmap_set_bit (non_decomposable_context
, regno
);
514 bitmap_set_bit (subreg_context
, regno
);
522 /* We will see an outer SUBREG before we see the inner REG, so
523 when we see a plain REG here it means a direct reference to
526 If this is not a simple copy from one location to another,
527 then we can not decompose this register. If this is a simple
528 copy we want to decompose, and the mode is right,
529 then we mark the register as decomposable.
530 Otherwise we don't say anything about this register --
531 it could be decomposed, but whether that would be
532 profitable depends upon how it is used elsewhere.
534 We only set bits in the bitmap for multi-word
535 pseudo-registers, since those are the only ones we care about
536 and it keeps the size of the bitmaps down. */
539 if (!HARD_REGISTER_NUM_P (regno
)
540 && GET_MODE_SIZE (GET_MODE (x
)) > UNITS_PER_WORD
)
544 case NOT_SIMPLE_MOVE
:
545 bitmap_set_bit (non_decomposable_context
, regno
);
547 case DECOMPOSABLE_SIMPLE_MOVE
:
548 if (MODES_TIEABLE_P (GET_MODE (x
), word_mode
))
549 bitmap_set_bit (decomposable_context
, regno
);
560 enum classify_move_insn cmi_mem
= NOT_SIMPLE_MOVE
;
562 /* Any registers used in a MEM do not participate in a
563 SIMPLE_MOVE or DECOMPOSABLE_SIMPLE_MOVE. Do our own recursion
564 here, and return -1 to block the parent's recursion. */
565 for_each_rtx (&XEXP (x
, 0), find_decomposable_subregs
, &cmi_mem
);
572 /* Decompose REGNO into word-sized components. We smash the REG node
573 in place. This ensures that (1) something goes wrong quickly if we
574 fail to make some replacement, and (2) the debug information inside
575 the symbol table is automatically kept up to date. */
578 decompose_register (unsigned int regno
)
581 unsigned int words
, i
;
584 reg
= regno_reg_rtx
[regno
];
586 regno_reg_rtx
[regno
] = NULL_RTX
;
588 words
= GET_MODE_SIZE (GET_MODE (reg
));
589 words
= (words
+ UNITS_PER_WORD
- 1) / UNITS_PER_WORD
;
591 v
= rtvec_alloc (words
);
592 for (i
= 0; i
< words
; ++i
)
593 RTVEC_ELT (v
, i
) = gen_reg_rtx_offset (reg
, word_mode
, i
* UNITS_PER_WORD
);
595 PUT_CODE (reg
, CONCATN
);
600 fprintf (dump_file
, "; Splitting reg %u ->", regno
);
601 for (i
= 0; i
< words
; ++i
)
602 fprintf (dump_file
, " %u", REGNO (XVECEXP (reg
, 0, i
)));
603 fputc ('\n', dump_file
);
607 /* Get a SUBREG of a CONCATN. */
610 simplify_subreg_concatn (enum machine_mode outermode
, rtx op
,
613 unsigned int inner_size
;
614 enum machine_mode innermode
, partmode
;
616 unsigned int final_offset
;
618 gcc_assert (GET_CODE (op
) == CONCATN
);
619 gcc_assert (byte
% GET_MODE_SIZE (outermode
) == 0);
621 innermode
= GET_MODE (op
);
622 gcc_assert (byte
< GET_MODE_SIZE (innermode
));
623 gcc_assert (GET_MODE_SIZE (outermode
) <= GET_MODE_SIZE (innermode
));
625 inner_size
= GET_MODE_SIZE (innermode
) / XVECLEN (op
, 0);
626 part
= XVECEXP (op
, 0, byte
/ inner_size
);
627 partmode
= GET_MODE (part
);
629 /* VECTOR_CSTs in debug expressions are expanded into CONCATN instead of
630 regular CONST_VECTORs. They have vector or integer modes, depending
631 on the capabilities of the target. Cope with them. */
632 if (partmode
== VOIDmode
&& VECTOR_MODE_P (innermode
))
633 partmode
= GET_MODE_INNER (innermode
);
634 else if (partmode
== VOIDmode
)
636 enum mode_class mclass
= GET_MODE_CLASS (innermode
);
637 partmode
= mode_for_size (inner_size
* BITS_PER_UNIT
, mclass
, 0);
640 final_offset
= byte
% inner_size
;
641 if (final_offset
+ GET_MODE_SIZE (outermode
) > inner_size
)
644 return simplify_gen_subreg (outermode
, part
, partmode
, final_offset
);
647 /* Wrapper around simplify_gen_subreg which handles CONCATN. */
650 simplify_gen_subreg_concatn (enum machine_mode outermode
, rtx op
,
651 enum machine_mode innermode
, unsigned int byte
)
655 /* We have to handle generating a SUBREG of a SUBREG of a CONCATN.
656 If OP is a SUBREG of a CONCATN, then it must be a simple mode
657 change with the same size and offset 0, or it must extract a
658 part. We shouldn't see anything else here. */
659 if (GET_CODE (op
) == SUBREG
&& GET_CODE (SUBREG_REG (op
)) == CONCATN
)
663 if ((GET_MODE_SIZE (GET_MODE (op
))
664 == GET_MODE_SIZE (GET_MODE (SUBREG_REG (op
))))
665 && SUBREG_BYTE (op
) == 0)
666 return simplify_gen_subreg_concatn (outermode
, SUBREG_REG (op
),
667 GET_MODE (SUBREG_REG (op
)), byte
);
669 op2
= simplify_subreg_concatn (GET_MODE (op
), SUBREG_REG (op
),
673 /* We don't handle paradoxical subregs here. */
674 gcc_assert (GET_MODE_SIZE (outermode
)
675 <= GET_MODE_SIZE (GET_MODE (op
)));
676 gcc_assert (GET_MODE_SIZE (GET_MODE (op
))
677 <= GET_MODE_SIZE (GET_MODE (SUBREG_REG (op
))));
678 op2
= simplify_subreg_concatn (outermode
, SUBREG_REG (op
),
679 byte
+ SUBREG_BYTE (op
));
680 gcc_assert (op2
!= NULL_RTX
);
685 gcc_assert (op
!= NULL_RTX
);
686 gcc_assert (innermode
== GET_MODE (op
));
689 if (GET_CODE (op
) == CONCATN
)
690 return simplify_subreg_concatn (outermode
, op
, byte
);
692 ret
= simplify_gen_subreg (outermode
, op
, innermode
, byte
);
694 /* If we see an insn like (set (reg:DI) (subreg:DI (reg:SI) 0)) then
695 resolve_simple_move will ask for the high part of the paradoxical
696 subreg, which does not have a value. Just return a zero. */
698 && GET_CODE (op
) == SUBREG
699 && SUBREG_BYTE (op
) == 0
700 && (GET_MODE_SIZE (innermode
)
701 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op
)))))
702 return CONST0_RTX (outermode
);
704 gcc_assert (ret
!= NULL_RTX
);
708 /* Return whether we should resolve X into the registers into which it
712 resolve_reg_p (rtx x
)
714 return GET_CODE (x
) == CONCATN
;
717 /* Return whether X is a SUBREG of a register which we need to
721 resolve_subreg_p (rtx x
)
723 if (GET_CODE (x
) != SUBREG
)
725 return resolve_reg_p (SUBREG_REG (x
));
728 /* This is called via for_each_rtx. Look for SUBREGs which need to be
732 resolve_subreg_use (rtx
*px
, void *data
)
734 rtx insn
= (rtx
) data
;
740 if (resolve_subreg_p (x
))
742 x
= simplify_subreg_concatn (GET_MODE (x
), SUBREG_REG (x
),
745 /* It is possible for a note to contain a reference which we can
746 decompose. In this case, return 1 to the caller to indicate
747 that the note must be removed. */
754 validate_change (insn
, px
, x
, 1);
758 if (resolve_reg_p (x
))
760 /* Return 1 to the caller to indicate that we found a direct
761 reference to a register which is being decomposed. This can
762 happen inside notes, multiword shift or zero-extend
770 /* This is called via for_each_rtx. Look for SUBREGs which can be
771 decomposed and decomposed REGs that need copying. */
774 adjust_decomposed_uses (rtx
*px
, void *data ATTRIBUTE_UNUSED
)
781 if (resolve_subreg_p (x
))
783 x
= simplify_subreg_concatn (GET_MODE (x
), SUBREG_REG (x
),
792 if (resolve_reg_p (x
))
798 /* Resolve any decomposed registers which appear in register notes on
802 resolve_reg_notes (rtx insn
)
806 note
= find_reg_equal_equiv_note (insn
);
809 int old_count
= num_validated_changes ();
810 if (for_each_rtx (&XEXP (note
, 0), resolve_subreg_use
, NULL
))
811 remove_note (insn
, note
);
813 if (old_count
!= num_validated_changes ())
814 df_notes_rescan (insn
);
817 pnote
= ®_NOTES (insn
);
818 while (*pnote
!= NULL_RTX
)
823 switch (REG_NOTE_KIND (note
))
827 if (resolve_reg_p (XEXP (note
, 0)))
836 *pnote
= XEXP (note
, 1);
838 pnote
= &XEXP (note
, 1);
842 /* Return whether X can be decomposed into subwords. */
845 can_decompose_p (rtx x
)
849 unsigned int regno
= REGNO (x
);
851 if (HARD_REGISTER_NUM_P (regno
))
853 unsigned int byte
, num_bytes
;
855 num_bytes
= GET_MODE_SIZE (GET_MODE (x
));
856 for (byte
= 0; byte
< num_bytes
; byte
+= UNITS_PER_WORD
)
857 if (simplify_subreg_regno (regno
, GET_MODE (x
), byte
, word_mode
) < 0)
862 return !bitmap_bit_p (subreg_context
, regno
);
868 /* Decompose the registers used in a simple move SET within INSN. If
869 we don't change anything, return INSN, otherwise return the start
870 of the sequence of moves. */
873 resolve_simple_move (rtx set
, rtx insn
)
875 rtx src
, dest
, real_dest
, insns
;
876 enum machine_mode orig_mode
, dest_mode
;
881 dest
= SET_DEST (set
);
882 orig_mode
= GET_MODE (dest
);
884 words
= (GET_MODE_SIZE (orig_mode
) + UNITS_PER_WORD
- 1) / UNITS_PER_WORD
;
885 gcc_assert (words
> 1);
889 /* We have to handle copying from a SUBREG of a decomposed reg where
890 the SUBREG is larger than word size. Rather than assume that we
891 can take a word_mode SUBREG of the destination, we copy to a new
892 register and then copy that to the destination. */
894 real_dest
= NULL_RTX
;
896 if (GET_CODE (src
) == SUBREG
897 && resolve_reg_p (SUBREG_REG (src
))
898 && (SUBREG_BYTE (src
) != 0
899 || (GET_MODE_SIZE (orig_mode
)
900 != GET_MODE_SIZE (GET_MODE (SUBREG_REG (src
))))))
903 dest
= gen_reg_rtx (orig_mode
);
904 if (REG_P (real_dest
))
905 REG_ATTRS (dest
) = REG_ATTRS (real_dest
);
908 /* Similarly if we are copying to a SUBREG of a decomposed reg where
909 the SUBREG is larger than word size. */
911 if (GET_CODE (dest
) == SUBREG
912 && resolve_reg_p (SUBREG_REG (dest
))
913 && (SUBREG_BYTE (dest
) != 0
914 || (GET_MODE_SIZE (orig_mode
)
915 != GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest
))))))
917 rtx reg
, minsn
, smove
;
919 reg
= gen_reg_rtx (orig_mode
);
920 minsn
= emit_move_insn (reg
, src
);
921 smove
= single_set (minsn
);
922 gcc_assert (smove
!= NULL_RTX
);
923 resolve_simple_move (smove
, minsn
);
927 /* If we didn't have any big SUBREGS of decomposed registers, and
928 neither side of the move is a register we are decomposing, then
929 we don't have to do anything here. */
931 if (src
== SET_SRC (set
)
932 && dest
== SET_DEST (set
)
933 && !resolve_reg_p (src
)
934 && !resolve_subreg_p (src
)
935 && !resolve_reg_p (dest
)
936 && !resolve_subreg_p (dest
))
942 /* It's possible for the code to use a subreg of a decomposed
943 register while forming an address. We need to handle that before
944 passing the address to emit_move_insn. We pass NULL_RTX as the
945 insn parameter to resolve_subreg_use because we can not validate
947 if (MEM_P (src
) || MEM_P (dest
))
952 for_each_rtx (&XEXP (src
, 0), resolve_subreg_use
, NULL_RTX
);
954 for_each_rtx (&XEXP (dest
, 0), resolve_subreg_use
, NULL_RTX
);
955 acg
= apply_change_group ();
959 /* If SRC is a register which we can't decompose, or has side
960 effects, we need to move via a temporary register. */
962 if (!can_decompose_p (src
)
963 || side_effects_p (src
)
964 || GET_CODE (src
) == ASM_OPERANDS
)
968 reg
= gen_reg_rtx (orig_mode
);
969 emit_move_insn (reg
, src
);
973 /* If DEST is a register which we can't decompose, or has side
974 effects, we need to first move to a temporary register. We
975 handle the common case of pushing an operand directly. We also
976 go through a temporary register if it holds a floating point
977 value. This gives us better code on systems which can't move
978 data easily between integer and floating point registers. */
980 dest_mode
= orig_mode
;
981 pushing
= push_operand (dest
, dest_mode
);
982 if (!can_decompose_p (dest
)
983 || (side_effects_p (dest
) && !pushing
)
984 || (!SCALAR_INT_MODE_P (dest_mode
)
985 && !resolve_reg_p (dest
)
986 && !resolve_subreg_p (dest
)))
988 if (real_dest
== NULL_RTX
)
990 if (!SCALAR_INT_MODE_P (dest_mode
))
992 dest_mode
= mode_for_size (GET_MODE_SIZE (dest_mode
) * BITS_PER_UNIT
,
994 gcc_assert (dest_mode
!= BLKmode
);
996 dest
= gen_reg_rtx (dest_mode
);
997 if (REG_P (real_dest
))
998 REG_ATTRS (dest
) = REG_ATTRS (real_dest
);
1003 unsigned int i
, j
, jinc
;
1005 gcc_assert (GET_MODE_SIZE (orig_mode
) % UNITS_PER_WORD
== 0);
1006 gcc_assert (GET_CODE (XEXP (dest
, 0)) != PRE_MODIFY
);
1007 gcc_assert (GET_CODE (XEXP (dest
, 0)) != POST_MODIFY
);
1009 if (WORDS_BIG_ENDIAN
== STACK_GROWS_DOWNWARD
)
1020 for (i
= 0; i
< words
; ++i
, j
+= jinc
)
1024 temp
= copy_rtx (XEXP (dest
, 0));
1025 temp
= adjust_automodify_address_nv (dest
, word_mode
, temp
,
1026 j
* UNITS_PER_WORD
);
1027 emit_move_insn (temp
,
1028 simplify_gen_subreg_concatn (word_mode
, src
,
1030 j
* UNITS_PER_WORD
));
1037 if (REG_P (dest
) && !HARD_REGISTER_NUM_P (REGNO (dest
)))
1038 emit_clobber (dest
);
1040 for (i
= 0; i
< words
; ++i
)
1041 emit_move_insn (simplify_gen_subreg_concatn (word_mode
, dest
,
1043 i
* UNITS_PER_WORD
),
1044 simplify_gen_subreg_concatn (word_mode
, src
,
1046 i
* UNITS_PER_WORD
));
1049 if (real_dest
!= NULL_RTX
)
1051 rtx mdest
, minsn
, smove
;
1053 if (dest_mode
== orig_mode
)
1056 mdest
= simplify_gen_subreg (orig_mode
, dest
, GET_MODE (dest
), 0);
1057 minsn
= emit_move_insn (real_dest
, mdest
);
1059 smove
= single_set (minsn
);
1060 gcc_assert (smove
!= NULL_RTX
);
1062 resolve_simple_move (smove
, minsn
);
1065 insns
= get_insns ();
1068 copy_reg_eh_region_note_forward (insn
, insns
, NULL_RTX
);
1070 emit_insn_before (insns
, insn
);
1072 /* If we get here via self-recursion, then INSN is not yet in the insns
1073 chain and delete_insn will fail. We only want to remove INSN from the
1074 current sequence. See PR56738. */
1075 if (in_sequence_p ())
1083 /* Change a CLOBBER of a decomposed register into a CLOBBER of the
1084 component registers. Return whether we changed something. */
1087 resolve_clobber (rtx pat
, rtx insn
)
1090 enum machine_mode orig_mode
;
1091 unsigned int words
, i
;
1094 reg
= XEXP (pat
, 0);
1095 if (!resolve_reg_p (reg
) && !resolve_subreg_p (reg
))
1098 orig_mode
= GET_MODE (reg
);
1099 words
= GET_MODE_SIZE (orig_mode
);
1100 words
= (words
+ UNITS_PER_WORD
- 1) / UNITS_PER_WORD
;
1102 ret
= validate_change (NULL_RTX
, &XEXP (pat
, 0),
1103 simplify_gen_subreg_concatn (word_mode
, reg
,
1106 df_insn_rescan (insn
);
1107 gcc_assert (ret
!= 0);
1109 for (i
= words
- 1; i
> 0; --i
)
1113 x
= simplify_gen_subreg_concatn (word_mode
, reg
, orig_mode
,
1114 i
* UNITS_PER_WORD
);
1115 x
= gen_rtx_CLOBBER (VOIDmode
, x
);
1116 emit_insn_after (x
, insn
);
1119 resolve_reg_notes (insn
);
1124 /* A USE of a decomposed register is no longer meaningful. Return
1125 whether we changed something. */
1128 resolve_use (rtx pat
, rtx insn
)
1130 if (resolve_reg_p (XEXP (pat
, 0)) || resolve_subreg_p (XEXP (pat
, 0)))
1136 resolve_reg_notes (insn
);
1141 /* A VAR_LOCATION can be simplified. */
1144 resolve_debug (rtx insn
)
1146 for_each_rtx (&PATTERN (insn
), adjust_decomposed_uses
, NULL_RTX
);
1148 df_insn_rescan (insn
);
1150 resolve_reg_notes (insn
);
1153 /* Check if INSN is a decomposable multiword-shift or zero-extend and
1154 set the decomposable_context bitmap accordingly. SPEED_P is true
1155 if we are optimizing INSN for speed rather than size. Return true
1156 if INSN is decomposable. */
1159 find_decomposable_shift_zext (rtx insn
, bool speed_p
)
1165 set
= single_set (insn
);
1170 if (GET_CODE (op
) != ASHIFT
1171 && GET_CODE (op
) != LSHIFTRT
1172 && GET_CODE (op
) != ASHIFTRT
1173 && GET_CODE (op
) != ZERO_EXTEND
)
1176 op_operand
= XEXP (op
, 0);
1177 if (!REG_P (SET_DEST (set
)) || !REG_P (op_operand
)
1178 || HARD_REGISTER_NUM_P (REGNO (SET_DEST (set
)))
1179 || HARD_REGISTER_NUM_P (REGNO (op_operand
))
1180 || GET_MODE (op
) != twice_word_mode
)
1183 if (GET_CODE (op
) == ZERO_EXTEND
)
1185 if (GET_MODE (op_operand
) != word_mode
1186 || !choices
[speed_p
].splitting_zext
)
1189 else /* left or right shift */
1191 bool *splitting
= (GET_CODE (op
) == ASHIFT
1192 ? choices
[speed_p
].splitting_ashift
1193 : GET_CODE (op
) == ASHIFTRT
1194 ? choices
[speed_p
].splitting_ashiftrt
1195 : choices
[speed_p
].splitting_lshiftrt
);
1196 if (!CONST_INT_P (XEXP (op
, 1))
1197 || !IN_RANGE (INTVAL (XEXP (op
, 1)), BITS_PER_WORD
,
1198 2 * BITS_PER_WORD
- 1)
1199 || !splitting
[INTVAL (XEXP (op
, 1)) - BITS_PER_WORD
])
1202 bitmap_set_bit (decomposable_context
, REGNO (op_operand
));
1205 bitmap_set_bit (decomposable_context
, REGNO (SET_DEST (set
)));
1210 /* Decompose a more than word wide shift (in INSN) of a multiword
1211 pseudo or a multiword zero-extend of a wordmode pseudo into a move
1212 and 'set to zero' insn. Return a pointer to the new insn when a
1213 replacement was done. */
1216 resolve_shift_zext (rtx insn
)
1222 rtx src_reg
, dest_reg
, dest_upper
, upper_src
= NULL_RTX
;
1223 int src_reg_num
, dest_reg_num
, offset1
, offset2
, src_offset
;
1225 set
= single_set (insn
);
1230 if (GET_CODE (op
) != ASHIFT
1231 && GET_CODE (op
) != LSHIFTRT
1232 && GET_CODE (op
) != ASHIFTRT
1233 && GET_CODE (op
) != ZERO_EXTEND
)
1236 op_operand
= XEXP (op
, 0);
1238 /* We can tear this operation apart only if the regs were already
1240 if (!resolve_reg_p (SET_DEST (set
)) && !resolve_reg_p (op_operand
))
1243 /* src_reg_num is the number of the word mode register which we
1244 are operating on. For a left shift and a zero_extend on little
1245 endian machines this is register 0. */
1246 src_reg_num
= (GET_CODE (op
) == LSHIFTRT
|| GET_CODE (op
) == ASHIFTRT
)
1249 if (WORDS_BIG_ENDIAN
1250 && GET_MODE_SIZE (GET_MODE (op_operand
)) > UNITS_PER_WORD
)
1251 src_reg_num
= 1 - src_reg_num
;
1253 if (GET_CODE (op
) == ZERO_EXTEND
)
1254 dest_reg_num
= WORDS_BIG_ENDIAN
? 1 : 0;
1256 dest_reg_num
= 1 - src_reg_num
;
1258 offset1
= UNITS_PER_WORD
* dest_reg_num
;
1259 offset2
= UNITS_PER_WORD
* (1 - dest_reg_num
);
1260 src_offset
= UNITS_PER_WORD
* src_reg_num
;
1264 dest_reg
= simplify_gen_subreg_concatn (word_mode
, SET_DEST (set
),
1265 GET_MODE (SET_DEST (set
)),
1267 dest_upper
= simplify_gen_subreg_concatn (word_mode
, SET_DEST (set
),
1268 GET_MODE (SET_DEST (set
)),
1270 src_reg
= simplify_gen_subreg_concatn (word_mode
, op_operand
,
1271 GET_MODE (op_operand
),
1273 if (GET_CODE (op
) == ASHIFTRT
1274 && INTVAL (XEXP (op
, 1)) != 2 * BITS_PER_WORD
- 1)
1275 upper_src
= expand_shift (RSHIFT_EXPR
, word_mode
, copy_rtx (src_reg
),
1276 BITS_PER_WORD
- 1, NULL_RTX
, 0);
1278 if (GET_CODE (op
) != ZERO_EXTEND
)
1280 int shift_count
= INTVAL (XEXP (op
, 1));
1281 if (shift_count
> BITS_PER_WORD
)
1282 src_reg
= expand_shift (GET_CODE (op
) == ASHIFT
?
1283 LSHIFT_EXPR
: RSHIFT_EXPR
,
1285 shift_count
- BITS_PER_WORD
,
1286 dest_reg
, GET_CODE (op
) != ASHIFTRT
);
1289 if (dest_reg
!= src_reg
)
1290 emit_move_insn (dest_reg
, src_reg
);
1291 if (GET_CODE (op
) != ASHIFTRT
)
1292 emit_move_insn (dest_upper
, CONST0_RTX (word_mode
));
1293 else if (INTVAL (XEXP (op
, 1)) == 2 * BITS_PER_WORD
- 1)
1294 emit_move_insn (dest_upper
, copy_rtx (src_reg
));
1296 emit_move_insn (dest_upper
, upper_src
);
1297 insns
= get_insns ();
1301 emit_insn_before (insns
, insn
);
1306 fprintf (dump_file
, "; Replacing insn: %d with insns: ", INSN_UID (insn
));
1307 for (in
= insns
; in
!= insn
; in
= NEXT_INSN (in
))
1308 fprintf (dump_file
, "%d ", INSN_UID (in
));
1309 fprintf (dump_file
, "\n");
1316 /* Print to dump_file a description of what we're doing with shift code CODE.
1317 SPLITTING[X] is true if we are splitting shifts by X + BITS_PER_WORD. */
1320 dump_shift_choices (enum rtx_code code
, bool *splitting
)
1326 " Splitting mode %s for %s lowering with shift amounts = ",
1327 GET_MODE_NAME (twice_word_mode
), GET_RTX_NAME (code
));
1329 for (i
= 0; i
< BITS_PER_WORD
; i
++)
1332 fprintf (dump_file
, "%s%d", sep
, i
+ BITS_PER_WORD
);
1335 fprintf (dump_file
, "\n");
1338 /* Print to dump_file a description of what we're doing when optimizing
1339 for speed or size; SPEED_P says which. DESCRIPTION is a description
1340 of the SPEED_P choice. */
1343 dump_choices (bool speed_p
, const char *description
)
1347 fprintf (dump_file
, "Choices when optimizing for %s:\n", description
);
1349 for (i
= 0; i
< MAX_MACHINE_MODE
; i
++)
1350 if (GET_MODE_SIZE (i
) > UNITS_PER_WORD
)
1351 fprintf (dump_file
, " %s mode %s for copy lowering.\n",
1352 choices
[speed_p
].move_modes_to_split
[i
]
1355 GET_MODE_NAME ((enum machine_mode
) i
));
1357 fprintf (dump_file
, " %s mode %s for zero_extend lowering.\n",
1358 choices
[speed_p
].splitting_zext
? "Splitting" : "Skipping",
1359 GET_MODE_NAME (twice_word_mode
));
1361 dump_shift_choices (ASHIFT
, choices
[speed_p
].splitting_ashift
);
1362 dump_shift_choices (LSHIFTRT
, choices
[speed_p
].splitting_lshiftrt
);
1363 dump_shift_choices (ASHIFTRT
, choices
[speed_p
].splitting_ashiftrt
);
1364 fprintf (dump_file
, "\n");
1367 /* Look for registers which are always accessed via word-sized SUBREGs
1368 or -if DECOMPOSE_COPIES is true- via copies. Decompose these
1369 registers into several word-sized pseudo-registers. */
1372 decompose_multiword_subregs (bool decompose_copies
)
1380 dump_choices (false, "size");
1381 dump_choices (true, "speed");
1384 /* Check if this target even has any modes to consider lowering. */
1385 if (!choices
[false].something_to_do
&& !choices
[true].something_to_do
)
1388 fprintf (dump_file
, "Nothing to do!\n");
1392 max
= max_reg_num ();
1394 /* First see if there are any multi-word pseudo-registers. If there
1395 aren't, there is nothing we can do. This should speed up this
1396 pass in the normal case, since it should be faster than scanning
1400 bool useful_modes_seen
= false;
1402 for (i
= FIRST_PSEUDO_REGISTER
; i
< max
; ++i
)
1403 if (regno_reg_rtx
[i
] != NULL
)
1405 enum machine_mode mode
= GET_MODE (regno_reg_rtx
[i
]);
1406 if (choices
[false].move_modes_to_split
[(int) mode
]
1407 || choices
[true].move_modes_to_split
[(int) mode
])
1409 useful_modes_seen
= true;
1414 if (!useful_modes_seen
)
1417 fprintf (dump_file
, "Nothing to lower in this function.\n");
1424 df_set_flags (DF_DEFER_INSN_RESCAN
);
1428 /* FIXME: It may be possible to change this code to look for each
1429 multi-word pseudo-register and to find each insn which sets or
1430 uses that register. That should be faster than scanning all the
1433 decomposable_context
= BITMAP_ALLOC (NULL
);
1434 non_decomposable_context
= BITMAP_ALLOC (NULL
);
1435 subreg_context
= BITMAP_ALLOC (NULL
);
1437 reg_copy_graph
.create (max
);
1438 reg_copy_graph
.safe_grow_cleared (max
);
1439 memset (reg_copy_graph
.address (), 0, sizeof (bitmap
) * max
);
1441 speed_p
= optimize_function_for_speed_p (cfun
);
1446 FOR_BB_INSNS (bb
, insn
)
1449 enum classify_move_insn cmi
;
1453 || GET_CODE (PATTERN (insn
)) == CLOBBER
1454 || GET_CODE (PATTERN (insn
)) == USE
)
1457 recog_memoized (insn
);
1459 if (find_decomposable_shift_zext (insn
, speed_p
))
1462 extract_insn (insn
);
1464 set
= simple_move (insn
, speed_p
);
1467 cmi
= NOT_SIMPLE_MOVE
;
1470 /* We mark pseudo-to-pseudo copies as decomposable during the
1471 second pass only. The first pass is so early that there is
1472 good chance such moves will be optimized away completely by
1473 subsequent optimizations anyway.
1475 However, we call find_pseudo_copy even during the first pass
1476 so as to properly set up the reg_copy_graph. */
1477 if (find_pseudo_copy (set
))
1478 cmi
= decompose_copies
? DECOMPOSABLE_SIMPLE_MOVE
: SIMPLE_MOVE
;
1483 n
= recog_data
.n_operands
;
1484 for (i
= 0; i
< n
; ++i
)
1486 for_each_rtx (&recog_data
.operand
[i
],
1487 find_decomposable_subregs
,
1490 /* We handle ASM_OPERANDS as a special case to support
1491 things like x86 rdtsc which returns a DImode value.
1492 We can decompose the output, which will certainly be
1493 operand 0, but not the inputs. */
1495 if (cmi
== SIMPLE_MOVE
1496 && GET_CODE (SET_SRC (set
)) == ASM_OPERANDS
)
1498 gcc_assert (i
== 0);
1499 cmi
= NOT_SIMPLE_MOVE
;
1505 bitmap_and_compl_into (decomposable_context
, non_decomposable_context
);
1506 if (!bitmap_empty_p (decomposable_context
))
1510 sbitmap_iterator sbi
;
1511 bitmap_iterator iter
;
1514 propagate_pseudo_copies ();
1516 sub_blocks
= sbitmap_alloc (last_basic_block
);
1517 bitmap_clear (sub_blocks
);
1519 EXECUTE_IF_SET_IN_BITMAP (decomposable_context
, 0, regno
, iter
)
1520 decompose_register (regno
);
1526 FOR_BB_INSNS (bb
, insn
)
1533 pat
= PATTERN (insn
);
1534 if (GET_CODE (pat
) == CLOBBER
)
1535 resolve_clobber (pat
, insn
);
1536 else if (GET_CODE (pat
) == USE
)
1537 resolve_use (pat
, insn
);
1538 else if (DEBUG_INSN_P (insn
))
1539 resolve_debug (insn
);
1545 recog_memoized (insn
);
1546 extract_insn (insn
);
1548 set
= simple_move (insn
, speed_p
);
1551 rtx orig_insn
= insn
;
1552 bool cfi
= control_flow_insn_p (insn
);
1554 /* We can end up splitting loads to multi-word pseudos
1555 into separate loads to machine word size pseudos.
1556 When this happens, we first had one load that can
1557 throw, and after resolve_simple_move we'll have a
1558 bunch of loads (at least two). All those loads may
1559 trap if we can have non-call exceptions, so they
1560 all will end the current basic block. We split the
1561 block after the outer loop over all insns, but we
1562 make sure here that we will be able to split the
1563 basic block and still produce the correct control
1564 flow graph for it. */
1566 || (cfun
->can_throw_non_call_exceptions
1567 && can_throw_internal (insn
)));
1569 insn
= resolve_simple_move (set
, insn
);
1570 if (insn
!= orig_insn
)
1572 recog_memoized (insn
);
1573 extract_insn (insn
);
1576 bitmap_set_bit (sub_blocks
, bb
->index
);
1581 rtx decomposed_shift
;
1583 decomposed_shift
= resolve_shift_zext (insn
);
1584 if (decomposed_shift
!= NULL_RTX
)
1586 insn
= decomposed_shift
;
1587 recog_memoized (insn
);
1588 extract_insn (insn
);
1592 for (i
= recog_data
.n_operands
- 1; i
>= 0; --i
)
1593 for_each_rtx (recog_data
.operand_loc
[i
],
1597 resolve_reg_notes (insn
);
1599 if (num_validated_changes () > 0)
1601 for (i
= recog_data
.n_dups
- 1; i
>= 0; --i
)
1603 rtx
*pl
= recog_data
.dup_loc
[i
];
1604 int dup_num
= recog_data
.dup_num
[i
];
1605 rtx
*px
= recog_data
.operand_loc
[dup_num
];
1607 validate_unshare_change (insn
, pl
, *px
, 1);
1610 i
= apply_change_group ();
1617 /* If we had insns to split that caused control flow insns in the middle
1618 of a basic block, split those blocks now. Note that we only handle
1619 the case where splitting a load has caused multiple possibly trapping
1621 EXECUTE_IF_SET_IN_BITMAP (sub_blocks
, 0, i
, sbi
)
1626 bb
= BASIC_BLOCK (i
);
1627 insn
= BB_HEAD (bb
);
1632 if (control_flow_insn_p (insn
))
1634 /* Split the block after insn. There will be a fallthru
1635 edge, which is OK so we keep it. We have to create the
1636 exception edges ourselves. */
1637 fallthru
= split_block (bb
, insn
);
1638 rtl_make_eh_edge (NULL
, bb
, BB_END (bb
));
1639 bb
= fallthru
->dest
;
1640 insn
= BB_HEAD (bb
);
1643 insn
= NEXT_INSN (insn
);
1647 sbitmap_free (sub_blocks
);
1654 FOR_EACH_VEC_ELT (reg_copy_graph
, i
, b
)
1659 reg_copy_graph
.release ();
1661 BITMAP_FREE (decomposable_context
);
1662 BITMAP_FREE (non_decomposable_context
);
1663 BITMAP_FREE (subreg_context
);
1666 /* Gate function for lower subreg pass. */
1669 gate_handle_lower_subreg (void)
1671 return flag_split_wide_types
!= 0;
1674 /* Implement first lower subreg pass. */
1677 rest_of_handle_lower_subreg (void)
1679 decompose_multiword_subregs (false);
1683 /* Implement second lower subreg pass. */
1686 rest_of_handle_lower_subreg2 (void)
1688 decompose_multiword_subregs (true);
1694 const pass_data pass_data_lower_subreg
=
1696 RTL_PASS
, /* type */
1697 "subreg1", /* name */
1698 OPTGROUP_NONE
, /* optinfo_flags */
1699 true, /* has_gate */
1700 true, /* has_execute */
1701 TV_LOWER_SUBREG
, /* tv_id */
1702 0, /* properties_required */
1703 0, /* properties_provided */
1704 0, /* properties_destroyed */
1705 0, /* todo_flags_start */
1706 TODO_verify_flow
, /* todo_flags_finish */
1709 class pass_lower_subreg
: public rtl_opt_pass
1712 pass_lower_subreg (gcc::context
*ctxt
)
1713 : rtl_opt_pass (pass_data_lower_subreg
, ctxt
)
1716 /* opt_pass methods: */
1717 bool gate () { return gate_handle_lower_subreg (); }
1718 unsigned int execute () { return rest_of_handle_lower_subreg (); }
1720 }; // class pass_lower_subreg
1725 make_pass_lower_subreg (gcc::context
*ctxt
)
1727 return new pass_lower_subreg (ctxt
);
1732 const pass_data pass_data_lower_subreg2
=
1734 RTL_PASS
, /* type */
1735 "subreg2", /* name */
1736 OPTGROUP_NONE
, /* optinfo_flags */
1737 true, /* has_gate */
1738 true, /* has_execute */
1739 TV_LOWER_SUBREG
, /* tv_id */
1740 0, /* properties_required */
1741 0, /* properties_provided */
1742 0, /* properties_destroyed */
1743 0, /* todo_flags_start */
1744 ( TODO_df_finish
| TODO_verify_rtl_sharing
1745 | TODO_verify_flow
), /* todo_flags_finish */
1748 class pass_lower_subreg2
: public rtl_opt_pass
1751 pass_lower_subreg2 (gcc::context
*ctxt
)
1752 : rtl_opt_pass (pass_data_lower_subreg2
, ctxt
)
1755 /* opt_pass methods: */
1756 bool gate () { return gate_handle_lower_subreg (); }
1757 unsigned int execute () { return rest_of_handle_lower_subreg2 (); }
1759 }; // class pass_lower_subreg2
1764 make_pass_lower_subreg2 (gcc::context
*ctxt
)
1766 return new pass_lower_subreg2 (ctxt
);