1 /* Combine stack adjustments.
2 Copyright (C) 1987-2020 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 /* Track stack adjustments and stack memory references. Attempt to
21 reduce the number of stack adjustments by back-propagating across
22 the memory references.
24 This is intended primarily for use with targets that do not define
25 ACCUMULATE_OUTGOING_ARGS. It is of significantly more value to
26 targets that define PREFERRED_STACK_BOUNDARY more aligned than
27 STACK_BOUNDARY (e.g. x86), or if not all registers can be pushed
28 (e.g. x86 fp regs) which would ordinarily have to be implemented
29 as a sub/mov pair due to restrictions in calls.c.
31 Propagation stops when any of the insns that need adjusting are
32 (a) no longer valid because we've exceeded their range, (b) a
33 non-trivial push instruction, or (c) a call instruction.
35 Restriction B is based on the assumption that push instructions
36 are smaller or faster. If a port really wants to remove all
37 pushes, it should have defined ACCUMULATE_OUTGOING_ARGS. The
38 one exception that is made is for an add immediately followed by a push. */
43 #include "coretypes.h"
47 #include "insn-config.h"
52 #include "tree-pass.h"
56 /* This structure records two kinds of stack references between stack
57 adjusting instructions: stack references in memory addresses for
58 regular insns and all stack references for debug insns. */
62 HOST_WIDE_INT sp_offset
;
65 struct csa_reflist
*next
;
68 static int stack_memref_p (rtx
);
69 static rtx
single_set_for_csa (rtx_insn
*);
70 static void free_csa_reflist (struct csa_reflist
*);
71 static struct csa_reflist
*record_one_stack_ref (rtx_insn
*, rtx
*,
72 struct csa_reflist
*);
73 static int try_apply_stack_adjustment (rtx_insn
*, struct csa_reflist
*,
74 HOST_WIDE_INT
, HOST_WIDE_INT
);
75 static void combine_stack_adjustments_for_block (basic_block
);
78 /* Main entry point for stack adjustment combination. */
81 combine_stack_adjustments (void)
85 FOR_EACH_BB_FN (bb
, cfun
)
86 combine_stack_adjustments_for_block (bb
);
89 /* Recognize a MEM of the form (sp) or (plus sp const). */
92 stack_memref_p (rtx x
)
98 if (x
== stack_pointer_rtx
)
100 if (GET_CODE (x
) == PLUS
101 && XEXP (x
, 0) == stack_pointer_rtx
102 && CONST_INT_P (XEXP (x
, 1)))
108 /* Recognize either normal single_set or the hack in i386.md for
109 tying fp and sp adjustments. */
112 single_set_for_csa (rtx_insn
*insn
)
115 rtx tmp
= single_set (insn
);
119 if (!NONJUMP_INSN_P (insn
)
120 || GET_CODE (PATTERN (insn
)) != PARALLEL
)
123 tmp
= PATTERN (insn
);
124 if (GET_CODE (XVECEXP (tmp
, 0, 0)) != SET
)
127 for (i
= 1; i
< XVECLEN (tmp
, 0); ++i
)
129 rtx this_rtx
= XVECEXP (tmp
, 0, i
);
131 /* The special case is allowing a no-op set. */
132 if (GET_CODE (this_rtx
) == SET
133 && SET_SRC (this_rtx
) == SET_DEST (this_rtx
))
135 else if (GET_CODE (this_rtx
) != CLOBBER
136 && GET_CODE (this_rtx
) != USE
)
140 return XVECEXP (tmp
, 0, 0);
143 /* Free the list of csa_reflist nodes. */
146 free_csa_reflist (struct csa_reflist
*reflist
)
148 struct csa_reflist
*next
;
149 for (; reflist
; reflist
= next
)
151 next
= reflist
->next
;
156 /* Create a new csa_reflist node from the given stack reference.
157 It is already known that the reference is either a MEM satisfying the
158 predicate stack_memref_p or a REG representing the stack pointer. */
160 static struct csa_reflist
*
161 record_one_stack_ref (rtx_insn
*insn
, rtx
*ref
, struct csa_reflist
*next_reflist
)
163 struct csa_reflist
*ml
;
165 ml
= XNEW (struct csa_reflist
);
167 if (REG_P (*ref
) || XEXP (*ref
, 0) == stack_pointer_rtx
)
170 ml
->sp_offset
= INTVAL (XEXP (XEXP (*ref
, 0), 1));
174 ml
->next
= next_reflist
;
179 /* We only know how to adjust the CFA; no other frame-related changes
180 may appear in any insn to be deleted. */
183 no_unhandled_cfa (rtx_insn
*insn
)
185 if (!RTX_FRAME_RELATED_P (insn
))
188 /* No CFA notes at all is a legacy interpretation like
189 FRAME_RELATED_EXPR, and is context sensitive within
190 the prologue state machine. We can't handle that here. */
191 bool has_cfa_adjust
= false;
193 for (rtx link
= REG_NOTES (insn
); link
; link
= XEXP (link
, 1))
194 switch (REG_NOTE_KIND (link
))
198 case REG_CFA_ADJUST_CFA
:
199 has_cfa_adjust
= true;
202 case REG_FRAME_RELATED_EXPR
:
203 case REG_CFA_DEF_CFA
:
205 case REG_CFA_REGISTER
:
206 case REG_CFA_EXPRESSION
:
207 case REG_CFA_RESTORE
:
208 case REG_CFA_SET_VDRAP
:
209 case REG_CFA_WINDOW_SAVE
:
210 case REG_CFA_FLUSH_QUEUE
:
211 case REG_CFA_TOGGLE_RA_MANGLE
:
215 return has_cfa_adjust
;
218 /* Attempt to apply ADJUST to the stack adjusting insn INSN, as well
219 as each of the memories and stack references in REFLIST. Return true on success. */
223 try_apply_stack_adjustment (rtx_insn
*insn
, struct csa_reflist
*reflist
,
224 HOST_WIDE_INT new_adjust
, HOST_WIDE_INT delta
)
226 struct csa_reflist
*ml
;
229 set
= single_set_for_csa (insn
);
230 if (MEM_P (SET_DEST (set
)))
231 validate_change (insn
, &SET_DEST (set
),
232 replace_equiv_address (SET_DEST (set
), stack_pointer_rtx
),
235 validate_change (insn
, &XEXP (SET_SRC (set
), 1), GEN_INT (new_adjust
), 1);
237 for (ml
= reflist
; ml
; ml
= ml
->next
)
239 rtx new_addr
= plus_constant (Pmode
, stack_pointer_rtx
,
240 ml
->sp_offset
- delta
);
243 if (MEM_P (*ml
->ref
))
244 new_val
= replace_equiv_address_nv (*ml
->ref
, new_addr
);
245 else if (GET_MODE (*ml
->ref
) == GET_MODE (stack_pointer_rtx
))
248 new_val
= lowpart_subreg (GET_MODE (*ml
->ref
), new_addr
,
249 GET_MODE (new_addr
));
250 validate_change (ml
->insn
, ml
->ref
, new_val
, 1);
253 if (apply_change_group ())
255 /* Succeeded. Update our knowledge of the stack references. */
256 for (ml
= reflist
; ml
; ml
= ml
->next
)
257 ml
->sp_offset
-= delta
;
265 /* For non-debug insns, record all stack memory references in INSN
266 and return true if there were no other (unrecorded) references to the
267 stack pointer. For debug insns, record all stack references regardless
268 of context and unconditionally return true. */
271 record_stack_refs (rtx_insn
*insn
, struct csa_reflist
**reflist
)
273 subrtx_ptr_iterator::array_type array
;
274 FOR_EACH_SUBRTX_PTR (iter
, array
, &PATTERN (insn
), NONCONST
)
278 switch (GET_CODE (x
))
281 if (!reg_mentioned_p (stack_pointer_rtx
, x
))
282 iter
.skip_subrtxes ();
283 /* We are not able to handle correctly all possible memrefs
284 containing stack pointer, so this check is necessary. */
285 else if (stack_memref_p (x
))
287 *reflist
= record_one_stack_ref (insn
, loc
, *reflist
);
288 iter
.skip_subrtxes ();
290 /* Try harder for DEBUG_INSNs, handle e.g.
291 (mem (mem (sp + 16) + 4)). */
292 else if (!DEBUG_INSN_P (insn
))
297 /* ??? We want to be able to handle non-memory stack pointer
298 references later. For now just discard all insns referring to
299 stack pointer outside mem expressions. We would probably
300 want to teach validate_replace to simplify expressions first.
302 We can't just compare with STACK_POINTER_RTX because the
303 reference to the stack pointer might be in some other mode.
304 In particular, an explicit clobber in an asm statement will
305 result in a QImode clobber.
307 In DEBUG_INSNs, we want to replace all occurrences, otherwise
308 they will cause -fcompare-debug failures. */
309 if (REGNO (x
) == STACK_POINTER_REGNUM
)
311 if (!DEBUG_INSN_P (insn
))
313 *reflist
= record_one_stack_ref (insn
, loc
, *reflist
);
324 /* If INSN has a REG_ARGS_SIZE note, move it to LAST.
325 AFTER is true iff LAST follows INSN in the instruction stream. */
328 maybe_move_args_size_note (rtx_insn
*last
, rtx_insn
*insn
, bool after
)
332 note
= find_reg_note (insn
, REG_ARGS_SIZE
, NULL_RTX
);
336 last_note
= find_reg_note (last
, REG_ARGS_SIZE
, NULL_RTX
);
339 /* The ARGS_SIZE notes are *not* cumulative. They represent an
340 absolute value, and the "most recent" note wins. */
342 XEXP (last_note
, 0) = XEXP (note
, 0);
345 add_reg_note (last
, REG_ARGS_SIZE
, XEXP (note
, 0));
348 /* Merge any REG_CFA_ADJUST_CFA note from SRC into DST.
349 AFTER is true iff DST follows SRC in the instruction stream. */
352 maybe_merge_cfa_adjust (rtx_insn
*dst
, rtx_insn
*src
, bool after
)
354 rtx snote
= NULL
, dnote
= NULL
;
358 if (RTX_FRAME_RELATED_P (src
))
359 snote
= find_reg_note (src
, REG_CFA_ADJUST_CFA
, NULL_RTX
);
362 sexp
= XEXP (snote
, 0);
364 if (RTX_FRAME_RELATED_P (dst
))
365 dnote
= find_reg_note (dst
, REG_CFA_ADJUST_CFA
, NULL_RTX
);
368 add_reg_note (dst
, REG_CFA_ADJUST_CFA
, sexp
);
371 dexp
= XEXP (dnote
, 0);
373 gcc_assert (GET_CODE (sexp
) == SET
);
374 gcc_assert (GET_CODE (dexp
) == SET
);
377 exp1
= dexp
, exp2
= sexp
;
379 exp1
= sexp
, exp2
= dexp
;
381 SET_SRC (exp1
) = simplify_replace_rtx (SET_SRC (exp1
), SET_DEST (exp2
),
383 XEXP (dnote
, 0) = exp1
;
386 /* Return the next (or previous) active insn within BB. */
389 prev_active_insn_bb (basic_block bb
, rtx_insn
*insn
)
391 for (insn
= PREV_INSN (insn
);
392 insn
!= PREV_INSN (BB_HEAD (bb
));
393 insn
= PREV_INSN (insn
))
394 if (active_insn_p (insn
))
400 next_active_insn_bb (basic_block bb
, rtx_insn
*insn
)
402 for (insn
= NEXT_INSN (insn
);
403 insn
!= NEXT_INSN (BB_END (bb
));
404 insn
= NEXT_INSN (insn
))
405 if (active_insn_p (insn
))
410 /* If INSN has a REG_ARGS_SIZE note, if possible move it to PREV. Otherwise
411 search for a nearby candidate within BB where we can stick the note. */
414 force_move_args_size_note (basic_block bb
, rtx_insn
*prev
, rtx_insn
*insn
)
417 rtx_insn
*test
, *next_candidate
, *prev_candidate
;
419 /* If PREV exists, tail-call to the logic in the other function. */
422 maybe_move_args_size_note (prev
, insn
, false);
426 /* First, make sure there's anything that needs doing. */
427 note
= find_reg_note (insn
, REG_ARGS_SIZE
, NULL_RTX
);
431 /* We need to find a spot between the previous and next exception points
432 where we can place the note and "properly" deallocate the arguments. */
433 next_candidate
= prev_candidate
= NULL
;
435 /* It is often the case that we have insns in the order:
437 add sp (previous deallocation)
438 sub sp (align for next arglist)
440 and the add/sub cancel. Therefore we begin by searching forward. */
443 while ((test
= next_active_insn_bb (bb
, test
)) != NULL
)
445 /* Found an existing note: nothing to do. */
446 if (find_reg_note (test
, REG_ARGS_SIZE
, NULL_RTX
))
448 /* Found something that affects unwinding. Stop searching. */
449 if (CALL_P (test
) || !insn_nothrow_p (test
))
451 if (next_candidate
== NULL
)
452 next_candidate
= test
;
456 while ((test
= prev_active_insn_bb (bb
, test
)) != NULL
)
459 /* Found a place that seems logical to adjust the stack. */
460 tnote
= find_reg_note (test
, REG_ARGS_SIZE
, NULL_RTX
);
463 XEXP (tnote
, 0) = XEXP (note
, 0);
466 if (prev_candidate
== NULL
)
467 prev_candidate
= test
;
468 /* Found something that affects unwinding. Stop searching. */
469 if (CALL_P (test
) || !insn_nothrow_p (test
))
474 test
= prev_candidate
;
475 else if (next_candidate
)
476 test
= next_candidate
;
479 /* ??? We *must* have a place, lest we ICE on the lost adjustment.
480 Options are: dummy clobber insn, nop, or prevent the removal of the sp += 0 insn. */
482 /* TODO: Find another way to indicate to the dwarf2 code that we
483 have not in fact lost an adjustment. */
484 test
= emit_insn_before (gen_rtx_CLOBBER (VOIDmode
, const0_rtx
), insn
);
486 add_reg_note (test
, REG_ARGS_SIZE
, XEXP (note
, 0));
489 /* Subroutine of combine_stack_adjustments, called for each basic block. */
492 combine_stack_adjustments_for_block (basic_block bb
)
494 HOST_WIDE_INT last_sp_adjust
= 0;
495 rtx_insn
*last_sp_set
= NULL
;
496 rtx_insn
*last2_sp_set
= NULL
;
497 struct csa_reflist
*reflist
= NULL
;
498 rtx_insn
*insn
, *next
;
500 bool end_of_block
= false;
502 for (insn
= BB_HEAD (bb
); !end_of_block
; insn
= next
)
504 end_of_block
= insn
== BB_END (bb
);
505 next
= NEXT_INSN (insn
);
510 set
= single_set_for_csa (insn
);
511 if (set
&& find_reg_note (insn
, REG_STACK_CHECK
, NULL_RTX
))
515 rtx dest
= SET_DEST (set
);
516 rtx src
= SET_SRC (set
);
518 /* Find constant additions to the stack pointer. */
519 if (dest
== stack_pointer_rtx
520 && GET_CODE (src
) == PLUS
521 && XEXP (src
, 0) == stack_pointer_rtx
522 && CONST_INT_P (XEXP (src
, 1)))
524 HOST_WIDE_INT this_adjust
= INTVAL (XEXP (src
, 1));
526 /* If we've not seen an adjustment previously, record
527 it now and continue. */
531 last_sp_adjust
= this_adjust
;
535 /* If not all recorded refs can be adjusted, or the
536 adjustment is now too large for a constant addition,
537 we cannot merge the two stack adjustments.
539 Also we need to be careful to not move stack pointer
540 such that we create stack accesses outside the allocated
541 area. We can combine an allocation into the first insn,
542 or a deallocation into the second insn. We cannot
543 combine an allocation followed by a deallocation.
545 The only somewhat frequent occurrence of the latter is when
546 a function allocates a stack frame but does not use it.
547 For this case, we would need to analyze rtl stream to be
548 sure that allocated area is really unused. This means not
549 only checking the memory references, but also all registers
550 or global memory references possibly containing a stack frame address.
553 Perhaps the best way to address this problem is to teach
554 gcc not to allocate stack for objects never used. */
556 /* Combine an allocation into the first instruction. */
557 if (STACK_GROWS_DOWNWARD
? this_adjust
<= 0 : this_adjust
>= 0)
559 if (no_unhandled_cfa (insn
)
560 && try_apply_stack_adjustment (last_sp_set
, reflist
,
566 maybe_move_args_size_note (last_sp_set
, insn
, false);
567 maybe_merge_cfa_adjust (last_sp_set
, insn
, false);
569 last_sp_adjust
+= this_adjust
;
574 /* Otherwise we have a deallocation. Do not combine with
575 a previous allocation. Combine into the second insn. */
576 else if (STACK_GROWS_DOWNWARD
577 ? last_sp_adjust
>= 0 : last_sp_adjust
<= 0)
579 if (no_unhandled_cfa (last_sp_set
)
580 && try_apply_stack_adjustment (insn
, reflist
,
586 maybe_move_args_size_note (insn
, last_sp_set
, true);
587 maybe_merge_cfa_adjust (insn
, last_sp_set
, true);
588 delete_insn (last_sp_set
);
590 last_sp_adjust
+= this_adjust
;
591 free_csa_reflist (reflist
);
597 /* Combination failed. Restart processing from here. If
598 deallocation+allocation conspired to cancel, we can
599 delete the old deallocation insn. */
602 if (last_sp_adjust
== 0 && no_unhandled_cfa (last_sp_set
))
604 maybe_move_args_size_note (insn
, last_sp_set
, true);
605 maybe_merge_cfa_adjust (insn
, last_sp_set
, true);
606 delete_insn (last_sp_set
);
609 last2_sp_set
= last_sp_set
;
611 free_csa_reflist (reflist
);
614 last_sp_adjust
= this_adjust
;
618 /* Find a store with pre-(dec|inc)rement or pre-modify of exactly
619 the previous adjustment and turn it into a simple store. This
620 is equivalent to anticipating the stack adjustment so this must be an allocation. */
623 && ((STACK_GROWS_DOWNWARD
624 ? (GET_CODE (XEXP (dest
, 0)) == PRE_DEC
625 && known_eq (last_sp_adjust
,
626 GET_MODE_SIZE (GET_MODE (dest
))))
627 : (GET_CODE (XEXP (dest
, 0)) == PRE_INC
628 && known_eq (-last_sp_adjust
,
629 GET_MODE_SIZE (GET_MODE (dest
)))))
630 || ((STACK_GROWS_DOWNWARD
631 ? last_sp_adjust
>= 0 : last_sp_adjust
<= 0)
632 && GET_CODE (XEXP (dest
, 0)) == PRE_MODIFY
633 && GET_CODE (XEXP (XEXP (dest
, 0), 1)) == PLUS
634 && XEXP (XEXP (XEXP (dest
, 0), 1), 0)
636 && GET_CODE (XEXP (XEXP (XEXP (dest
, 0), 1), 1))
638 && INTVAL (XEXP (XEXP (XEXP (dest
, 0), 1), 1))
640 && XEXP (XEXP (dest
, 0), 0) == stack_pointer_rtx
641 && !reg_mentioned_p (stack_pointer_rtx
, src
)
642 && memory_address_p (GET_MODE (dest
), stack_pointer_rtx
)
643 && try_apply_stack_adjustment (insn
, reflist
, 0,
647 maybe_move_args_size_note (last2_sp_set
, last_sp_set
, false);
649 maybe_move_args_size_note (insn
, last_sp_set
, true);
650 delete_insn (last_sp_set
);
651 free_csa_reflist (reflist
);
659 if (!CALL_P (insn
) && last_sp_set
660 && record_stack_refs (insn
, &reflist
))
663 /* Otherwise, we were not able to process the instruction.
664 Do not continue collecting data across such a one. */
667 || reg_mentioned_p (stack_pointer_rtx
, PATTERN (insn
))))
669 if (last_sp_set
&& last_sp_adjust
== 0)
671 force_move_args_size_note (bb
, last2_sp_set
, last_sp_set
);
672 delete_insn (last_sp_set
);
674 free_csa_reflist (reflist
);
682 if (last_sp_set
&& last_sp_adjust
== 0)
684 force_move_args_size_note (bb
, last2_sp_set
, last_sp_set
);
685 delete_insn (last_sp_set
);
689 free_csa_reflist (reflist
);
693 rest_of_handle_stack_adjustments (void)
695 df_note_add_problem ();
697 combine_stack_adjustments ();
703 const pass_data pass_data_stack_adjustments
=
707 OPTGROUP_NONE
, /* optinfo_flags */
708 TV_COMBINE_STACK_ADJUST
, /* tv_id */
709 0, /* properties_required */
710 0, /* properties_provided */
711 0, /* properties_destroyed */
712 0, /* todo_flags_start */
713 TODO_df_finish
, /* todo_flags_finish */
716 class pass_stack_adjustments
: public rtl_opt_pass
719 pass_stack_adjustments (gcc::context
*ctxt
)
720 : rtl_opt_pass (pass_data_stack_adjustments
, ctxt
)
723 /* opt_pass methods: */
724 virtual bool gate (function
*);
725 virtual unsigned int execute (function
*)
727 return rest_of_handle_stack_adjustments ();
730 }; // class pass_stack_adjustments
733 pass_stack_adjustments::gate (function
*)
735 /* This is kind of a heuristic. We need to run combine_stack_adjustments
736 even for machines with possibly nonzero TARGET_RETURN_POPS_ARGS
737 and ACCUMULATE_OUTGOING_ARGS. We expect that only ports having
738 push instructions will have popping returns. */
739 #ifndef PUSH_ROUNDING
740 if (ACCUMULATE_OUTGOING_ARGS
)
743 return flag_combine_stack_adjustments
;
749 make_pass_stack_adjustments (gcc::context
*ctxt
)
751 return new pass_stack_adjustments (ctxt
);