/* Expands front end tree to back end RTL for GCC.
   Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997,
   1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009,
   2010, 2011 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
/* This file handles the generation of rtl code from tree structure
   at the level of the function as a whole.
   It creates the rtl expressions for parameters and auto variables
   and has full responsibility for allocating stack slots.

   `expand_function_start' is called at the beginning of a function,
   before the function body is parsed, and `expand_function_end' is
   called after parsing the body.

   Call `assign_stack_local' to allocate a stack slot for a local variable.
   This is usually done during the RTL generation for the function body,
   but it can also be done in the reload pass when a pseudo-register does
   not get a hard register.  */
#include "coretypes.h"
#include "rtl-error.h"
#include "hard-reg-set.h"
#include "insn-config.h"
#include "basic-block.h"
#include "integrate.h"
#include "langhooks.h"
#include "cfglayout.h"
#include "tree-pass.h"
/* So we can assign to cfun in this file.  */
#undef cfun

#ifndef STACK_ALIGNMENT_NEEDED
#define STACK_ALIGNMENT_NEEDED 1
#endif

#define STACK_BYTES (STACK_BOUNDARY / BITS_PER_UNIT)
/* Some systems use __main in a way incompatible with its use in gcc, in these
   cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
   give the same symbol without quotes for an alternative entry point.  You
   must define both, or neither.  */
#ifndef NAME__MAIN
#define NAME__MAIN "__main"
#define SYMBOL__MAIN __main
#endif
/* Round a value down to the largest multiple of the required alignment
   that does not exceed it.  Avoid using division in case the value is
   negative.  Assume the alignment is a power of two.  */
#define FLOOR_ROUND(VALUE,ALIGN) ((VALUE) & ~((ALIGN) - 1))

/* Similar, but round up to the next integer that meets the
   alignment.  */
#define CEIL_ROUND(VALUE,ALIGN) (((VALUE) + (ALIGN) - 1) & ~((ALIGN)- 1))
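
/* Illustration (not part of the original source): with a power-of-two
   alignment these macros round without division, toward minus and plus
   infinity respectively, e.g.

     FLOOR_ROUND (13, 8)  ==   8     CEIL_ROUND (13, 8)  ==  16
     FLOOR_ROUND (-13, 8) == -16     CEIL_ROUND (-13, 8) ==  -8
     FLOOR_ROUND (16, 8)  ==  16     CEIL_ROUND (16, 8)  ==  16  */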
/* Nonzero if function being compiled doesn't contain any calls
   (ignoring the prologue and epilogue).  This is set prior to
   local register allocation and is valid for the remaining
   compiler passes.  */
int current_function_is_leaf;
/* Nonzero if function being compiled doesn't modify the stack pointer
   (ignoring the prologue and epilogue).  This is only valid after
   pass_stack_ptr_mod has run.  */
int current_function_sp_is_unchanging;

/* Nonzero if the function being compiled is a leaf function which only
   uses leaf registers.  This is valid after reload (specifically after
   sched2) and is useful only if the port defines LEAF_REGISTERS.  */
int current_function_uses_only_leaf_regs;

/* Nonzero once virtual register instantiation has been done.
   assign_stack_local uses frame_pointer_rtx when this is nonzero.
   calls.c:emit_library_call_value_1 uses it to set up
   post-instantiation libcalls.  */
int virtuals_instantiated;

/* Assign unique numbers to labels generated for profiling, debugging, etc.  */
static GTY(()) int funcdef_no;

/* These variables hold pointers to functions to create and destroy
   target specific, per-function data structures.  */
struct machine_function * (*init_machine_status) (void);

/* The currently compiled function.  */
struct function *cfun = 0;

/* These hashes record the prologue and epilogue insns.  */
static GTY((if_marked ("ggc_marked_p"), param_is (struct rtx_def)))
  htab_t prologue_insn_hash;
static GTY((if_marked ("ggc_marked_p"), param_is (struct rtx_def)))
  htab_t epilogue_insn_hash;

htab_t types_used_by_vars_hash = NULL;
VEC(tree,gc) *types_used_by_cur_var_decl;
/* Forward declarations.  */

static struct temp_slot *find_temp_slot_from_address (rtx);
static void pad_to_arg_alignment (struct args_size *, int, struct args_size *);
static void pad_below (struct args_size *, enum machine_mode, tree);
static void reorder_blocks_1 (rtx, tree, VEC(tree,heap) **);
static int all_blocks (tree, tree *);
static tree *get_block_vector (tree, int *);
extern tree debug_find_var_in_block_tree (tree, tree);
/* We always define `record_insns' even if it's not used so that we
   can always export `prologue_epilogue_contains'.  */
static void record_insns (rtx, rtx, htab_t *) ATTRIBUTE_UNUSED;
static bool contains (const_rtx, htab_t);
static void emit_return_into_block (basic_block);
static void prepare_function_start (void);
static void do_clobber_return_reg (rtx, void *);
static void do_use_return_reg (rtx, void *);
static void set_insn_locators (rtx, int) ATTRIBUTE_UNUSED;
/* Stack of nested functions.  */
/* Keep track of the cfun stack.  */

typedef struct function *function_p;

DEF_VEC_P(function_p);
DEF_VEC_ALLOC_P(function_p,heap);
static VEC(function_p,heap) *function_context_stack;
/* Save the current context for compilation of a nested function.
   This is called from language-specific code.  */

void
push_function_context (void)
{
  if (cfun == 0)
    allocate_struct_function (NULL, false);

  VEC_safe_push (function_p, heap, function_context_stack, cfun);
  set_cfun (NULL);
}

/* Restore the last saved context, at the end of a nested function.
   This function is called from language-specific code.  */

void
pop_function_context (void)
{
  struct function *p = VEC_pop (function_p, function_context_stack);
  set_cfun (p);
  current_function_decl = p->decl;

  /* Reset variables that have known state during rtx generation.  */
  virtuals_instantiated = 0;
  generating_concat_p = 1;
}
/* Clear out all parts of the state in F that can safely be discarded
   after the function has been parsed, but not compiled, to let
   garbage collection reclaim the memory.  */

void
free_after_parsing (struct function *f)
{
  f->language = 0;
}

/* Clear out all parts of the state in F that can safely be discarded
   after the function has been compiled, to let garbage collection
   reclaim the memory.  */

void
free_after_compilation (struct function *f)
{
  prologue_insn_hash = NULL;
  epilogue_insn_hash = NULL;

  free (crtl->emit.regno_pointer_align);

  memset (crtl, 0, sizeof (struct rtl_data));

  regno_reg_rtx = NULL;
  insn_locators_free ();
}
/* Return size needed for stack frame based on slots so far allocated.
   This size counts from zero.  It is not rounded to PREFERRED_STACK_BOUNDARY;
   the caller may have to do that.  */

HOST_WIDE_INT
get_frame_size (void)
{
  if (FRAME_GROWS_DOWNWARD)
    return -frame_offset;
  else
    return frame_offset;
}

/* Issue an error message and return TRUE if frame OFFSET overflows in
   the signed target pointer arithmetics for function FUNC.  Otherwise
   return FALSE.  */

bool
frame_offset_overflow (HOST_WIDE_INT offset, tree func)
{
  unsigned HOST_WIDE_INT size = FRAME_GROWS_DOWNWARD ? -offset : offset;

  if (size > ((unsigned HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (Pmode) - 1))
	     /* Leave room for the fixed part of the frame.  */
	     - 64 * UNITS_PER_WORD)
    {
      error_at (DECL_SOURCE_LOCATION (func),
		"total size of local objects too large");
      return TRUE;
    }

  return FALSE;
}
/* Return stack slot alignment in bits for TYPE and MODE.  */

static unsigned int
get_stack_local_alignment (tree type, enum machine_mode mode)
{
  unsigned int alignment;

  if (mode == BLKmode)
    alignment = BIGGEST_ALIGNMENT;
  else
    alignment = GET_MODE_ALIGNMENT (mode);

  /* Allow the front-end to (possibly) increase the alignment of this
     type.  */
  if (! type)
    type = lang_hooks.types.type_for_mode (mode, 0);

  return STACK_SLOT_ALIGNMENT (type, mode, alignment);
}
/* Determine whether it is possible to fit a stack slot of size SIZE and
   alignment ALIGNMENT into an area in the stack frame that starts at
   frame offset START and has a length of LENGTH.  If so, store the frame
   offset to be used for the stack slot in *POFFSET and return true;
   return false otherwise.  This function will extend the frame size when
   given a start/length pair that lies at the end of the frame.  */

static bool
try_fit_stack_local (HOST_WIDE_INT start, HOST_WIDE_INT length,
		     HOST_WIDE_INT size, unsigned int alignment,
		     HOST_WIDE_INT *poffset)
{
  HOST_WIDE_INT this_frame_offset;
  int frame_off, frame_alignment, frame_phase;

  /* Calculate how many bytes the start of local variables is off from
     stack alignment.  */
  frame_alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
  frame_off = STARTING_FRAME_OFFSET % frame_alignment;
  frame_phase = frame_off ? frame_alignment - frame_off : 0;

  /* Round the frame offset to the specified alignment.  */

  /* We must be careful here, since FRAME_OFFSET might be negative and
     division with a negative dividend isn't as well defined as we might
     like.  So we instead assume that ALIGNMENT is a power of two and
     use logical operations which are unambiguous.  */
  if (FRAME_GROWS_DOWNWARD)
    this_frame_offset
      = (FLOOR_ROUND (start + length - size - frame_phase,
		      (unsigned HOST_WIDE_INT) alignment)
	 + frame_phase);
  else
    this_frame_offset
      = (CEIL_ROUND (start - frame_phase,
		     (unsigned HOST_WIDE_INT) alignment)
	 + frame_phase);

  /* See if it fits.  If this space is at the edge of the frame,
     consider extending the frame to make it fit.  Our caller relies on
     this when allocating a new slot.  */
  if (frame_offset == start && this_frame_offset < frame_offset)
    frame_offset = this_frame_offset;
  else if (this_frame_offset < start)
    return false;
  else if (start + length == frame_offset
	   && this_frame_offset + size > start + length)
    frame_offset = this_frame_offset + size;
  else if (this_frame_offset + size > start + length)
    return false;

  *poffset = this_frame_offset;
  return true;
}
/* Create a new frame_space structure describing free space in the stack
   frame beginning at START and ending at END, and chain it into the
   function's frame_space_list.  */

static void
add_frame_space (HOST_WIDE_INT start, HOST_WIDE_INT end)
{
  struct frame_space *space = ggc_alloc_frame_space ();
  space->next = crtl->frame_space_list;
  crtl->frame_space_list = space;
  space->start = start;
  space->length = end - start;
}
/* Allocate a stack slot of SIZE bytes and return a MEM rtx for it
   with machine mode MODE.

   ALIGN controls the amount of alignment for the address of the slot:
   0 means according to MODE,
   -1 means use BIGGEST_ALIGNMENT and round size to multiple of that,
   -2 means use BITS_PER_UNIT,
   positive specifies alignment boundary in bits.

   KIND has ASLK_REDUCE_ALIGN bit set if it is OK to reduce
   alignment and ASLK_RECORD_PAD bit set if we should remember
   extra space we allocated for alignment purposes.  When we are
   called from assign_stack_temp_for_type, it is not set so we don't
   track the same stack slot in two independent lists.

   We do not round to stack_boundary here.  */
366 assign_stack_local_1 (enum machine_mode mode
, HOST_WIDE_INT size
,
370 int bigend_correction
= 0;
371 HOST_WIDE_INT slot_offset
= 0, old_frame_offset
;
372 unsigned int alignment
, alignment_in_bits
;
376 alignment
= get_stack_local_alignment (NULL
, mode
);
377 alignment
/= BITS_PER_UNIT
;
379 else if (align
== -1)
381 alignment
= BIGGEST_ALIGNMENT
/ BITS_PER_UNIT
;
382 size
= CEIL_ROUND (size
, alignment
);
384 else if (align
== -2)
385 alignment
= 1; /* BITS_PER_UNIT / BITS_PER_UNIT */
387 alignment
= align
/ BITS_PER_UNIT
;
389 alignment_in_bits
= alignment
* BITS_PER_UNIT
;
391 /* Ignore alignment if it exceeds MAX_SUPPORTED_STACK_ALIGNMENT. */
392 if (alignment_in_bits
> MAX_SUPPORTED_STACK_ALIGNMENT
)
394 alignment_in_bits
= MAX_SUPPORTED_STACK_ALIGNMENT
;
395 alignment
= alignment_in_bits
/ BITS_PER_UNIT
;
398 if (SUPPORTS_STACK_ALIGNMENT
)
400 if (crtl
->stack_alignment_estimated
< alignment_in_bits
)
402 if (!crtl
->stack_realign_processed
)
403 crtl
->stack_alignment_estimated
= alignment_in_bits
;
406 /* If stack is realigned and stack alignment value
407 hasn't been finalized, it is OK not to increase
408 stack_alignment_estimated. The bigger alignment
409 requirement is recorded in stack_alignment_needed
411 gcc_assert (!crtl
->stack_realign_finalized
);
412 if (!crtl
->stack_realign_needed
)
414 /* It is OK to reduce the alignment as long as the
415 requested size is 0 or the estimated stack
416 alignment >= mode alignment. */
417 gcc_assert ((kind
& ASLK_REDUCE_ALIGN
)
419 || (crtl
->stack_alignment_estimated
420 >= GET_MODE_ALIGNMENT (mode
)));
421 alignment_in_bits
= crtl
->stack_alignment_estimated
;
422 alignment
= alignment_in_bits
/ BITS_PER_UNIT
;
428 if (crtl
->stack_alignment_needed
< alignment_in_bits
)
429 crtl
->stack_alignment_needed
= alignment_in_bits
;
430 if (crtl
->max_used_stack_slot_alignment
< alignment_in_bits
)
431 crtl
->max_used_stack_slot_alignment
= alignment_in_bits
;
433 if (mode
!= BLKmode
|| size
!= 0)
435 if (kind
& ASLK_RECORD_PAD
)
437 struct frame_space
**psp
;
439 for (psp
= &crtl
->frame_space_list
; *psp
; psp
= &(*psp
)->next
)
441 struct frame_space
*space
= *psp
;
442 if (!try_fit_stack_local (space
->start
, space
->length
, size
,
443 alignment
, &slot_offset
))
446 if (slot_offset
> space
->start
)
447 add_frame_space (space
->start
, slot_offset
);
448 if (slot_offset
+ size
< space
->start
+ space
->length
)
449 add_frame_space (slot_offset
+ size
,
450 space
->start
+ space
->length
);
455 else if (!STACK_ALIGNMENT_NEEDED
)
457 slot_offset
= frame_offset
;
461 old_frame_offset
= frame_offset
;
463 if (FRAME_GROWS_DOWNWARD
)
465 frame_offset
-= size
;
466 try_fit_stack_local (frame_offset
, size
, size
, alignment
, &slot_offset
);
468 if (kind
& ASLK_RECORD_PAD
)
470 if (slot_offset
> frame_offset
)
471 add_frame_space (frame_offset
, slot_offset
);
472 if (slot_offset
+ size
< old_frame_offset
)
473 add_frame_space (slot_offset
+ size
, old_frame_offset
);
478 frame_offset
+= size
;
479 try_fit_stack_local (old_frame_offset
, size
, size
, alignment
, &slot_offset
);
481 if (kind
& ASLK_RECORD_PAD
)
483 if (slot_offset
> old_frame_offset
)
484 add_frame_space (old_frame_offset
, slot_offset
);
485 if (slot_offset
+ size
< frame_offset
)
486 add_frame_space (slot_offset
+ size
, frame_offset
);
491 /* On a big-endian machine, if we are allocating more space than we will use,
492 use the least significant bytes of those that are allocated. */
493 if (BYTES_BIG_ENDIAN
&& mode
!= BLKmode
&& GET_MODE_SIZE (mode
) < size
)
494 bigend_correction
= size
- GET_MODE_SIZE (mode
);
496 /* If we have already instantiated virtual registers, return the actual
497 address relative to the frame pointer. */
498 if (virtuals_instantiated
)
499 addr
= plus_constant (frame_pointer_rtx
,
501 (slot_offset
+ bigend_correction
502 + STARTING_FRAME_OFFSET
, Pmode
));
504 addr
= plus_constant (virtual_stack_vars_rtx
,
506 (slot_offset
+ bigend_correction
,
509 x
= gen_rtx_MEM (mode
, addr
);
510 set_mem_align (x
, alignment_in_bits
);
511 MEM_NOTRAP_P (x
) = 1;
514 = gen_rtx_EXPR_LIST (VOIDmode
, x
, stack_slot_list
);
516 if (frame_offset_overflow (frame_offset
, current_function_decl
))
/* Wrap up assign_stack_local_1 with the default ASLK_RECORD_PAD kind.  */

rtx
assign_stack_local (enum machine_mode mode, HOST_WIDE_INT size, int align)
{
  return assign_stack_local_1 (mode, size, align, ASLK_RECORD_PAD);
}
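
/* Illustration (not part of the original source): typical uses of the
   ALIGN argument described above, e.g.

     rtx slot1 = assign_stack_local (SImode, GET_MODE_SIZE (SImode), 0);
     rtx slot2 = assign_stack_local (BLKmode, size, -1);

   where SLOT1 is aligned according to SImode and SLOT2 gets
   BIGGEST_ALIGNMENT, with its size rounded up to a multiple of it.  */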
/* In order to evaluate some expressions, such as function calls returning
   structures in memory, we need to temporarily allocate stack locations.
   We record each allocated temporary in the following structure.

   Associated with each temporary slot is a nesting level.  When we pop up
   one level, all temporaries associated with the previous level are freed.
   Normally, all temporaries are freed after the execution of the statement
   in which they were created.  However, if we are inside a ({...}) grouping,
   the result may be in a temporary and hence must be preserved.  If the
   result could be in a temporary, we preserve it if we can determine which
   one it is in.  If we cannot determine which temporary may contain the
   result, all temporaries are preserved.  A temporary is preserved by
   pretending it was allocated at the previous nesting level.

   Automatic variables are also assigned temporary slots, at the nesting
   level where they are defined.  They are marked as "kept" so that
   free_temp_slots will not free them.  */
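
/* Illustration (not part of the original source): the usual pattern for
   the nesting machinery described above is

     push_temp_slots ();
     slot = assign_stack_temp (mode, size, 0);
     ... expand code that may use SLOT ...
     preserve_temp_slots (result);
     free_temp_slots ();
     pop_temp_slots ();

   where preserve_temp_slots keeps alive any temporary the result might
   occupy by moving it to the enclosing nesting level.  */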
struct GTY(()) temp_slot {
  /* Points to next temporary slot.  */
  struct temp_slot *next;
  /* Points to previous temporary slot.  */
  struct temp_slot *prev;
  /* The rtx used to reference the slot.  */
  rtx slot;
  /* The size, in units, of the slot.  */
  HOST_WIDE_INT size;
  /* The type of the object in the slot, or zero if it doesn't correspond
     to a type.  We use this to determine whether a slot can be reused.
     It can be reused if objects of the type of the new slot will always
     conflict with objects of the type of the old slot.  */
  tree type;
  /* The alignment (in bits) of the slot.  */
  unsigned int align;
  /* Nonzero if this temporary is currently in use.  */
  char in_use;
  /* Nonzero if this temporary has its address taken.  */
  char addr_taken;
  /* Nesting level at which this slot is being used.  */
  int level;
  /* Nonzero if this should survive a call to free_temp_slots.  */
  char keep;
  /* The offset of the slot from the frame_pointer, including extra space
     for alignment.  This info is for combine_temp_slots.  */
  HOST_WIDE_INT base_offset;
  /* The size of the slot, including extra space for alignment.  This
     info is for combine_temp_slots.  */
  HOST_WIDE_INT full_size;
};

/* A table of addresses that represent a stack slot.  The table is a mapping
   from address RTXen to a temp slot.  */
static GTY((param_is(struct temp_slot_address_entry))) htab_t temp_slot_address_table;

/* Entry for the above hash table.  */
struct GTY(()) temp_slot_address_entry {
  hashval_t hash;
  rtx address;
  struct temp_slot *temp_slot;
};
592 /* Removes temporary slot TEMP from LIST. */
595 cut_slot_from_list (struct temp_slot
*temp
, struct temp_slot
**list
)
598 temp
->next
->prev
= temp
->prev
;
600 temp
->prev
->next
= temp
->next
;
604 temp
->prev
= temp
->next
= NULL
;
607 /* Inserts temporary slot TEMP to LIST. */
610 insert_slot_to_list (struct temp_slot
*temp
, struct temp_slot
**list
)
614 (*list
)->prev
= temp
;
619 /* Returns the list of used temp slots at LEVEL. */
621 static struct temp_slot
**
622 temp_slots_at_level (int level
)
624 if (level
>= (int) VEC_length (temp_slot_p
, used_temp_slots
))
625 VEC_safe_grow_cleared (temp_slot_p
, gc
, used_temp_slots
, level
+ 1);
627 return &(VEC_address (temp_slot_p
, used_temp_slots
)[level
]);
630 /* Returns the maximal temporary slot level. */
633 max_slot_level (void)
635 if (!used_temp_slots
)
638 return VEC_length (temp_slot_p
, used_temp_slots
) - 1;
641 /* Moves temporary slot TEMP to LEVEL. */
644 move_slot_to_level (struct temp_slot
*temp
, int level
)
646 cut_slot_from_list (temp
, temp_slots_at_level (temp
->level
));
647 insert_slot_to_list (temp
, temp_slots_at_level (level
));
651 /* Make temporary slot TEMP available. */
654 make_slot_available (struct temp_slot
*temp
)
656 cut_slot_from_list (temp
, temp_slots_at_level (temp
->level
));
657 insert_slot_to_list (temp
, &avail_temp_slots
);
662 /* Compute the hash value for an address -> temp slot mapping.
663 The value is cached on the mapping entry. */
665 temp_slot_address_compute_hash (struct temp_slot_address_entry
*t
)
667 int do_not_record
= 0;
668 return hash_rtx (t
->address
, GET_MODE (t
->address
),
669 &do_not_record
, NULL
, false);
672 /* Return the hash value for an address -> temp slot mapping. */
674 temp_slot_address_hash (const void *p
)
676 const struct temp_slot_address_entry
*t
;
677 t
= (const struct temp_slot_address_entry
*) p
;
681 /* Compare two address -> temp slot mapping entries. */
683 temp_slot_address_eq (const void *p1
, const void *p2
)
685 const struct temp_slot_address_entry
*t1
, *t2
;
686 t1
= (const struct temp_slot_address_entry
*) p1
;
687 t2
= (const struct temp_slot_address_entry
*) p2
;
688 return exp_equiv_p (t1
->address
, t2
->address
, 0, true);
/* Add ADDRESS as an alias of TEMP_SLOT to the address -> temp slot mapping.  */
693 insert_temp_slot_address (rtx address
, struct temp_slot
*temp_slot
)
696 struct temp_slot_address_entry
*t
= ggc_alloc_temp_slot_address_entry ();
697 t
->address
= address
;
698 t
->temp_slot
= temp_slot
;
699 t
->hash
= temp_slot_address_compute_hash (t
);
700 slot
= htab_find_slot_with_hash (temp_slot_address_table
, t
, t
->hash
, INSERT
);
704 /* Remove an address -> temp slot mapping entry if the temp slot is
705 not in use anymore. Callback for remove_unused_temp_slot_addresses. */
707 remove_unused_temp_slot_addresses_1 (void **slot
, void *data ATTRIBUTE_UNUSED
)
709 const struct temp_slot_address_entry
*t
;
710 t
= (const struct temp_slot_address_entry
*) *slot
;
711 if (! t
->temp_slot
->in_use
)
716 /* Remove all mappings of addresses to unused temp slots. */
718 remove_unused_temp_slot_addresses (void)
720 htab_traverse (temp_slot_address_table
,
721 remove_unused_temp_slot_addresses_1
,
725 /* Find the temp slot corresponding to the object at address X. */
727 static struct temp_slot
*
728 find_temp_slot_from_address (rtx x
)
731 struct temp_slot_address_entry tmp
, *t
;
733 /* First try the easy way:
734 See if X exists in the address -> temp slot mapping. */
736 tmp
.temp_slot
= NULL
;
737 tmp
.hash
= temp_slot_address_compute_hash (&tmp
);
738 t
= (struct temp_slot_address_entry
*)
739 htab_find_with_hash (temp_slot_address_table
, &tmp
, tmp
.hash
);
743 /* If we have a sum involving a register, see if it points to a temp
745 if (GET_CODE (x
) == PLUS
&& REG_P (XEXP (x
, 0))
746 && (p
= find_temp_slot_from_address (XEXP (x
, 0))) != 0)
748 else if (GET_CODE (x
) == PLUS
&& REG_P (XEXP (x
, 1))
749 && (p
= find_temp_slot_from_address (XEXP (x
, 1))) != 0)
752 /* Last resort: Address is a virtual stack var address. */
753 if (GET_CODE (x
) == PLUS
754 && XEXP (x
, 0) == virtual_stack_vars_rtx
755 && CONST_INT_P (XEXP (x
, 1)))
758 for (i
= max_slot_level (); i
>= 0; i
--)
759 for (p
= *temp_slots_at_level (i
); p
; p
= p
->next
)
761 if (INTVAL (XEXP (x
, 1)) >= p
->base_offset
762 && INTVAL (XEXP (x
, 1)) < p
->base_offset
+ p
->full_size
)
/* Allocate a temporary stack slot and record it for possible later
   reuse.

   MODE is the machine mode to be given to the returned rtx.

   SIZE is the size in units of the space required.  We do no rounding here
   since assign_stack_local will do any required rounding.

   KEEP is 1 if this slot is to be retained after a call to
   free_temp_slots.  Automatic variables for a block are allocated
   with this flag.  KEEP values of 2 or 3 were needed respectively
   for variables whose lifetime is controlled by CLEANUP_POINT_EXPRs
   or for SAVE_EXPRs, but they are now unused.

   TYPE is the type that will be used for the stack slot.  */
787 assign_stack_temp_for_type (enum machine_mode mode
, HOST_WIDE_INT size
,
791 struct temp_slot
*p
, *best_p
= 0, *selected
= NULL
, **pp
;
794 /* If SIZE is -1 it means that somebody tried to allocate a temporary
795 of a variable size. */
796 gcc_assert (size
!= -1);
798 /* These are now unused. */
799 gcc_assert (keep
<= 1);
801 align
= get_stack_local_alignment (type
, mode
);
803 /* Try to find an available, already-allocated temporary of the proper
804 mode which meets the size and alignment requirements. Choose the
805 smallest one with the closest alignment.
807 If assign_stack_temp is called outside of the tree->rtl expansion,
808 we cannot reuse the stack slots (that may still refer to
809 VIRTUAL_STACK_VARS_REGNUM). */
810 if (!virtuals_instantiated
)
812 for (p
= avail_temp_slots
; p
; p
= p
->next
)
814 if (p
->align
>= align
&& p
->size
>= size
815 && GET_MODE (p
->slot
) == mode
816 && objects_must_conflict_p (p
->type
, type
)
817 && (best_p
== 0 || best_p
->size
> p
->size
818 || (best_p
->size
== p
->size
&& best_p
->align
> p
->align
)))
820 if (p
->align
== align
&& p
->size
== size
)
823 cut_slot_from_list (selected
, &avail_temp_slots
);
832 /* Make our best, if any, the one to use. */
836 cut_slot_from_list (selected
, &avail_temp_slots
);
838 /* If there are enough aligned bytes left over, make them into a new
839 temp_slot so that the extra bytes don't get wasted. Do this only
840 for BLKmode slots, so that we can be sure of the alignment. */
841 if (GET_MODE (best_p
->slot
) == BLKmode
)
843 int alignment
= best_p
->align
/ BITS_PER_UNIT
;
844 HOST_WIDE_INT rounded_size
= CEIL_ROUND (size
, alignment
);
846 if (best_p
->size
- rounded_size
>= alignment
)
848 p
= ggc_alloc_temp_slot ();
849 p
->in_use
= p
->addr_taken
= 0;
850 p
->size
= best_p
->size
- rounded_size
;
851 p
->base_offset
= best_p
->base_offset
+ rounded_size
;
852 p
->full_size
= best_p
->full_size
- rounded_size
;
853 p
->slot
= adjust_address_nv (best_p
->slot
, BLKmode
, rounded_size
);
854 p
->align
= best_p
->align
;
855 p
->type
= best_p
->type
;
856 insert_slot_to_list (p
, &avail_temp_slots
);
858 stack_slot_list
= gen_rtx_EXPR_LIST (VOIDmode
, p
->slot
,
861 best_p
->size
= rounded_size
;
862 best_p
->full_size
= rounded_size
;
867 /* If we still didn't find one, make a new temporary. */
870 HOST_WIDE_INT frame_offset_old
= frame_offset
;
872 p
= ggc_alloc_temp_slot ();
874 /* We are passing an explicit alignment request to assign_stack_local.
875 One side effect of that is assign_stack_local will not round SIZE
876 to ensure the frame offset remains suitably aligned.
878 So for requests which depended on the rounding of SIZE, we go ahead
879 and round it now. We also make sure ALIGNMENT is at least
880 BIGGEST_ALIGNMENT. */
881 gcc_assert (mode
!= BLKmode
|| align
== BIGGEST_ALIGNMENT
);
882 p
->slot
= assign_stack_local_1 (mode
,
892 /* The following slot size computation is necessary because we don't
893 know the actual size of the temporary slot until assign_stack_local
894 has performed all the frame alignment and size rounding for the
895 requested temporary. Note that extra space added for alignment
896 can be either above or below this stack slot depending on which
897 way the frame grows. We include the extra space if and only if it
898 is above this slot. */
899 if (FRAME_GROWS_DOWNWARD
)
900 p
->size
= frame_offset_old
- frame_offset
;
904 /* Now define the fields used by combine_temp_slots. */
905 if (FRAME_GROWS_DOWNWARD
)
907 p
->base_offset
= frame_offset
;
908 p
->full_size
= frame_offset_old
- frame_offset
;
912 p
->base_offset
= frame_offset_old
;
913 p
->full_size
= frame_offset
- frame_offset_old
;
923 p
->level
= temp_slot_level
;
926 pp
= temp_slots_at_level (p
->level
);
927 insert_slot_to_list (p
, pp
);
928 insert_temp_slot_address (XEXP (p
->slot
, 0), p
);
930 /* Create a new MEM rtx to avoid clobbering MEM flags of old slots. */
931 slot
= gen_rtx_MEM (mode
, XEXP (p
->slot
, 0));
932 stack_slot_list
= gen_rtx_EXPR_LIST (VOIDmode
, slot
, stack_slot_list
);
934 /* If we know the alias set for the memory that will be used, use
935 it. If there's no TYPE, then we don't know anything about the
936 alias set for the memory. */
937 set_mem_alias_set (slot
, type
? get_alias_set (type
) : 0);
938 set_mem_align (slot
, align
);
940 /* If a type is specified, set the relevant flags. */
943 MEM_VOLATILE_P (slot
) = TYPE_VOLATILE (type
);
944 gcc_checking_assert (!MEM_SCALAR_P (slot
) && !MEM_IN_STRUCT_P (slot
));
945 if (AGGREGATE_TYPE_P (type
) || TREE_CODE (type
) == COMPLEX_TYPE
)
946 MEM_IN_STRUCT_P (slot
) = 1;
948 MEM_SCALAR_P (slot
) = 1;
950 MEM_NOTRAP_P (slot
) = 1;
955 /* Allocate a temporary stack slot and record it for possible later
956 reuse. First three arguments are same as in preceding function. */
959 assign_stack_temp (enum machine_mode mode
, HOST_WIDE_INT size
, int keep
)
961 return assign_stack_temp_for_type (mode
, size
, keep
, NULL_TREE
);
964 /* Assign a temporary.
965 If TYPE_OR_DECL is a decl, then we are doing it on behalf of the decl
966 and so that should be used in error messages. In either case, we
967 allocate of the given type.
968 KEEP is as for assign_stack_temp.
969 MEMORY_REQUIRED is 1 if the result must be addressable stack memory;
970 it is 0 if a register is OK.
971 DONT_PROMOTE is 1 if we should not promote values in register
975 assign_temp (tree type_or_decl
, int keep
, int memory_required
,
976 int dont_promote ATTRIBUTE_UNUSED
)
979 enum machine_mode mode
;
984 if (DECL_P (type_or_decl
))
985 decl
= type_or_decl
, type
= TREE_TYPE (decl
);
987 decl
= NULL
, type
= type_or_decl
;
989 mode
= TYPE_MODE (type
);
991 unsignedp
= TYPE_UNSIGNED (type
);
994 if (mode
== BLKmode
|| memory_required
)
996 HOST_WIDE_INT size
= int_size_in_bytes (type
);
      /* Zero sized arrays are a GNU C extension.  Set size to 1 to avoid
	 problems with allocating the stack space.  */
1004 /* Unfortunately, we don't yet know how to allocate variable-sized
1005 temporaries. However, sometimes we can find a fixed upper limit on
1006 the size, so try that instead. */
1007 else if (size
== -1)
1008 size
= max_int_size_in_bytes (type
);
1010 /* The size of the temporary may be too large to fit into an integer. */
1011 /* ??? Not sure this should happen except for user silliness, so limit
1012 this to things that aren't compiler-generated temporaries. The
1013 rest of the time we'll die in assign_stack_temp_for_type. */
1014 if (decl
&& size
== -1
1015 && TREE_CODE (TYPE_SIZE_UNIT (type
)) == INTEGER_CST
)
1017 error ("size of variable %q+D is too large", decl
);
1021 tmp
= assign_stack_temp_for_type (mode
, size
, keep
, type
);
1027 mode
= promote_mode (type
, mode
, &unsignedp
);
1030 return gen_reg_rtx (mode
);
1033 /* Combine temporary stack slots which are adjacent on the stack.
1035 This allows for better use of already allocated stack space. This is only
1036 done for BLKmode slots because we can be sure that we won't have alignment
1037 problems in this case. */
1040 combine_temp_slots (void)
1042 struct temp_slot
*p
, *q
, *next
, *next_q
;
1045 /* We can't combine slots, because the information about which slot
1046 is in which alias set will be lost. */
1047 if (flag_strict_aliasing
)
1050 /* If there are a lot of temp slots, don't do anything unless
1051 high levels of optimization. */
1052 if (! flag_expensive_optimizations
)
1053 for (p
= avail_temp_slots
, num_slots
= 0; p
; p
= p
->next
, num_slots
++)
1054 if (num_slots
> 100 || (num_slots
> 10 && optimize
== 0))
1057 for (p
= avail_temp_slots
; p
; p
= next
)
1063 if (GET_MODE (p
->slot
) != BLKmode
)
1066 for (q
= p
->next
; q
; q
= next_q
)
1072 if (GET_MODE (q
->slot
) != BLKmode
)
1075 if (p
->base_offset
+ p
->full_size
== q
->base_offset
)
1077 /* Q comes after P; combine Q into P. */
1079 p
->full_size
+= q
->full_size
;
1082 else if (q
->base_offset
+ q
->full_size
== p
->base_offset
)
1084 /* P comes after Q; combine P into Q. */
1086 q
->full_size
+= p
->full_size
;
1091 cut_slot_from_list (q
, &avail_temp_slots
);
1094 /* Either delete P or advance past it. */
1096 cut_slot_from_list (p
, &avail_temp_slots
);
1100 /* Indicate that NEW_RTX is an alternate way of referring to the temp
1101 slot that previously was known by OLD_RTX. */
1104 update_temp_slot_address (rtx old_rtx
, rtx new_rtx
)
1106 struct temp_slot
*p
;
1108 if (rtx_equal_p (old_rtx
, new_rtx
))
1111 p
= find_temp_slot_from_address (old_rtx
);
  /* If we didn't find one, see if OLD_RTX is a PLUS.  If so, and
     NEW_RTX is a register, see if one operand of the PLUS is a
     temporary location.  If so, NEW_RTX points into it.  Otherwise,
     if both OLD_RTX and NEW_RTX are a PLUS and there is a register
     in common between them, try a recursive call on those values.  */
  if (GET_CODE (old_rtx) != PLUS)
1124 if (REG_P (new_rtx
))
1126 update_temp_slot_address (XEXP (old_rtx
, 0), new_rtx
);
1127 update_temp_slot_address (XEXP (old_rtx
, 1), new_rtx
);
1130 else if (GET_CODE (new_rtx
) != PLUS
)
1133 if (rtx_equal_p (XEXP (old_rtx
, 0), XEXP (new_rtx
, 0)))
1134 update_temp_slot_address (XEXP (old_rtx
, 1), XEXP (new_rtx
, 1));
1135 else if (rtx_equal_p (XEXP (old_rtx
, 1), XEXP (new_rtx
, 0)))
1136 update_temp_slot_address (XEXP (old_rtx
, 0), XEXP (new_rtx
, 1));
1137 else if (rtx_equal_p (XEXP (old_rtx
, 0), XEXP (new_rtx
, 1)))
1138 update_temp_slot_address (XEXP (old_rtx
, 1), XEXP (new_rtx
, 0));
1139 else if (rtx_equal_p (XEXP (old_rtx
, 1), XEXP (new_rtx
, 1)))
1140 update_temp_slot_address (XEXP (old_rtx
, 0), XEXP (new_rtx
, 0));
1145 /* Otherwise add an alias for the temp's address. */
1146 insert_temp_slot_address (new_rtx
, p
);
1149 /* If X could be a reference to a temporary slot, mark the fact that its
1150 address was taken. */
1153 mark_temp_addr_taken (rtx x
)
1155 struct temp_slot
*p
;
1160 /* If X is not in memory or is at a constant address, it cannot be in
1161 a temporary slot. */
1162 if (!MEM_P (x
) || CONSTANT_P (XEXP (x
, 0)))
1165 p
= find_temp_slot_from_address (XEXP (x
, 0));
/* If X could be a reference to a temporary slot, mark that slot as
   belonging to the level one higher than the current level.  If X
   matched one of our slots, just mark that one.  Otherwise, we can't
   easily predict which it is, so upgrade all of them.  Kept slots
   need not be touched.

   This is called when an ({...}) construct occurs and a statement
   returns a value in memory.  */
1180 preserve_temp_slots (rtx x
)
1182 struct temp_slot
*p
= 0, *next
;
1184 /* If there is no result, we still might have some objects whose address
1185 were taken, so we need to make sure they stay around. */
1188 for (p
= *temp_slots_at_level (temp_slot_level
); p
; p
= next
)
1193 move_slot_to_level (p
, temp_slot_level
- 1);
1199 /* If X is a register that is being used as a pointer, see if we have
1200 a temporary slot we know it points to. To be consistent with
1201 the code below, we really should preserve all non-kept slots
1202 if we can't find a match, but that seems to be much too costly. */
1203 if (REG_P (x
) && REG_POINTER (x
))
1204 p
= find_temp_slot_from_address (x
);
1206 /* If X is not in memory or is at a constant address, it cannot be in
1207 a temporary slot, but it can contain something whose address was
1209 if (p
== 0 && (!MEM_P (x
) || CONSTANT_P (XEXP (x
, 0))))
1211 for (p
= *temp_slots_at_level (temp_slot_level
); p
; p
= next
)
1216 move_slot_to_level (p
, temp_slot_level
- 1);
1222 /* First see if we can find a match. */
1224 p
= find_temp_slot_from_address (XEXP (x
, 0));
1228 /* Move everything at our level whose address was taken to our new
1229 level in case we used its address. */
1230 struct temp_slot
*q
;
1232 if (p
->level
== temp_slot_level
)
1234 for (q
= *temp_slots_at_level (temp_slot_level
); q
; q
= next
)
1238 if (p
!= q
&& q
->addr_taken
)
1239 move_slot_to_level (q
, temp_slot_level
- 1);
1242 move_slot_to_level (p
, temp_slot_level
- 1);
1248 /* Otherwise, preserve all non-kept slots at this level. */
1249 for (p
= *temp_slots_at_level (temp_slot_level
); p
; p
= next
)
1254 move_slot_to_level (p
, temp_slot_level
- 1);
1258 /* Free all temporaries used so far. This is normally called at the
1259 end of generating code for a statement. */
1262 free_temp_slots (void)
1264 struct temp_slot
*p
, *next
;
1265 bool some_available
= false;
1267 for (p
= *temp_slots_at_level (temp_slot_level
); p
; p
= next
)
1273 make_slot_available (p
);
1274 some_available
= true;
1280 remove_unused_temp_slot_addresses ();
1281 combine_temp_slots ();
1285 /* Push deeper into the nesting level for stack temporaries. */
1288 push_temp_slots (void)
1293 /* Pop a temporary nesting level. All slots in use in the current level
1297 pop_temp_slots (void)
1299 struct temp_slot
*p
, *next
;
1300 bool some_available
= false;
1302 for (p
= *temp_slots_at_level (temp_slot_level
); p
; p
= next
)
1305 make_slot_available (p
);
1306 some_available
= true;
1311 remove_unused_temp_slot_addresses ();
1312 combine_temp_slots ();
1318 /* Initialize temporary slots. */
1321 init_temp_slots (void)
1323 /* We have not allocated any temporaries yet. */
1324 avail_temp_slots
= 0;
1325 used_temp_slots
= 0;
1326 temp_slot_level
= 0;
1328 /* Set up the table to map addresses to temp slots. */
1329 if (! temp_slot_address_table
)
1330 temp_slot_address_table
= htab_create_ggc (32,
1331 temp_slot_address_hash
,
1332 temp_slot_address_eq
,
1335 htab_empty (temp_slot_address_table
);
/* These routines are responsible for converting virtual register references
   to the actual hard register references once RTL generation is complete.

   The following five variables are used for communication between the
   routines.  They contain the offsets of the virtual registers from their
   respective hard registers.  */

static int in_arg_offset;
static int var_offset;
static int dynamic_offset;
static int out_arg_offset;
static int cfa_offset;
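
/* Illustration (not part of the original source): instantiate_new_reg
   below replaces each virtual register with a hard register plus one of
   these offsets, roughly

     virtual_incoming_args_rtx  -> arg_pointer_rtx   + in_arg_offset
     virtual_stack_vars_rtx     -> frame_pointer_rtx + var_offset
     virtual_stack_dynamic_rtx  -> stack_pointer_rtx + dynamic_offset
     virtual_outgoing_args_rtx  -> stack_pointer_rtx + out_arg_offset
     virtual_cfa_rtx            -> frame or arg pointer + cfa_offset  */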
/* In most machines, the stack pointer register is equivalent to the bottom
   of the stack.  */

#ifndef STACK_POINTER_OFFSET
#define STACK_POINTER_OFFSET 0
#endif

/* If not defined, pick an appropriate default for the offset of dynamically
   allocated memory depending on the value of ACCUMULATE_OUTGOING_ARGS,
   REG_PARM_STACK_SPACE, and OUTGOING_REG_PARM_STACK_SPACE.  */

#ifndef STACK_DYNAMIC_OFFSET

/* The bottom of the stack points to the actual arguments.  If
   REG_PARM_STACK_SPACE is defined, this includes the space for the register
   parameters.  However, if OUTGOING_REG_PARM_STACK_SPACE is not defined,
   stack space for register parameters is not pushed by the caller, but
   rather part of the fixed stack areas and hence not included in
   `crtl->outgoing_args_size'.  Nevertheless, we must allow
   for it when allocating stack dynamic objects.  */

#if defined(REG_PARM_STACK_SPACE)
#define STACK_DYNAMIC_OFFSET(FNDECL) \
  ((ACCUMULATE_OUTGOING_ARGS \
    ? (crtl->outgoing_args_size \
       + (OUTGOING_REG_PARM_STACK_SPACE ((!(FNDECL) ? NULL_TREE : TREE_TYPE (FNDECL))) ? 0 \
	  : REG_PARM_STACK_SPACE (FNDECL))) \
    : 0) + (STACK_POINTER_OFFSET))
#else
#define STACK_DYNAMIC_OFFSET(FNDECL) \
  ((ACCUMULATE_OUTGOING_ARGS ? crtl->outgoing_args_size : 0) \
   + (STACK_POINTER_OFFSET))
#endif
#endif

/* Given a piece of RTX and a pointer to a HOST_WIDE_INT, if the RTX
   is a virtual register, return the equivalent hard register and set the
   offset indirectly through the pointer.  Otherwise, return 0.  */
1392 instantiate_new_reg (rtx x
, HOST_WIDE_INT
*poffset
)
1395 HOST_WIDE_INT offset
;
1397 if (x
== virtual_incoming_args_rtx
)
1399 if (stack_realign_drap
)
1401 /* Replace virtual_incoming_args_rtx with internal arg
1402 pointer if DRAP is used to realign stack. */
1403 new_rtx
= crtl
->args
.internal_arg_pointer
;
1407 new_rtx
= arg_pointer_rtx
, offset
= in_arg_offset
;
1409 else if (x
== virtual_stack_vars_rtx
)
1410 new_rtx
= frame_pointer_rtx
, offset
= var_offset
;
1411 else if (x
== virtual_stack_dynamic_rtx
)
1412 new_rtx
= stack_pointer_rtx
, offset
= dynamic_offset
;
1413 else if (x
== virtual_outgoing_args_rtx
)
1414 new_rtx
= stack_pointer_rtx
, offset
= out_arg_offset
;
1415 else if (x
== virtual_cfa_rtx
)
1417 #ifdef FRAME_POINTER_CFA_OFFSET
1418 new_rtx
= frame_pointer_rtx
;
1420 new_rtx
= arg_pointer_rtx
;
1422 offset
= cfa_offset
;
1424 else if (x
== virtual_preferred_stack_boundary_rtx
)
1426 new_rtx
= GEN_INT (crtl
->preferred_stack_boundary
/ BITS_PER_UNIT
);
1436 /* A subroutine of instantiate_virtual_regs, called via for_each_rtx.
1437 Instantiate any virtual registers present inside of *LOC. The expression
1438 is simplified, as much as possible, but is not to be considered "valid"
1439 in any sense implied by the target. If any change is made, set CHANGED
1443 instantiate_virtual_regs_in_rtx (rtx
*loc
, void *data
)
1445 HOST_WIDE_INT offset
;
1446 bool *changed
= (bool *) data
;
1453 switch (GET_CODE (x
))
1456 new_rtx
= instantiate_new_reg (x
, &offset
);
1459 *loc
= plus_constant (new_rtx
, offset
);
1466 new_rtx
= instantiate_new_reg (XEXP (x
, 0), &offset
);
1469 new_rtx
= plus_constant (new_rtx
, offset
);
1470 *loc
= simplify_gen_binary (PLUS
, GET_MODE (x
), new_rtx
, XEXP (x
, 1));
1476 /* FIXME -- from old code */
1477 /* If we have (plus (subreg (virtual-reg)) (const_int)), we know
1478 we can commute the PLUS and SUBREG because pointers into the
1479 frame are well-behaved. */
1489 /* A subroutine of instantiate_virtual_regs_in_insn. Return true if X
1490 matches the predicate for insn CODE operand OPERAND. */
1493 safe_insn_predicate (int code
, int operand
, rtx x
)
1495 return code
< 0 || insn_operand_matches ((enum insn_code
) code
, operand
, x
);
1498 /* A subroutine of instantiate_virtual_regs. Instantiate any virtual
1499 registers present inside of insn. The result will be a valid insn. */
1502 instantiate_virtual_regs_in_insn (rtx insn
)
1504 HOST_WIDE_INT offset
;
1506 bool any_change
= false;
1507 rtx set
, new_rtx
, x
, seq
;
1509 /* There are some special cases to be handled first. */
1510 set
= single_set (insn
);
1513 /* We're allowed to assign to a virtual register. This is interpreted
1514 to mean that the underlying register gets assigned the inverse
1515 transformation. This is used, for example, in the handling of
1517 new_rtx
= instantiate_new_reg (SET_DEST (set
), &offset
);
1522 for_each_rtx (&SET_SRC (set
), instantiate_virtual_regs_in_rtx
, NULL
);
1523 x
= simplify_gen_binary (PLUS
, GET_MODE (new_rtx
), SET_SRC (set
),
1525 x
= force_operand (x
, new_rtx
);
1527 emit_move_insn (new_rtx
, x
);
1532 emit_insn_before (seq
, insn
);
1537 /* Handle a straight copy from a virtual register by generating a
1538 new add insn. The difference between this and falling through
1539 to the generic case is avoiding a new pseudo and eliminating a
1540 move insn in the initial rtl stream. */
1541 new_rtx
= instantiate_new_reg (SET_SRC (set
), &offset
);
1542 if (new_rtx
&& offset
!= 0
1543 && REG_P (SET_DEST (set
))
1544 && REGNO (SET_DEST (set
)) > LAST_VIRTUAL_REGISTER
)
1548 x
= expand_simple_binop (GET_MODE (SET_DEST (set
)), PLUS
,
1549 new_rtx
, GEN_INT (offset
), SET_DEST (set
),
1550 1, OPTAB_LIB_WIDEN
);
1551 if (x
!= SET_DEST (set
))
1552 emit_move_insn (SET_DEST (set
), x
);
1557 emit_insn_before (seq
, insn
);
1562 extract_insn (insn
);
1563 insn_code
= INSN_CODE (insn
);
1565 /* Handle a plus involving a virtual register by determining if the
1566 operands remain valid if they're modified in place. */
1567 if (GET_CODE (SET_SRC (set
)) == PLUS
1568 && recog_data
.n_operands
>= 3
1569 && recog_data
.operand_loc
[1] == &XEXP (SET_SRC (set
), 0)
1570 && recog_data
.operand_loc
[2] == &XEXP (SET_SRC (set
), 1)
1571 && CONST_INT_P (recog_data
.operand
[2])
1572 && (new_rtx
= instantiate_new_reg (recog_data
.operand
[1], &offset
)))
1574 offset
+= INTVAL (recog_data
.operand
[2]);
1576 /* If the sum is zero, then replace with a plain move. */
1578 && REG_P (SET_DEST (set
))
1579 && REGNO (SET_DEST (set
)) > LAST_VIRTUAL_REGISTER
)
1582 emit_move_insn (SET_DEST (set
), new_rtx
);
1586 emit_insn_before (seq
, insn
);
1591 x
= gen_int_mode (offset
, recog_data
.operand_mode
[2]);
1593 /* Using validate_change and apply_change_group here leaves
1594 recog_data in an invalid state. Since we know exactly what
1595 we want to check, do those two by hand. */
1596 if (safe_insn_predicate (insn_code
, 1, new_rtx
)
1597 && safe_insn_predicate (insn_code
, 2, x
))
1599 *recog_data
.operand_loc
[1] = recog_data
.operand
[1] = new_rtx
;
1600 *recog_data
.operand_loc
[2] = recog_data
.operand
[2] = x
;
1603 /* Fall through into the regular operand fixup loop in
1604 order to take care of operands other than 1 and 2. */
1610 extract_insn (insn
);
1611 insn_code
= INSN_CODE (insn
);
1614 /* In the general case, we expect virtual registers to appear only in
1615 operands, and then only as either bare registers or inside memories. */
1616 for (i
= 0; i
< recog_data
.n_operands
; ++i
)
1618 x
= recog_data
.operand
[i
];
1619 switch (GET_CODE (x
))
1623 rtx addr
= XEXP (x
, 0);
1624 bool changed
= false;
1626 for_each_rtx (&addr
, instantiate_virtual_regs_in_rtx
, &changed
);
1631 x
= replace_equiv_address (x
, addr
);
1632 /* It may happen that the address with the virtual reg
1633 was valid (e.g. based on the virtual stack reg, which might
1634 be acceptable to the predicates with all offsets), whereas
1635 the address now isn't anymore, for instance when the address
1636 is still offsetted, but the base reg isn't virtual-stack-reg
1637 anymore. Below we would do a force_reg on the whole operand,
1638 but this insn might actually only accept memory. Hence,
1639 before doing that last resort, try to reload the address into
1640 a register, so this operand stays a MEM. */
1641 if (!safe_insn_predicate (insn_code
, i
, x
))
1643 addr
= force_reg (GET_MODE (addr
), addr
);
1644 x
= replace_equiv_address (x
, addr
);
1649 emit_insn_before (seq
, insn
);
1654 new_rtx
= instantiate_new_reg (x
, &offset
);
1655 if (new_rtx
== NULL
)
1663 /* Careful, special mode predicates may have stuff in
1664 insn_data[insn_code].operand[i].mode that isn't useful
1665 to us for computing a new value. */
1666 /* ??? Recognize address_operand and/or "p" constraints
1667 to see if (plus new offset) is a valid before we put
1668 this through expand_simple_binop. */
1669 x
= expand_simple_binop (GET_MODE (x
), PLUS
, new_rtx
,
1670 GEN_INT (offset
), NULL_RTX
,
1671 1, OPTAB_LIB_WIDEN
);
1674 emit_insn_before (seq
, insn
);
1679 new_rtx
= instantiate_new_reg (SUBREG_REG (x
), &offset
);
1680 if (new_rtx
== NULL
)
1685 new_rtx
= expand_simple_binop (GET_MODE (new_rtx
), PLUS
, new_rtx
,
1686 GEN_INT (offset
), NULL_RTX
,
1687 1, OPTAB_LIB_WIDEN
);
1690 emit_insn_before (seq
, insn
);
1692 x
= simplify_gen_subreg (recog_data
.operand_mode
[i
], new_rtx
,
1693 GET_MODE (new_rtx
), SUBREG_BYTE (x
));
1701 /* At this point, X contains the new value for the operand.
1702 Validate the new value vs the insn predicate. Note that
1703 asm insns will have insn_code -1 here. */
1704 if (!safe_insn_predicate (insn_code
, i
, x
))
1709 gcc_assert (REGNO (x
) <= LAST_VIRTUAL_REGISTER
);
1710 x
= copy_to_reg (x
);
1713 x
= force_reg (insn_data
[insn_code
].operand
[i
].mode
, x
);
1717 emit_insn_before (seq
, insn
);
1720 *recog_data
.operand_loc
[i
] = recog_data
.operand
[i
] = x
;
1726 /* Propagate operand changes into the duplicates. */
1727 for (i
= 0; i
< recog_data
.n_dups
; ++i
)
1728 *recog_data
.dup_loc
[i
]
1729 = copy_rtx (recog_data
.operand
[(unsigned)recog_data
.dup_num
[i
]]);
1731 /* Force re-recognition of the instruction for validation. */
1732 INSN_CODE (insn
) = -1;
1735 if (asm_noperands (PATTERN (insn
)) >= 0)
1737 if (!check_asm_operands (PATTERN (insn
)))
1739 error_for_asm (insn
, "impossible constraint in %<asm%>");
1745 if (recog_memoized (insn
) < 0)
1746 fatal_insn_not_found (insn
);
1750 /* Subroutine of instantiate_decls. Given RTL representing a decl,
1751 do any instantiation required. */
1754 instantiate_decl_rtl (rtx x
)
1761 /* If this is a CONCAT, recurse for the pieces. */
1762 if (GET_CODE (x
) == CONCAT
)
1764 instantiate_decl_rtl (XEXP (x
, 0));
1765 instantiate_decl_rtl (XEXP (x
, 1));
1769 /* If this is not a MEM, no need to do anything. Similarly if the
1770 address is a constant or a register that is not a virtual register. */
1775 if (CONSTANT_P (addr
)
1777 && (REGNO (addr
) < FIRST_VIRTUAL_REGISTER
1778 || REGNO (addr
) > LAST_VIRTUAL_REGISTER
)))
1781 for_each_rtx (&XEXP (x
, 0), instantiate_virtual_regs_in_rtx
, NULL
);
1784 /* Helper for instantiate_decls called via walk_tree: Process all decls
1785 in the given DECL_VALUE_EXPR. */
1788 instantiate_expr (tree
*tp
, int *walk_subtrees
, void *data ATTRIBUTE_UNUSED
)
1796 if (DECL_RTL_SET_P (t
))
1797 instantiate_decl_rtl (DECL_RTL (t
));
1798 if (TREE_CODE (t
) == PARM_DECL
&& DECL_NAMELESS (t
)
1799 && DECL_INCOMING_RTL (t
))
1800 instantiate_decl_rtl (DECL_INCOMING_RTL (t
));
1801 if ((TREE_CODE (t
) == VAR_DECL
1802 || TREE_CODE (t
) == RESULT_DECL
)
1803 && DECL_HAS_VALUE_EXPR_P (t
))
1805 tree v
= DECL_VALUE_EXPR (t
);
1806 walk_tree (&v
, instantiate_expr
, NULL
, NULL
);
1813 /* Subroutine of instantiate_decls: Process all decls in the given
1814 BLOCK node and all its subblocks. */
1817 instantiate_decls_1 (tree let
)
1821 for (t
= BLOCK_VARS (let
); t
; t
= DECL_CHAIN (t
))
1823 if (DECL_RTL_SET_P (t
))
1824 instantiate_decl_rtl (DECL_RTL (t
));
1825 if (TREE_CODE (t
) == VAR_DECL
&& DECL_HAS_VALUE_EXPR_P (t
))
1827 tree v
= DECL_VALUE_EXPR (t
);
1828 walk_tree (&v
, instantiate_expr
, NULL
, NULL
);
1832 /* Process all subblocks. */
1833 for (t
= BLOCK_SUBBLOCKS (let
); t
; t
= BLOCK_CHAIN (t
))
1834 instantiate_decls_1 (t
);
1837 /* Scan all decls in FNDECL (both variables and parameters) and instantiate
1838 all virtual registers in their DECL_RTL's. */
1841 instantiate_decls (tree fndecl
)
1846 /* Process all parameters of the function. */
1847 for (decl
= DECL_ARGUMENTS (fndecl
); decl
; decl
= DECL_CHAIN (decl
))
1849 instantiate_decl_rtl (DECL_RTL (decl
));
1850 instantiate_decl_rtl (DECL_INCOMING_RTL (decl
));
1851 if (DECL_HAS_VALUE_EXPR_P (decl
))
1853 tree v
= DECL_VALUE_EXPR (decl
);
1854 walk_tree (&v
, instantiate_expr
, NULL
, NULL
);
1858 if ((decl
= DECL_RESULT (fndecl
))
1859 && TREE_CODE (decl
) == RESULT_DECL
)
1861 if (DECL_RTL_SET_P (decl
))
1862 instantiate_decl_rtl (DECL_RTL (decl
));
1863 if (DECL_HAS_VALUE_EXPR_P (decl
))
1865 tree v
= DECL_VALUE_EXPR (decl
);
1866 walk_tree (&v
, instantiate_expr
, NULL
, NULL
);
1870 /* Now process all variables defined in the function or its subblocks. */
1871 instantiate_decls_1 (DECL_INITIAL (fndecl
));
1873 FOR_EACH_LOCAL_DECL (cfun
, ix
, decl
)
1874 if (DECL_RTL_SET_P (decl
))
1875 instantiate_decl_rtl (DECL_RTL (decl
));
1876 VEC_free (tree
, gc
, cfun
->local_decls
);
1879 /* Pass through the INSNS of function FNDECL and convert virtual register
1880 references to hard register references. */
1883 instantiate_virtual_regs (void)
1887 /* Compute the offsets to use for this function. */
1888 in_arg_offset
= FIRST_PARM_OFFSET (current_function_decl
);
1889 var_offset
= STARTING_FRAME_OFFSET
;
1890 dynamic_offset
= STACK_DYNAMIC_OFFSET (current_function_decl
);
1891 out_arg_offset
= STACK_POINTER_OFFSET
;
1892 #ifdef FRAME_POINTER_CFA_OFFSET
1893 cfa_offset
= FRAME_POINTER_CFA_OFFSET (current_function_decl
);
1895 cfa_offset
= ARG_POINTER_CFA_OFFSET (current_function_decl
);
1898 /* Initialize recognition, indicating that volatile is OK. */
1901 /* Scan through all the insns, instantiating every virtual register still
1903 for (insn
= get_insns (); insn
; insn
= NEXT_INSN (insn
))
1906 /* These patterns in the instruction stream can never be recognized.
1907 Fortunately, they shouldn't contain virtual registers either. */
1908 if (GET_CODE (PATTERN (insn
)) == USE
1909 || GET_CODE (PATTERN (insn
)) == CLOBBER
1910 || GET_CODE (PATTERN (insn
)) == ADDR_VEC
1911 || GET_CODE (PATTERN (insn
)) == ADDR_DIFF_VEC
1912 || GET_CODE (PATTERN (insn
)) == ASM_INPUT
)
1914 else if (DEBUG_INSN_P (insn
))
1915 for_each_rtx (&INSN_VAR_LOCATION (insn
),
1916 instantiate_virtual_regs_in_rtx
, NULL
);
1918 instantiate_virtual_regs_in_insn (insn
);
1920 if (INSN_DELETED_P (insn
))
1923 for_each_rtx (®_NOTES (insn
), instantiate_virtual_regs_in_rtx
, NULL
);
1925 /* Instantiate any virtual registers in CALL_INSN_FUNCTION_USAGE. */
1927 for_each_rtx (&CALL_INSN_FUNCTION_USAGE (insn
),
1928 instantiate_virtual_regs_in_rtx
, NULL
);
1931 /* Instantiate the virtual registers in the DECLs for debugging purposes. */
1932 instantiate_decls (current_function_decl
);
1934 targetm
.instantiate_decls ();
1936 /* Indicate that, from now on, assign_stack_local should use
1937 frame_pointer_rtx. */
1938 virtuals_instantiated
= 1;
1940 /* See allocate_dynamic_stack_space for the rationale. */
1941 #ifdef SETJMP_VIA_SAVE_AREA
1942 if (flag_stack_usage
&& cfun
->calls_setjmp
)
1944 int align
= PREFERRED_STACK_BOUNDARY
/ BITS_PER_UNIT
;
1945 dynamic_offset
= (dynamic_offset
+ align
- 1) / align
* align
;
1946 current_function_dynamic_stack_size
1947 += current_function_dynamic_alloc_count
* dynamic_offset
;
1954 struct rtl_opt_pass pass_instantiate_virtual_regs
=
1960 instantiate_virtual_regs
, /* execute */
1963 0, /* static_pass_number */
1964 TV_NONE
, /* tv_id */
1965 0, /* properties_required */
1966 0, /* properties_provided */
1967 0, /* properties_destroyed */
1968 0, /* todo_flags_start */
1969 TODO_dump_func
/* todo_flags_finish */
/* Return 1 if EXP is an aggregate type (or a value with aggregate type).
   This means a type for which function calls must pass an address to the
   function or get an address back from the function.
   EXP may be a type node or an expression (whose type is tested).  */
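
/* Illustration (not part of the original source): on most targets this
   is false for a plain int or pointer, which comes back in a register,
   and true for a structure too large for the available call-clobbered
   return registers, which the caller must receive through memory.  */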
1980 aggregate_value_p (const_tree exp
, const_tree fntype
)
1982 const_tree type
= (TYPE_P (exp
)) ? exp
: TREE_TYPE (exp
);
1983 int i
, regno
, nregs
;
1987 switch (TREE_CODE (fntype
))
1991 tree fndecl
= get_callee_fndecl (fntype
);
1993 ? TREE_TYPE (fndecl
)
1994 : TREE_TYPE (TREE_TYPE (CALL_EXPR_FN (fntype
))));
1998 fntype
= TREE_TYPE (fntype
);
2003 case IDENTIFIER_NODE
:
2007 /* We don't expect other tree types here. */
2011 if (VOID_TYPE_P (type
))
2014 /* If a record should be passed the same as its first (and only) member
2015 don't pass it as an aggregate. */
2016 if (TREE_CODE (type
) == RECORD_TYPE
&& TYPE_TRANSPARENT_AGGR (type
))
2017 return aggregate_value_p (first_field (type
), fntype
);
2019 /* If the front end has decided that this needs to be passed by
2020 reference, do so. */
2021 if ((TREE_CODE (exp
) == PARM_DECL
|| TREE_CODE (exp
) == RESULT_DECL
)
2022 && DECL_BY_REFERENCE (exp
))
2025 /* Function types that are TREE_ADDRESSABLE force return in memory. */
2026 if (fntype
&& TREE_ADDRESSABLE (fntype
))
2029 /* Types that are TREE_ADDRESSABLE must be constructed in memory,
2030 and thus can't be returned in registers. */
2031 if (TREE_ADDRESSABLE (type
))
2034 if (flag_pcc_struct_return
&& AGGREGATE_TYPE_P (type
))
2037 if (targetm
.calls
.return_in_memory (type
, fntype
))
2040 /* Make sure we have suitable call-clobbered regs to return
2041 the value in; if not, we must return it in memory. */
2042 reg
= hard_function_value (type
, 0, fntype
, 0);
2044 /* If we have something other than a REG (e.g. a PARALLEL), then assume
2049 regno
= REGNO (reg
);
2050 nregs
= hard_regno_nregs
[regno
][TYPE_MODE (type
)];
2051 for (i
= 0; i
< nregs
; i
++)
2052 if (! call_used_regs
[regno
+ i
])
2058 /* Return true if we should assign DECL a pseudo register; false if it
2059 should live on the local stack. */
2062 use_register_for_decl (const_tree decl
)
2064 if (!targetm
.calls
.allocate_stack_slots_for_args())
2067 /* Honor volatile. */
2068 if (TREE_SIDE_EFFECTS (decl
))
2071 /* Honor addressability. */
2072 if (TREE_ADDRESSABLE (decl
))
2075 /* Only register-like things go in registers. */
2076 if (DECL_MODE (decl
) == BLKmode
)
2079 /* If -ffloat-store specified, don't put explicit float variables
2081 /* ??? This should be checked after DECL_ARTIFICIAL, but tree-ssa
2082 propagates values across these stores, and it probably shouldn't. */
2083 if (flag_float_store
&& FLOAT_TYPE_P (TREE_TYPE (decl
)))
2086 /* If we're not interested in tracking debugging information for
2087 this decl, then we can certainly put it in a register. */
2088 if (DECL_IGNORED_P (decl
))
2094 if (!DECL_REGISTER (decl
))
2097 switch (TREE_CODE (TREE_TYPE (decl
)))
2101 case QUAL_UNION_TYPE
:
2102 /* When not optimizing, disregard register keyword for variables with
2103 types containing methods, otherwise the methods won't be callable
2104 from the debugger. */
2105 if (TYPE_METHODS (TREE_TYPE (decl
)))
/* Return true if TYPE should be passed by invisible reference.  */

bool
pass_by_reference (CUMULATIVE_ARGS *ca, enum machine_mode mode,
                   tree type, bool named_arg)
{
  if (type)
    {
      /* If this type contains non-trivial constructors, then it is
         forbidden for the middle-end to create any new copies.  */
      if (TREE_ADDRESSABLE (type))
        return true;

      /* GCC post 3.4 passes *all* variable sized types by reference.  */
      if (!TYPE_SIZE (type) || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
        return true;

      /* If a record type should be passed the same as its first (and only)
         member, use the type and mode of that member.  */
      if (TREE_CODE (type) == RECORD_TYPE && TYPE_TRANSPARENT_AGGR (type))
        {
          type = TREE_TYPE (first_field (type));
          mode = TYPE_MODE (type);
        }
    }

  return targetm.calls.pass_by_reference (ca, mode, type, named_arg);
}
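/* Worked example (hypothetical types, for illustration only): a C++ class
   with a non-trivial copy constructor is marked TREE_ADDRESSABLE by the
   front end and is therefore always passed by invisible reference.
   Likewise a variable-length array parameter has no INTEGER_CST TYPE_SIZE,
   so it too is passed by reference regardless of what the target hook
   would prefer.  */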
/* Return true if TYPE, which is passed by reference, should be callee
   copied instead of caller copied.  */

bool
reference_callee_copied (CUMULATIVE_ARGS *ca, enum machine_mode mode,
                         tree type, bool named_arg)
{
  if (type && TREE_ADDRESSABLE (type))
    return false;

  return targetm.calls.callee_copies (ca, mode, type, named_arg);
}
/* Structures to communicate between the subroutines of assign_parms.
   The first holds data persistent across all parameters, the second
   is cleared out for each parameter.  */

struct assign_parm_data_all
{
  CUMULATIVE_ARGS args_so_far;
  struct args_size stack_args_size;
  tree function_result_decl;
  tree orig_fnargs;
  rtx first_conversion_insn;
  rtx last_conversion_insn;
  HOST_WIDE_INT pretend_args_size;
  HOST_WIDE_INT extra_pretend_bytes;
  int reg_parm_stack_space;
};

struct assign_parm_data_one
{
  tree nominal_type;
  tree passed_type;
  rtx entry_parm;
  rtx stack_parm;
  enum machine_mode nominal_mode;
  enum machine_mode passed_mode;
  enum machine_mode promoted_mode;
  struct locate_and_pad_arg_data locate;
  int partial;
  BOOL_BITFIELD named_arg : 1;
  BOOL_BITFIELD passed_pointer : 1;
  BOOL_BITFIELD on_stack : 1;
  BOOL_BITFIELD loaded_in_reg : 1;
};
/* A subroutine of assign_parms.  Initialize ALL.  */

static void
assign_parms_initialize_all (struct assign_parm_data_all *all)
{
  tree fntype ATTRIBUTE_UNUSED;

  memset (all, 0, sizeof (*all));

  fntype = TREE_TYPE (current_function_decl);

#ifdef INIT_CUMULATIVE_INCOMING_ARGS
  INIT_CUMULATIVE_INCOMING_ARGS (all->args_so_far, fntype, NULL_RTX);
#else
  INIT_CUMULATIVE_ARGS (all->args_so_far, fntype, NULL_RTX,
                        current_function_decl, -1);
#endif

#ifdef REG_PARM_STACK_SPACE
  all->reg_parm_stack_space = REG_PARM_STACK_SPACE (current_function_decl);
#endif
}
/* If ARGS contains entries with complex types, split the entry into two
   entries of the component type.  Return a new list if substitutions are
   needed, else the old list.  */

static void
split_complex_args (VEC(tree, heap) **args)
{
  unsigned i;
  tree p;

  FOR_EACH_VEC_ELT (tree, *args, i, p)
    {
      tree type = TREE_TYPE (p);
      if (TREE_CODE (type) == COMPLEX_TYPE
          && targetm.calls.split_complex_arg (type))
        {
          tree decl;
          tree subtype = TREE_TYPE (type);
          bool addressable = TREE_ADDRESSABLE (p);

          /* Rewrite the PARM_DECL's type with its component.  */
          p = copy_node (p);
          TREE_TYPE (p) = subtype;
          DECL_ARG_TYPE (p) = TREE_TYPE (DECL_ARG_TYPE (p));
          DECL_MODE (p) = VOIDmode;
          DECL_SIZE (p) = NULL;
          DECL_SIZE_UNIT (p) = NULL;
          /* If this arg must go in memory, put it in a pseudo here.
             We can't allow it to go in memory as per normal parms,
             because the usual place might not have the imag part
             adjacent to the real part.  */
          DECL_ARTIFICIAL (p) = addressable;
          DECL_IGNORED_P (p) = addressable;
          TREE_ADDRESSABLE (p) = 0;
          layout_decl (p, 0);
          VEC_replace (tree, *args, i, p);

          /* Build a second synthetic decl.  */
          decl = build_decl (EXPR_LOCATION (p),
                             PARM_DECL, NULL_TREE, subtype);
          DECL_ARG_TYPE (decl) = DECL_ARG_TYPE (p);
          DECL_ARTIFICIAL (decl) = addressable;
          DECL_IGNORED_P (decl) = addressable;
          layout_decl (decl, 0);
          VEC_safe_insert (tree, heap, *args, ++i, decl);
        }
    }
}
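/* Illustrative sketch (assuming the target's split_complex_arg hook accepts
   the type): a PARM_DECL of type _Complex double is rewritten in place to a
   double holding the real part, and a second artificial PARM_DECL of type
   double is inserted right after it for the imaginary part, so the rest of
   assign_parms sees two scalar arguments.  */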
/* A subroutine of assign_parms.  Adjust the parameter list to incorporate
   the hidden struct return argument, and (abi willing) complex args.
   Return the new parameter list.  */

static VEC(tree, heap) *
assign_parms_augmented_arg_list (struct assign_parm_data_all *all)
{
  tree fndecl = current_function_decl;
  tree fntype = TREE_TYPE (fndecl);
  VEC(tree, heap) *fnargs = NULL;
  tree arg;

  for (arg = DECL_ARGUMENTS (fndecl); arg; arg = DECL_CHAIN (arg))
    VEC_safe_push (tree, heap, fnargs, arg);

  all->orig_fnargs = DECL_ARGUMENTS (fndecl);

  /* If struct value address is treated as the first argument, make it so.  */
  if (aggregate_value_p (DECL_RESULT (fndecl), fndecl)
      && ! cfun->returns_pcc_struct
      && targetm.calls.struct_value_rtx (TREE_TYPE (fndecl), 1) == 0)
    {
      tree type = build_pointer_type (TREE_TYPE (fntype));
      tree decl;

      decl = build_decl (DECL_SOURCE_LOCATION (fndecl),
                         PARM_DECL, get_identifier (".result_ptr"), type);
      DECL_ARG_TYPE (decl) = type;
      DECL_ARTIFICIAL (decl) = 1;
      DECL_NAMELESS (decl) = 1;
      TREE_CONSTANT (decl) = 1;

      DECL_CHAIN (decl) = all->orig_fnargs;
      all->orig_fnargs = decl;
      VEC_safe_insert (tree, heap, fnargs, 0, decl);

      all->function_result_decl = decl;
    }

  /* If the target wants to split complex arguments into scalars, do so.  */
  if (targetm.calls.split_complex_arg)
    split_complex_args (&fnargs);

  return fnargs;
}
/* A subroutine of assign_parms.  Examine PARM and pull out type and mode
   data for the parameter.  Incorporate ABI specifics such as pass-by-
   reference and type promotion.  */

static void
assign_parm_find_data_types (struct assign_parm_data_all *all, tree parm,
                             struct assign_parm_data_one *data)
{
  tree nominal_type, passed_type;
  enum machine_mode nominal_mode, passed_mode, promoted_mode;
  int unsignedp;

  memset (data, 0, sizeof (*data));

  /* NAMED_ARG is a misnomer.  We really mean 'non-variadic'. */
  if (!cfun->stdarg)
    data->named_arg = 1;  /* No variadic parms.  */
  else if (DECL_CHAIN (parm))
    data->named_arg = 1;  /* Not the last non-variadic parm.  */
  else if (targetm.calls.strict_argument_naming (&all->args_so_far))
    data->named_arg = 1;  /* Only variadic ones are unnamed.  */
  else
    data->named_arg = 0;  /* Treat as variadic.  */

  nominal_type = TREE_TYPE (parm);
  passed_type = DECL_ARG_TYPE (parm);

  /* Look out for errors propagating this far.  Also, if the parameter's
     type is void then its value doesn't matter.  */
  if (TREE_TYPE (parm) == error_mark_node
      /* This can happen after weird syntax errors
         or if an enum type is defined among the parms.  */
      || TREE_CODE (parm) != PARM_DECL
      || passed_type == NULL
      || VOID_TYPE_P (nominal_type))
    {
      nominal_type = passed_type = void_type_node;
      nominal_mode = passed_mode = promoted_mode = VOIDmode;
      goto egress;
    }

  /* Find mode of arg as it is passed, and mode of arg as it should be
     during execution of this function.  */
  passed_mode = TYPE_MODE (passed_type);
  nominal_mode = TYPE_MODE (nominal_type);

  /* If the parm is to be passed as a transparent union or record, use the
     type of the first field for the tests below.  We have already verified
     that the modes are the same.  */
  if ((TREE_CODE (passed_type) == UNION_TYPE
       || TREE_CODE (passed_type) == RECORD_TYPE)
      && TYPE_TRANSPARENT_AGGR (passed_type))
    passed_type = TREE_TYPE (first_field (passed_type));

  /* See if this arg was passed by invisible reference.  */
  if (pass_by_reference (&all->args_so_far, passed_mode,
                         passed_type, data->named_arg))
    {
      passed_type = nominal_type = build_pointer_type (passed_type);
      data->passed_pointer = true;
      passed_mode = nominal_mode = Pmode;
    }

  /* Find mode as it is passed by the ABI.  */
  unsignedp = TYPE_UNSIGNED (passed_type);
  promoted_mode = promote_function_mode (passed_type, passed_mode, &unsignedp,
                                         TREE_TYPE (current_function_decl), 0);

 egress:
  data->nominal_type = nominal_type;
  data->passed_type = passed_type;
  data->nominal_mode = nominal_mode;
  data->passed_mode = passed_mode;
  data->promoted_mode = promoted_mode;
}
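/* Illustrative example (typical promotion rules; the exact behaviour is up
   to the target's promote_function_mode hook): a 'short' parameter has
   nominal_mode HImode, but on many ports it is passed promoted, so
   promoted_mode becomes SImode and unsignedp records whether the caller
   performed a zero or sign extension.  */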
/* A subroutine of assign_parms.  Invoke setup_incoming_varargs.  */

static void
assign_parms_setup_varargs (struct assign_parm_data_all *all,
                            struct assign_parm_data_one *data, bool no_rtl)
{
  int varargs_pretend_bytes = 0;

  targetm.calls.setup_incoming_varargs (&all->args_so_far,
                                        data->promoted_mode,
                                        data->passed_type,
                                        &varargs_pretend_bytes, no_rtl);

  /* If the back-end has requested extra stack space, record how much is
     needed.  Do not change pretend_args_size otherwise since it may be
     nonzero from an earlier partial argument.  */
  if (varargs_pretend_bytes > 0)
    all->pretend_args_size = varargs_pretend_bytes;
}
/* A subroutine of assign_parms.  Set DATA->ENTRY_PARM corresponding to
   the incoming location of the current parameter.  */

static void
assign_parm_find_entry_rtl (struct assign_parm_data_all *all,
                            struct assign_parm_data_one *data)
{
  HOST_WIDE_INT pretend_bytes = 0;
  rtx entry_parm;
  bool in_regs;

  if (data->promoted_mode == VOIDmode)
    {
      data->entry_parm = data->stack_parm = const0_rtx;
      return;
    }

  entry_parm = targetm.calls.function_incoming_arg (&all->args_so_far,
                                                    data->promoted_mode,
                                                    data->passed_type,
                                                    data->named_arg);

  if (entry_parm == 0)
    data->promoted_mode = data->passed_mode;

  /* Determine parm's home in the stack, in case it arrives in the stack
     or we should pretend it did.  Compute the stack position and rtx where
     the argument arrives and its size.

     There is one complexity here:  If this was a parameter that would
     have been passed in registers, but wasn't only because it is
     __builtin_va_alist, we want locate_and_pad_parm to treat it as if
     it came in a register so that REG_PARM_STACK_SPACE isn't skipped.
     In this case, we call FUNCTION_ARG with NAMED set to 1 instead of 0
     as it was the previous time.  */
  in_regs = entry_parm != 0;
#ifdef STACK_PARMS_IN_REG_PARM_AREA
  in_regs = true;
#endif
  if (!in_regs && !data->named_arg)
    {
      if (targetm.calls.pretend_outgoing_varargs_named (&all->args_so_far))
        {
          rtx tem;
          tem = targetm.calls.function_incoming_arg (&all->args_so_far,
                                                     data->promoted_mode,
                                                     data->passed_type, true);
          in_regs = tem != NULL;
        }
    }

  /* If this parameter was passed both in registers and in the stack, use
     the copy on the stack.  */
  if (targetm.calls.must_pass_in_stack (data->promoted_mode,
                                        data->passed_type))
    entry_parm = 0;

  if (entry_parm)
    {
      int partial;

      partial = targetm.calls.arg_partial_bytes (&all->args_so_far,
                                                 data->promoted_mode,
                                                 data->passed_type,
                                                 data->named_arg);
      data->partial = partial;

      /* The caller might already have allocated stack space for the
         register parameters.  */
      if (partial != 0 && all->reg_parm_stack_space == 0)
        {
          /* Part of this argument is passed in registers and part
             is passed on the stack.  Ask the prologue code to extend
             the stack part so that we can recreate the full value.

             PRETEND_BYTES is the size of the registers we need to store.
             CURRENT_FUNCTION_PRETEND_ARGS_SIZE is the amount of extra
             stack space that the prologue should allocate.

             Internally, gcc assumes that the argument pointer is aligned
             to STACK_BOUNDARY bits.  This is used both for alignment
             optimizations (see init_emit) and to locate arguments that are
             aligned to more than PARM_BOUNDARY bits.  We must preserve this
             invariant by rounding CURRENT_FUNCTION_PRETEND_ARGS_SIZE up to
             a stack boundary.  */

          /* We assume at most one partial arg, and it must be the first
             argument on the stack.  */
          gcc_assert (!all->extra_pretend_bytes && !all->pretend_args_size);

          pretend_bytes = partial;
          all->pretend_args_size = CEIL_ROUND (pretend_bytes, STACK_BYTES);

          /* We want to align relative to the actual stack pointer, so
             don't include this in the stack size until later.  */
          all->extra_pretend_bytes = all->pretend_args_size;
        }
    }

  locate_and_pad_parm (data->promoted_mode, data->passed_type, in_regs,
                       entry_parm ? data->partial : 0, current_function_decl,
                       &all->stack_args_size, &data->locate);

  /* Update parm_stack_boundary if this parameter is passed in the
     stack.  */
  if (!in_regs && crtl->parm_stack_boundary < data->locate.boundary)
    crtl->parm_stack_boundary = data->locate.boundary;

  /* Adjust offsets to include the pretend args.  */
  pretend_bytes = all->extra_pretend_bytes - pretend_bytes;
  data->locate.slot_offset.constant += pretend_bytes;
  data->locate.offset.constant += pretend_bytes;

  data->entry_parm = entry_parm;
}
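/* Worked example (hypothetical numbers): if 20 bytes of the argument arrive
   in registers (partial == 20) and STACK_BYTES is 16, then
   CEIL_ROUND (20, 16) == 32, so the prologue is asked to pretend 32 bytes of
   stack arguments; the difference is later folded back into the locate
   offsets via extra_pretend_bytes.  */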
/* A subroutine of assign_parms.  If there is actually space on the stack
   for this parm, count it in stack_args_size and return true.  */

static bool
assign_parm_is_stack_parm (struct assign_parm_data_all *all,
                           struct assign_parm_data_one *data)
{
  /* Trivially true if we've no incoming register.  */
  if (data->entry_parm == NULL)
    ;
  /* Also true if we're partially in registers and partially not,
     since we've arranged to drop the entire argument on the stack.  */
  else if (data->partial != 0)
    ;
  /* Also true if the target says that it's passed in both registers
     and on the stack.  */
  else if (GET_CODE (data->entry_parm) == PARALLEL
           && XEXP (XVECEXP (data->entry_parm, 0, 0), 0) == NULL_RTX)
    ;
  /* Also true if the target says that there's stack allocated for
     all register parameters.  */
  else if (all->reg_parm_stack_space > 0)
    ;
  /* Otherwise, no, this parameter has no ABI defined stack slot.  */
  else
    return false;

  all->stack_args_size.constant += data->locate.size.constant;
  if (data->locate.size.var)
    ADD_PARM_SIZE (all->stack_args_size, data->locate.size.var);

  return true;
}
/* A subroutine of assign_parms.  Given that this parameter is allocated
   stack space by the ABI, find it.  */
2558 assign_parm_find_stack_rtl (tree parm
, struct assign_parm_data_one
*data
)
2560 rtx offset_rtx
, stack_parm
;
2561 unsigned int align
, boundary
;
2563 /* If we're passing this arg using a reg, make its stack home the
2564 aligned stack slot. */
2565 if (data
->entry_parm
)
2566 offset_rtx
= ARGS_SIZE_RTX (data
->locate
.slot_offset
);
2568 offset_rtx
= ARGS_SIZE_RTX (data
->locate
.offset
);
2570 stack_parm
= crtl
->args
.internal_arg_pointer
;
2571 if (offset_rtx
!= const0_rtx
)
2572 stack_parm
= gen_rtx_PLUS (Pmode
, stack_parm
, offset_rtx
);
2573 stack_parm
= gen_rtx_MEM (data
->promoted_mode
, stack_parm
);
2575 if (!data
->passed_pointer
)
2577 set_mem_attributes (stack_parm
, parm
, 1);
2578 /* set_mem_attributes could set MEM_SIZE to the passed mode's size,
2579 while promoted mode's size is needed. */
2580 if (data
->promoted_mode
!= BLKmode
2581 && data
->promoted_mode
!= DECL_MODE (parm
))
2583 set_mem_size (stack_parm
,
2584 GEN_INT (GET_MODE_SIZE (data
->promoted_mode
)));
2585 if (MEM_EXPR (stack_parm
) && MEM_OFFSET (stack_parm
))
2587 int offset
= subreg_lowpart_offset (DECL_MODE (parm
),
2588 data
->promoted_mode
);
2590 set_mem_offset (stack_parm
,
2591 plus_constant (MEM_OFFSET (stack_parm
),
2597 boundary
= data
->locate
.boundary
;
2598 align
= BITS_PER_UNIT
;
2600 /* If we're padding upward, we know that the alignment of the slot
2601 is TARGET_FUNCTION_ARG_BOUNDARY. If we're using slot_offset, we're
2602 intentionally forcing upward padding. Otherwise we have to come
2603 up with a guess at the alignment based on OFFSET_RTX. */
2604 if (data
->locate
.where_pad
!= downward
|| data
->entry_parm
)
2606 else if (CONST_INT_P (offset_rtx
))
2608 align
= INTVAL (offset_rtx
) * BITS_PER_UNIT
| boundary
;
2609 align
= align
& -align
;
2611 set_mem_align (stack_parm
, align
);
2613 if (data
->entry_parm
)
2614 set_reg_attrs_for_parm (data
->entry_parm
, stack_parm
);
2616 data
->stack_parm
= stack_parm
;
/* A subroutine of assign_parms.  Adjust DATA->ENTRY_RTL such that it's
   always valid and contiguous.  */
2623 assign_parm_adjust_entry_rtl (struct assign_parm_data_one
*data
)
2625 rtx entry_parm
= data
->entry_parm
;
2626 rtx stack_parm
= data
->stack_parm
;
  /* If this parm was passed part in regs and part in memory, pretend it
     arrived entirely in memory by pushing the register-part onto the stack.
     In the special case of a DImode or DFmode that is split, we could put
     it together in a pseudoreg directly, but for now that's not worth
     bothering with.  */
2633 if (data
->partial
!= 0)
2635 /* Handle calls that pass values in multiple non-contiguous
2636 locations. The Irix 6 ABI has examples of this. */
2637 if (GET_CODE (entry_parm
) == PARALLEL
)
2638 emit_group_store (validize_mem (stack_parm
), entry_parm
,
2640 int_size_in_bytes (data
->passed_type
));
2643 gcc_assert (data
->partial
% UNITS_PER_WORD
== 0);
2644 move_block_from_reg (REGNO (entry_parm
), validize_mem (stack_parm
),
2645 data
->partial
/ UNITS_PER_WORD
);
2648 entry_parm
= stack_parm
;
2651 /* If we didn't decide this parm came in a register, by default it came
2653 else if (entry_parm
== NULL
)
2654 entry_parm
= stack_parm
;
2656 /* When an argument is passed in multiple locations, we can't make use
2657 of this information, but we can save some copying if the whole argument
2658 is passed in a single register. */
2659 else if (GET_CODE (entry_parm
) == PARALLEL
2660 && data
->nominal_mode
!= BLKmode
2661 && data
->passed_mode
!= BLKmode
)
2663 size_t i
, len
= XVECLEN (entry_parm
, 0);
2665 for (i
= 0; i
< len
; i
++)
2666 if (XEXP (XVECEXP (entry_parm
, 0, i
), 0) != NULL_RTX
2667 && REG_P (XEXP (XVECEXP (entry_parm
, 0, i
), 0))
2668 && (GET_MODE (XEXP (XVECEXP (entry_parm
, 0, i
), 0))
2669 == data
->passed_mode
)
2670 && INTVAL (XEXP (XVECEXP (entry_parm
, 0, i
), 1)) == 0)
2672 entry_parm
= XEXP (XVECEXP (entry_parm
, 0, i
), 0);
2677 data
->entry_parm
= entry_parm
;
/* A subroutine of assign_parms.  Reconstitute any values which were
   passed in multiple registers and would fit in a single register.  */

static void
assign_parm_remove_parallels (struct assign_parm_data_one *data)
{
  rtx entry_parm = data->entry_parm;

  /* Convert the PARALLEL to a REG of the same mode as the parallel.
     This can be done with register operations rather than on the
     stack, even if we will store the reconstituted parameter on the
     stack later.  */
  if (GET_CODE (entry_parm) == PARALLEL && GET_MODE (entry_parm) != BLKmode)
    {
      rtx parmreg = gen_reg_rtx (GET_MODE (entry_parm));
      emit_group_store (parmreg, entry_parm, data->passed_type,
                        GET_MODE_SIZE (GET_MODE (entry_parm)));
      entry_parm = parmreg;
    }

  data->entry_parm = entry_parm;
}
/* A subroutine of assign_parms.  Adjust DATA->STACK_RTL such that it's
   always valid and properly aligned.  */
2707 assign_parm_adjust_stack_rtl (struct assign_parm_data_one
*data
)
2709 rtx stack_parm
= data
->stack_parm
;
2711 /* If we can't trust the parm stack slot to be aligned enough for its
2712 ultimate type, don't use that slot after entry. We'll make another
2713 stack slot, if we need one. */
2715 && ((STRICT_ALIGNMENT
2716 && GET_MODE_ALIGNMENT (data
->nominal_mode
) > MEM_ALIGN (stack_parm
))
2717 || (data
->nominal_type
2718 && TYPE_ALIGN (data
->nominal_type
) > MEM_ALIGN (stack_parm
)
2719 && MEM_ALIGN (stack_parm
) < PREFERRED_STACK_BOUNDARY
)))
2722 /* If parm was passed in memory, and we need to convert it on entry,
2723 don't store it back in that same slot. */
2724 else if (data
->entry_parm
== stack_parm
2725 && data
->nominal_mode
!= BLKmode
2726 && data
->nominal_mode
!= data
->passed_mode
)
2729 /* If stack protection is in effect for this function, don't leave any
2730 pointers in their passed stack slots. */
2731 else if (crtl
->stack_protect_guard
2732 && (flag_stack_protect
== 2
2733 || data
->passed_pointer
2734 || POINTER_TYPE_P (data
->nominal_type
)))
2737 data
->stack_parm
= stack_parm
;
/* A subroutine of assign_parms.  Return true if the current parameter
   should be stored as a BLKmode in the current frame.  */

static bool
assign_parm_setup_block_p (struct assign_parm_data_one *data)
{
  if (data->nominal_mode == BLKmode)
    return true;
  if (GET_MODE (data->entry_parm) == BLKmode)
    return true;

#ifdef BLOCK_REG_PADDING
  /* Only assign_parm_setup_block knows how to deal with register arguments
     that are padded at the least significant end.  */
  if (REG_P (data->entry_parm)
      && GET_MODE_SIZE (data->promoted_mode) < UNITS_PER_WORD
      && (BLOCK_REG_PADDING (data->passed_mode, data->passed_type, 1)
          == (BYTES_BIG_ENDIAN ? upward : downward)))
    return true;
#endif

  return false;
}
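/* Illustrative note (only relevant when BLOCK_REG_PADDING is defined): an
   argument smaller than a word that arrives in a register but whose
   padding, per the port, sits at the least significant end cannot be
   handled by the generic register path, so it is routed through
   assign_parm_setup_block even though its mode is not BLKmode.  */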
/* A subroutine of assign_parms.  Arrange for the parameter to be
   present and valid in DATA->STACK_RTL.  */
2768 assign_parm_setup_block (struct assign_parm_data_all
*all
,
2769 tree parm
, struct assign_parm_data_one
*data
)
2771 rtx entry_parm
= data
->entry_parm
;
2772 rtx stack_parm
= data
->stack_parm
;
2774 HOST_WIDE_INT size_stored
;
2776 if (GET_CODE (entry_parm
) == PARALLEL
)
2777 entry_parm
= emit_group_move_into_temps (entry_parm
);
2779 size
= int_size_in_bytes (data
->passed_type
);
2780 size_stored
= CEIL_ROUND (size
, UNITS_PER_WORD
);
2781 if (stack_parm
== 0)
2783 DECL_ALIGN (parm
) = MAX (DECL_ALIGN (parm
), BITS_PER_WORD
);
2784 stack_parm
= assign_stack_local (BLKmode
, size_stored
,
2786 if (GET_MODE_SIZE (GET_MODE (entry_parm
)) == size
)
2787 PUT_MODE (stack_parm
, GET_MODE (entry_parm
));
2788 set_mem_attributes (stack_parm
, parm
, 1);
2791 /* If a BLKmode arrives in registers, copy it to a stack slot. Handle
2792 calls that pass values in multiple non-contiguous locations. */
2793 if (REG_P (entry_parm
) || GET_CODE (entry_parm
) == PARALLEL
)
2797 /* Note that we will be storing an integral number of words.
2798 So we have to be careful to ensure that we allocate an
2799 integral number of words. We do this above when we call
2800 assign_stack_local if space was not allocated in the argument
2801 list. If it was, this will not work if PARM_BOUNDARY is not
2802 a multiple of BITS_PER_WORD. It isn't clear how to fix this
2803 if it becomes a problem. Exception is when BLKmode arrives
2804 with arguments not conforming to word_mode. */
2806 if (data
->stack_parm
== 0)
2808 else if (GET_CODE (entry_parm
) == PARALLEL
)
2811 gcc_assert (!size
|| !(PARM_BOUNDARY
% BITS_PER_WORD
));
2813 mem
= validize_mem (stack_parm
);
2815 /* Handle values in multiple non-contiguous locations. */
2816 if (GET_CODE (entry_parm
) == PARALLEL
)
2818 push_to_sequence2 (all
->first_conversion_insn
,
2819 all
->last_conversion_insn
);
2820 emit_group_store (mem
, entry_parm
, data
->passed_type
, size
);
2821 all
->first_conversion_insn
= get_insns ();
2822 all
->last_conversion_insn
= get_last_insn ();
2829 /* If SIZE is that of a mode no bigger than a word, just use
2830 that mode's store operation. */
2831 else if (size
<= UNITS_PER_WORD
)
2833 enum machine_mode mode
2834 = mode_for_size (size
* BITS_PER_UNIT
, MODE_INT
, 0);
2837 #ifdef BLOCK_REG_PADDING
2838 && (size
== UNITS_PER_WORD
2839 || (BLOCK_REG_PADDING (mode
, data
->passed_type
, 1)
2840 != (BYTES_BIG_ENDIAN
? upward
: downward
)))
2846 /* We are really truncating a word_mode value containing
2847 SIZE bytes into a value of mode MODE. If such an
2848 operation requires no actual instructions, we can refer
2849 to the value directly in mode MODE, otherwise we must
2850 start with the register in word_mode and explicitly
2852 if (TRULY_NOOP_TRUNCATION (size
* BITS_PER_UNIT
, BITS_PER_WORD
))
2853 reg
= gen_rtx_REG (mode
, REGNO (entry_parm
));
2856 reg
= gen_rtx_REG (word_mode
, REGNO (entry_parm
));
2857 reg
= convert_to_mode (mode
, copy_to_reg (reg
), 1);
2859 emit_move_insn (change_address (mem
, mode
, 0), reg
);
2862 /* Blocks smaller than a word on a BYTES_BIG_ENDIAN
2863 machine must be aligned to the left before storing
2864 to memory. Note that the previous test doesn't
2865 handle all cases (e.g. SIZE == 3). */
2866 else if (size
!= UNITS_PER_WORD
2867 #ifdef BLOCK_REG_PADDING
2868 && (BLOCK_REG_PADDING (mode
, data
->passed_type
, 1)
2876 int by
= (UNITS_PER_WORD
- size
) * BITS_PER_UNIT
;
2877 rtx reg
= gen_rtx_REG (word_mode
, REGNO (entry_parm
));
2879 x
= expand_shift (LSHIFT_EXPR
, word_mode
, reg
,
2880 build_int_cst (NULL_TREE
, by
),
2882 tem
= change_address (mem
, word_mode
, 0);
2883 emit_move_insn (tem
, x
);
2886 move_block_from_reg (REGNO (entry_parm
), mem
,
2887 size_stored
/ UNITS_PER_WORD
);
2890 move_block_from_reg (REGNO (entry_parm
), mem
,
2891 size_stored
/ UNITS_PER_WORD
);
2893 else if (data
->stack_parm
== 0)
2895 push_to_sequence2 (all
->first_conversion_insn
, all
->last_conversion_insn
);
2896 emit_block_move (stack_parm
, data
->entry_parm
, GEN_INT (size
),
2898 all
->first_conversion_insn
= get_insns ();
2899 all
->last_conversion_insn
= get_last_insn ();
2903 data
->stack_parm
= stack_parm
;
2904 SET_DECL_RTL (parm
, stack_parm
);
/* A subroutine of assign_parm_setup_reg, called through note_stores.
   This collects sets and clobbers of hard registers in a HARD_REG_SET,
   which is pointed to by DATA.  */

static void
record_hard_reg_sets (rtx x, const_rtx pat ATTRIBUTE_UNUSED, void *data)
{
  HARD_REG_SET *pset = (HARD_REG_SET *)data;
  if (REG_P (x) && HARD_REGISTER_P (x))
    add_to_hard_reg_set (pset, GET_MODE (x), REGNO (x));
}
/* A subroutine of assign_parms.  Allocate a pseudo to hold the current
   parameter.  Get it there.  Perform all ABI specified conversions.  */
2922 assign_parm_setup_reg (struct assign_parm_data_all
*all
, tree parm
,
2923 struct assign_parm_data_one
*data
)
2925 rtx parmreg
, validated_mem
;
2926 rtx equiv_stack_parm
;
2927 enum machine_mode promoted_nominal_mode
;
2928 int unsignedp
= TYPE_UNSIGNED (TREE_TYPE (parm
));
2929 bool did_conversion
= false;
2930 bool need_conversion
, moved
;
2932 /* Store the parm in a pseudoregister during the function, but we may
2933 need to do it in a wider mode. Using 2 here makes the result
2934 consistent with promote_decl_mode and thus expand_expr_real_1. */
2935 promoted_nominal_mode
2936 = promote_function_mode (data
->nominal_type
, data
->nominal_mode
, &unsignedp
,
2937 TREE_TYPE (current_function_decl
), 2);
2939 parmreg
= gen_reg_rtx (promoted_nominal_mode
);
2941 if (!DECL_ARTIFICIAL (parm
))
2942 mark_user_reg (parmreg
);
2944 /* If this was an item that we received a pointer to,
2945 set DECL_RTL appropriately. */
2946 if (data
->passed_pointer
)
2948 rtx x
= gen_rtx_MEM (TYPE_MODE (TREE_TYPE (data
->passed_type
)), parmreg
);
2949 set_mem_attributes (x
, parm
, 1);
2950 SET_DECL_RTL (parm
, x
);
2953 SET_DECL_RTL (parm
, parmreg
);
2955 assign_parm_remove_parallels (data
);
2957 /* Copy the value into the register, thus bridging between
2958 assign_parm_find_data_types and expand_expr_real_1. */
2960 equiv_stack_parm
= data
->stack_parm
;
2961 validated_mem
= validize_mem (data
->entry_parm
);
2963 need_conversion
= (data
->nominal_mode
!= data
->passed_mode
2964 || promoted_nominal_mode
!= data
->promoted_mode
);
2968 && GET_MODE_CLASS (data
->nominal_mode
) == MODE_INT
2969 && data
->nominal_mode
== data
->passed_mode
2970 && data
->nominal_mode
== GET_MODE (data
->entry_parm
))
2972 /* ENTRY_PARM has been converted to PROMOTED_MODE, its
2973 mode, by the caller. We now have to convert it to
2974 NOMINAL_MODE, if different. However, PARMREG may be in
2975 a different mode than NOMINAL_MODE if it is being stored
2978 If ENTRY_PARM is a hard register, it might be in a register
2979 not valid for operating in its mode (e.g., an odd-numbered
2980 register for a DFmode). In that case, moves are the only
2981 thing valid, so we can't do a convert from there. This
2982 occurs when the calling sequence allow such misaligned
2985 In addition, the conversion may involve a call, which could
2986 clobber parameters which haven't been copied to pseudo
2989 First, we try to emit an insn which performs the necessary
2990 conversion. We verify that this insn does not clobber any
2993 enum insn_code icode
;
2996 icode
= can_extend_p (promoted_nominal_mode
, data
->passed_mode
,
3000 op1
= validated_mem
;
3001 if (icode
!= CODE_FOR_nothing
3002 && insn_operand_matches (icode
, 0, op0
)
3003 && insn_operand_matches (icode
, 1, op1
))
3005 enum rtx_code code
= unsignedp
? ZERO_EXTEND
: SIGN_EXTEND
;
3007 HARD_REG_SET hardregs
;
3010 insn
= gen_extend_insn (op0
, op1
, promoted_nominal_mode
,
3011 data
->passed_mode
, unsignedp
);
3013 insns
= get_insns ();
3016 CLEAR_HARD_REG_SET (hardregs
);
3017 for (insn
= insns
; insn
&& moved
; insn
= NEXT_INSN (insn
))
3020 note_stores (PATTERN (insn
), record_hard_reg_sets
,
3022 if (!hard_reg_set_empty_p (hardregs
))
3031 if (equiv_stack_parm
!= NULL_RTX
)
3032 equiv_stack_parm
= gen_rtx_fmt_e (code
, GET_MODE (parmreg
),
3039 /* Nothing to do. */
3041 else if (need_conversion
)
3043 /* We did not have an insn to convert directly, or the sequence
3044 generated appeared unsafe. We must first copy the parm to a
3045 pseudo reg, and save the conversion until after all
3046 parameters have been moved. */
3049 rtx tempreg
= gen_reg_rtx (GET_MODE (data
->entry_parm
));
3051 emit_move_insn (tempreg
, validated_mem
);
3053 push_to_sequence2 (all
->first_conversion_insn
, all
->last_conversion_insn
);
3054 tempreg
= convert_to_mode (data
->nominal_mode
, tempreg
, unsignedp
);
3056 if (GET_CODE (tempreg
) == SUBREG
3057 && GET_MODE (tempreg
) == data
->nominal_mode
3058 && REG_P (SUBREG_REG (tempreg
))
3059 && data
->nominal_mode
== data
->passed_mode
3060 && GET_MODE (SUBREG_REG (tempreg
)) == GET_MODE (data
->entry_parm
)
3061 && GET_MODE_SIZE (GET_MODE (tempreg
))
3062 < GET_MODE_SIZE (GET_MODE (data
->entry_parm
)))
3064 /* The argument is already sign/zero extended, so note it
3066 SUBREG_PROMOTED_VAR_P (tempreg
) = 1;
3067 SUBREG_PROMOTED_UNSIGNED_SET (tempreg
, unsignedp
);
3070 /* TREE_USED gets set erroneously during expand_assignment. */
3071 save_tree_used
= TREE_USED (parm
);
3072 expand_assignment (parm
, make_tree (data
->nominal_type
, tempreg
), false);
3073 TREE_USED (parm
) = save_tree_used
;
3074 all
->first_conversion_insn
= get_insns ();
3075 all
->last_conversion_insn
= get_last_insn ();
3078 did_conversion
= true;
3081 emit_move_insn (parmreg
, validated_mem
);
3083 /* If we were passed a pointer but the actual value can safely live
3084 in a register, put it in one. */
3085 if (data
->passed_pointer
3086 && TYPE_MODE (TREE_TYPE (parm
)) != BLKmode
3087 /* If by-reference argument was promoted, demote it. */
3088 && (TYPE_MODE (TREE_TYPE (parm
)) != GET_MODE (DECL_RTL (parm
))
3089 || use_register_for_decl (parm
)))
3091 /* We can't use nominal_mode, because it will have been set to
3092 Pmode above. We must use the actual mode of the parm. */
3093 parmreg
= gen_reg_rtx (TYPE_MODE (TREE_TYPE (parm
)));
3094 mark_user_reg (parmreg
);
3096 if (GET_MODE (parmreg
) != GET_MODE (DECL_RTL (parm
)))
3098 rtx tempreg
= gen_reg_rtx (GET_MODE (DECL_RTL (parm
)));
3099 int unsigned_p
= TYPE_UNSIGNED (TREE_TYPE (parm
));
3101 push_to_sequence2 (all
->first_conversion_insn
,
3102 all
->last_conversion_insn
);
3103 emit_move_insn (tempreg
, DECL_RTL (parm
));
3104 tempreg
= convert_to_mode (GET_MODE (parmreg
), tempreg
, unsigned_p
);
3105 emit_move_insn (parmreg
, tempreg
);
3106 all
->first_conversion_insn
= get_insns ();
3107 all
->last_conversion_insn
= get_last_insn ();
3110 did_conversion
= true;
3113 emit_move_insn (parmreg
, DECL_RTL (parm
));
3115 SET_DECL_RTL (parm
, parmreg
);
3117 /* STACK_PARM is the pointer, not the parm, and PARMREG is
3119 data
->stack_parm
= NULL
;
3122 /* Mark the register as eliminable if we did no conversion and it was
3123 copied from memory at a fixed offset, and the arg pointer was not
3124 copied to a pseudo-reg. If the arg pointer is a pseudo reg or the
3125 offset formed an invalid address, such memory-equivalences as we
3126 make here would screw up life analysis for it. */
3127 if (data
->nominal_mode
== data
->passed_mode
3129 && data
->stack_parm
!= 0
3130 && MEM_P (data
->stack_parm
)
3131 && data
->locate
.offset
.var
== 0
3132 && reg_mentioned_p (virtual_incoming_args_rtx
,
3133 XEXP (data
->stack_parm
, 0)))
3135 rtx linsn
= get_last_insn ();
3138 /* Mark complex types separately. */
3139 if (GET_CODE (parmreg
) == CONCAT
)
3141 enum machine_mode submode
3142 = GET_MODE_INNER (GET_MODE (parmreg
));
3143 int regnor
= REGNO (XEXP (parmreg
, 0));
3144 int regnoi
= REGNO (XEXP (parmreg
, 1));
3145 rtx stackr
= adjust_address_nv (data
->stack_parm
, submode
, 0);
3146 rtx stacki
= adjust_address_nv (data
->stack_parm
, submode
,
3147 GET_MODE_SIZE (submode
));
3149 /* Scan backwards for the set of the real and
3151 for (sinsn
= linsn
; sinsn
!= 0;
3152 sinsn
= prev_nonnote_insn (sinsn
))
3154 set
= single_set (sinsn
);
3158 if (SET_DEST (set
) == regno_reg_rtx
[regnoi
])
3159 set_unique_reg_note (sinsn
, REG_EQUIV
, stacki
);
3160 else if (SET_DEST (set
) == regno_reg_rtx
[regnor
])
3161 set_unique_reg_note (sinsn
, REG_EQUIV
, stackr
);
3164 else if ((set
= single_set (linsn
)) != 0
3165 && SET_DEST (set
) == parmreg
)
3166 set_unique_reg_note (linsn
, REG_EQUIV
, equiv_stack_parm
);
3169 /* For pointer data type, suggest pointer register. */
3170 if (POINTER_TYPE_P (TREE_TYPE (parm
)))
3171 mark_reg_pointer (parmreg
,
3172 TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm
))));
/* A subroutine of assign_parms.  Allocate stack space to hold the current
   parameter.  Get it there.  Perform all ABI specified conversions.  */
3179 assign_parm_setup_stack (struct assign_parm_data_all
*all
, tree parm
,
3180 struct assign_parm_data_one
*data
)
3182 /* Value must be stored in the stack slot STACK_PARM during function
3184 bool to_conversion
= false;
3186 assign_parm_remove_parallels (data
);
3188 if (data
->promoted_mode
!= data
->nominal_mode
)
3190 /* Conversion is required. */
3191 rtx tempreg
= gen_reg_rtx (GET_MODE (data
->entry_parm
));
3193 emit_move_insn (tempreg
, validize_mem (data
->entry_parm
));
3195 push_to_sequence2 (all
->first_conversion_insn
, all
->last_conversion_insn
);
3196 to_conversion
= true;
3198 data
->entry_parm
= convert_to_mode (data
->nominal_mode
, tempreg
,
3199 TYPE_UNSIGNED (TREE_TYPE (parm
)));
3201 if (data
->stack_parm
)
3203 int offset
= subreg_lowpart_offset (data
->nominal_mode
,
3204 GET_MODE (data
->stack_parm
));
3205 /* ??? This may need a big-endian conversion on sparc64. */
3207 = adjust_address (data
->stack_parm
, data
->nominal_mode
, 0);
3208 if (offset
&& MEM_OFFSET (data
->stack_parm
))
3209 set_mem_offset (data
->stack_parm
,
3210 plus_constant (MEM_OFFSET (data
->stack_parm
),
3215 if (data
->entry_parm
!= data
->stack_parm
)
3219 if (data
->stack_parm
== 0)
3221 int align
= STACK_SLOT_ALIGNMENT (data
->passed_type
,
3222 GET_MODE (data
->entry_parm
),
3223 TYPE_ALIGN (data
->passed_type
));
3225 = assign_stack_local (GET_MODE (data
->entry_parm
),
3226 GET_MODE_SIZE (GET_MODE (data
->entry_parm
)),
3228 set_mem_attributes (data
->stack_parm
, parm
, 1);
3231 dest
= validize_mem (data
->stack_parm
);
3232 src
= validize_mem (data
->entry_parm
);
3236 /* Use a block move to handle potentially misaligned entry_parm. */
3238 push_to_sequence2 (all
->first_conversion_insn
,
3239 all
->last_conversion_insn
);
3240 to_conversion
= true;
3242 emit_block_move (dest
, src
,
3243 GEN_INT (int_size_in_bytes (data
->passed_type
)),
3247 emit_move_insn (dest
, src
);
3252 all
->first_conversion_insn
= get_insns ();
3253 all
->last_conversion_insn
= get_last_insn ();
3257 SET_DECL_RTL (parm
, data
->stack_parm
);
/* A subroutine of assign_parms.  If the ABI splits complex arguments, then
   undo the frobbing that we did in assign_parms_augmented_arg_list.  */
3264 assign_parms_unsplit_complex (struct assign_parm_data_all
*all
,
3265 VEC(tree
, heap
) *fnargs
)
3268 tree orig_fnargs
= all
->orig_fnargs
;
3271 for (parm
= orig_fnargs
; parm
; parm
= TREE_CHAIN (parm
), ++i
)
3273 if (TREE_CODE (TREE_TYPE (parm
)) == COMPLEX_TYPE
3274 && targetm
.calls
.split_complex_arg (TREE_TYPE (parm
)))
3276 rtx tmp
, real
, imag
;
3277 enum machine_mode inner
= GET_MODE_INNER (DECL_MODE (parm
));
3279 real
= DECL_RTL (VEC_index (tree
, fnargs
, i
));
3280 imag
= DECL_RTL (VEC_index (tree
, fnargs
, i
+ 1));
3281 if (inner
!= GET_MODE (real
))
3283 real
= gen_lowpart_SUBREG (inner
, real
);
3284 imag
= gen_lowpart_SUBREG (inner
, imag
);
3287 if (TREE_ADDRESSABLE (parm
))
3290 HOST_WIDE_INT size
= int_size_in_bytes (TREE_TYPE (parm
));
3291 int align
= STACK_SLOT_ALIGNMENT (TREE_TYPE (parm
),
3293 TYPE_ALIGN (TREE_TYPE (parm
)));
3295 /* split_complex_arg put the real and imag parts in
3296 pseudos. Move them to memory. */
3297 tmp
= assign_stack_local (DECL_MODE (parm
), size
, align
);
3298 set_mem_attributes (tmp
, parm
, 1);
3299 rmem
= adjust_address_nv (tmp
, inner
, 0);
3300 imem
= adjust_address_nv (tmp
, inner
, GET_MODE_SIZE (inner
));
3301 push_to_sequence2 (all
->first_conversion_insn
,
3302 all
->last_conversion_insn
);
3303 emit_move_insn (rmem
, real
);
3304 emit_move_insn (imem
, imag
);
3305 all
->first_conversion_insn
= get_insns ();
3306 all
->last_conversion_insn
= get_last_insn ();
3310 tmp
= gen_rtx_CONCAT (DECL_MODE (parm
), real
, imag
);
3311 SET_DECL_RTL (parm
, tmp
);
3313 real
= DECL_INCOMING_RTL (VEC_index (tree
, fnargs
, i
));
3314 imag
= DECL_INCOMING_RTL (VEC_index (tree
, fnargs
, i
+ 1));
3315 if (inner
!= GET_MODE (real
))
3317 real
= gen_lowpart_SUBREG (inner
, real
);
3318 imag
= gen_lowpart_SUBREG (inner
, imag
);
3320 tmp
= gen_rtx_CONCAT (DECL_MODE (parm
), real
, imag
);
3321 set_decl_incoming_rtl (parm
, tmp
, false);
/* Assign RTL expressions to the function's parameters.  This may involve
   copying them into registers and using those registers as the DECL_RTL.  */
3331 assign_parms (tree fndecl
)
3333 struct assign_parm_data_all all
;
3335 VEC(tree
, heap
) *fnargs
;
3338 crtl
->args
.internal_arg_pointer
3339 = targetm
.calls
.internal_arg_pointer ();
3341 assign_parms_initialize_all (&all
);
3342 fnargs
= assign_parms_augmented_arg_list (&all
);
3344 FOR_EACH_VEC_ELT (tree
, fnargs
, i
, parm
)
3346 struct assign_parm_data_one data
;
3348 /* Extract the type of PARM; adjust it according to ABI. */
3349 assign_parm_find_data_types (&all
, parm
, &data
);
3351 /* Early out for errors and void parameters. */
3352 if (data
.passed_mode
== VOIDmode
)
3354 SET_DECL_RTL (parm
, const0_rtx
);
3355 DECL_INCOMING_RTL (parm
) = DECL_RTL (parm
);
3359 /* Estimate stack alignment from parameter alignment. */
3360 if (SUPPORTS_STACK_ALIGNMENT
)
3363 = targetm
.calls
.function_arg_boundary (data
.promoted_mode
,
3365 align
= MINIMUM_ALIGNMENT (data
.passed_type
, data
.promoted_mode
,
3367 if (TYPE_ALIGN (data
.nominal_type
) > align
)
3368 align
= MINIMUM_ALIGNMENT (data
.nominal_type
,
3369 TYPE_MODE (data
.nominal_type
),
3370 TYPE_ALIGN (data
.nominal_type
));
3371 if (crtl
->stack_alignment_estimated
< align
)
3373 gcc_assert (!crtl
->stack_realign_processed
);
3374 crtl
->stack_alignment_estimated
= align
;
3378 if (cfun
->stdarg
&& !DECL_CHAIN (parm
))
3379 assign_parms_setup_varargs (&all
, &data
, false);
3381 /* Find out where the parameter arrives in this function. */
3382 assign_parm_find_entry_rtl (&all
, &data
);
3384 /* Find out where stack space for this parameter might be. */
3385 if (assign_parm_is_stack_parm (&all
, &data
))
3387 assign_parm_find_stack_rtl (parm
, &data
);
3388 assign_parm_adjust_entry_rtl (&data
);
3391 /* Record permanently how this parm was passed. */
3392 if (data
.passed_pointer
)
3395 = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (data
.passed_type
)),
3397 set_decl_incoming_rtl (parm
, incoming_rtl
, true);
3400 set_decl_incoming_rtl (parm
, data
.entry_parm
, false);
3402 /* Update info on where next arg arrives in registers. */
3403 targetm
.calls
.function_arg_advance (&all
.args_so_far
, data
.promoted_mode
,
3404 data
.passed_type
, data
.named_arg
);
3406 assign_parm_adjust_stack_rtl (&data
);
3408 if (assign_parm_setup_block_p (&data
))
3409 assign_parm_setup_block (&all
, parm
, &data
);
3410 else if (data
.passed_pointer
|| use_register_for_decl (parm
))
3411 assign_parm_setup_reg (&all
, parm
, &data
);
3413 assign_parm_setup_stack (&all
, parm
, &data
);
3416 if (targetm
.calls
.split_complex_arg
)
3417 assign_parms_unsplit_complex (&all
, fnargs
);
3419 VEC_free (tree
, heap
, fnargs
);
3421 /* Output all parameter conversion instructions (possibly including calls)
3422 now that all parameters have been copied out of hard registers. */
3423 emit_insn (all
.first_conversion_insn
);
3425 /* Estimate reload stack alignment from scalar return mode. */
3426 if (SUPPORTS_STACK_ALIGNMENT
)
3428 if (DECL_RESULT (fndecl
))
3430 tree type
= TREE_TYPE (DECL_RESULT (fndecl
));
3431 enum machine_mode mode
= TYPE_MODE (type
);
3435 && !AGGREGATE_TYPE_P (type
))
3437 unsigned int align
= GET_MODE_ALIGNMENT (mode
);
3438 if (crtl
->stack_alignment_estimated
< align
)
3440 gcc_assert (!crtl
->stack_realign_processed
);
3441 crtl
->stack_alignment_estimated
= align
;
  /* If we are receiving a struct value address as the first argument, set up
     the RTL for the function result.  As this might require code to convert
     the transmitted address to Pmode, we do this here to ensure that possible
     preliminary conversions of the address have been emitted already.  */
3451 if (all
.function_result_decl
)
3453 tree result
= DECL_RESULT (current_function_decl
);
3454 rtx addr
= DECL_RTL (all
.function_result_decl
);
3457 if (DECL_BY_REFERENCE (result
))
3459 SET_DECL_VALUE_EXPR (result
, all
.function_result_decl
);
3464 SET_DECL_VALUE_EXPR (result
,
3465 build1 (INDIRECT_REF
, TREE_TYPE (result
),
3466 all
.function_result_decl
));
3467 addr
= convert_memory_address (Pmode
, addr
);
3468 x
= gen_rtx_MEM (DECL_MODE (result
), addr
);
3469 set_mem_attributes (x
, result
, 1);
3472 DECL_HAS_VALUE_EXPR_P (result
) = 1;
3474 SET_DECL_RTL (result
, x
);
3477 /* We have aligned all the args, so add space for the pretend args. */
3478 crtl
->args
.pretend_args_size
= all
.pretend_args_size
;
3479 all
.stack_args_size
.constant
+= all
.extra_pretend_bytes
;
3480 crtl
->args
.size
= all
.stack_args_size
.constant
;
3482 /* Adjust function incoming argument size for alignment and
3485 #ifdef REG_PARM_STACK_SPACE
3486 crtl
->args
.size
= MAX (crtl
->args
.size
,
3487 REG_PARM_STACK_SPACE (fndecl
));
3490 crtl
->args
.size
= CEIL_ROUND (crtl
->args
.size
,
3491 PARM_BOUNDARY
/ BITS_PER_UNIT
);
3493 #ifdef ARGS_GROW_DOWNWARD
3494 crtl
->args
.arg_offset_rtx
3495 = (all
.stack_args_size
.var
== 0 ? GEN_INT (-all
.stack_args_size
.constant
)
3496 : expand_expr (size_diffop (all
.stack_args_size
.var
,
3497 size_int (-all
.stack_args_size
.constant
)),
3498 NULL_RTX
, VOIDmode
, EXPAND_NORMAL
));
3500 crtl
->args
.arg_offset_rtx
= ARGS_SIZE_RTX (all
.stack_args_size
);
3503 /* See how many bytes, if any, of its args a function should try to pop
3506 crtl
->args
.pops_args
= targetm
.calls
.return_pops_args (fndecl
,
3510 /* For stdarg.h function, save info about
3511 regs and stack space used by the named args. */
3513 crtl
->args
.info
= all
.args_so_far
;
3515 /* Set the rtx used for the function return value. Put this in its
3516 own variable so any optimizers that need this information don't have
3517 to include tree.h. Do this here so it gets done when an inlined
3518 function gets output. */
3521 = (DECL_RTL_SET_P (DECL_RESULT (fndecl
))
3522 ? DECL_RTL (DECL_RESULT (fndecl
)) : NULL_RTX
);
3524 /* If scalar return value was computed in a pseudo-reg, or was a named
3525 return value that got dumped to the stack, copy that to the hard
3527 if (DECL_RTL_SET_P (DECL_RESULT (fndecl
)))
3529 tree decl_result
= DECL_RESULT (fndecl
);
3530 rtx decl_rtl
= DECL_RTL (decl_result
);
3532 if (REG_P (decl_rtl
)
3533 ? REGNO (decl_rtl
) >= FIRST_PSEUDO_REGISTER
3534 : DECL_REGISTER (decl_result
))
3538 real_decl_rtl
= targetm
.calls
.function_value (TREE_TYPE (decl_result
),
3540 REG_FUNCTION_VALUE_P (real_decl_rtl
) = 1;
3541 /* The delay slot scheduler assumes that crtl->return_rtx
3542 holds the hard register containing the return value, not a
3543 temporary pseudo. */
3544 crtl
->return_rtx
= real_decl_rtl
;
/* A subroutine of gimplify_parameters, invoked via walk_tree.
   For all seen types, gimplify their sizes.  */

static tree
gimplify_parm_type (tree *tp, int *walk_subtrees, void *data)
{
  tree t = *tp;

  *walk_subtrees = 0;
  if (TYPE_P (t))
    {
      if (POINTER_TYPE_P (t))
        *walk_subtrees = 1;
      else if (TYPE_SIZE (t) && !TREE_CONSTANT (TYPE_SIZE (t))
               && !TYPE_SIZES_GIMPLIFIED (t))
        {
          gimplify_type_sizes (t, (gimple_seq *) data);
          *walk_subtrees = 1;
        }
    }

  return NULL;
}
/* Gimplify the parameter list for current_function_decl.  This involves
   evaluating SAVE_EXPRs of variable sized parameters and generating code
   to implement callee-copies reference parameters.  Returns a sequence of
   statements to add to the beginning of the function.  */
3579 gimplify_parameters (void)
3581 struct assign_parm_data_all all
;
3583 gimple_seq stmts
= NULL
;
3584 VEC(tree
, heap
) *fnargs
;
3587 assign_parms_initialize_all (&all
);
3588 fnargs
= assign_parms_augmented_arg_list (&all
);
3590 FOR_EACH_VEC_ELT (tree
, fnargs
, i
, parm
)
3592 struct assign_parm_data_one data
;
3594 /* Extract the type of PARM; adjust it according to ABI. */
3595 assign_parm_find_data_types (&all
, parm
, &data
);
3597 /* Early out for errors and void parameters. */
3598 if (data
.passed_mode
== VOIDmode
|| DECL_SIZE (parm
) == NULL
)
3601 /* Update info on where next arg arrives in registers. */
3602 targetm
.calls
.function_arg_advance (&all
.args_so_far
, data
.promoted_mode
,
3603 data
.passed_type
, data
.named_arg
);
3605 /* ??? Once upon a time variable_size stuffed parameter list
3606 SAVE_EXPRs (amongst others) onto a pending sizes list. This
3607 turned out to be less than manageable in the gimple world.
3608 Now we have to hunt them down ourselves. */
3609 walk_tree_without_duplicates (&data
.passed_type
,
3610 gimplify_parm_type
, &stmts
);
3612 if (TREE_CODE (DECL_SIZE_UNIT (parm
)) != INTEGER_CST
)
3614 gimplify_one_sizepos (&DECL_SIZE (parm
), &stmts
);
3615 gimplify_one_sizepos (&DECL_SIZE_UNIT (parm
), &stmts
);
3618 if (data
.passed_pointer
)
3620 tree type
= TREE_TYPE (data
.passed_type
);
3621 if (reference_callee_copied (&all
.args_so_far
, TYPE_MODE (type
),
3622 type
, data
.named_arg
))
3626 /* For constant-sized objects, this is trivial; for
3627 variable-sized objects, we have to play games. */
3628 if (TREE_CODE (DECL_SIZE_UNIT (parm
)) == INTEGER_CST
3629 && !(flag_stack_check
== GENERIC_STACK_CHECK
3630 && compare_tree_int (DECL_SIZE_UNIT (parm
),
3631 STACK_CHECK_MAX_VAR_SIZE
) > 0))
3633 local
= create_tmp_reg (type
, get_name (parm
));
3634 DECL_IGNORED_P (local
) = 0;
3635 /* If PARM was addressable, move that flag over
3636 to the local copy, as its address will be taken,
3637 not the PARMs. Keep the parms address taken
3638 as we'll query that flag during gimplification. */
3639 if (TREE_ADDRESSABLE (parm
))
3640 TREE_ADDRESSABLE (local
) = 1;
3644 tree ptr_type
, addr
;
3646 ptr_type
= build_pointer_type (type
);
3647 addr
= create_tmp_reg (ptr_type
, get_name (parm
));
3648 DECL_IGNORED_P (addr
) = 0;
3649 local
= build_fold_indirect_ref (addr
);
3651 t
= built_in_decls
[BUILT_IN_ALLOCA
];
3652 t
= build_call_expr (t
, 1, DECL_SIZE_UNIT (parm
));
3653 /* The call has been built for a variable-sized object. */
3654 CALL_ALLOCA_FOR_VAR_P (t
) = 1;
3655 t
= fold_convert (ptr_type
, t
);
3656 t
= build2 (MODIFY_EXPR
, TREE_TYPE (addr
), addr
, t
);
3657 gimplify_and_add (t
, &stmts
);
3660 gimplify_assign (local
, parm
, &stmts
);
3662 SET_DECL_VALUE_EXPR (parm
, local
);
3663 DECL_HAS_VALUE_EXPR_P (parm
) = 1;
3668 VEC_free (tree
, heap
, fnargs
);
/* Compute the size and offset from the start of the stacked arguments for a
   parm passed in mode PASSED_MODE and with type TYPE.

   INITIAL_OFFSET_PTR points to the current offset into the stacked
   arguments.

   The starting offset and size for this parm are returned in
   LOCATE->OFFSET and LOCATE->SIZE, respectively.  When IN_REGS is
   nonzero, the offset is that of the stack slot, which is returned in
   LOCATE->SLOT_OFFSET.  LOCATE->ALIGNMENT_PAD is the amount of
   padding required from the initial offset ptr to the stack slot.

   IN_REGS is nonzero if the argument will be passed in registers.  It will
   never be set if REG_PARM_STACK_SPACE is not defined.

   FNDECL is the function in which the argument was defined.

   There are two types of rounding that are done.  The first, controlled by
   TARGET_FUNCTION_ARG_BOUNDARY, forces the offset from the start of the
   argument list to be aligned to the specified boundary (in bits).  This
   rounding affects the initial and starting offsets, but not the argument
   size.

   The second, controlled by FUNCTION_ARG_PADDING and PARM_BOUNDARY,
   optionally rounds the size of the parm to PARM_BOUNDARY.  The
   initial offset is not affected by this rounding, while the size always
   is and the starting offset may be.  */

/*  LOCATE->OFFSET will be negative for ARGS_GROW_DOWNWARD case;
    INITIAL_OFFSET_PTR is positive because locate_and_pad_parm's
    callers pass in the total size of args so far as
    INITIAL_OFFSET_PTR.  LOCATE->SIZE is always positive.  */
3707 locate_and_pad_parm (enum machine_mode passed_mode
, tree type
, int in_regs
,
3708 int partial
, tree fndecl ATTRIBUTE_UNUSED
,
3709 struct args_size
*initial_offset_ptr
,
3710 struct locate_and_pad_arg_data
*locate
)
3713 enum direction where_pad
;
3714 unsigned int boundary
;
3715 int reg_parm_stack_space
= 0;
3716 int part_size_in_regs
;
3718 #ifdef REG_PARM_STACK_SPACE
3719 reg_parm_stack_space
= REG_PARM_STACK_SPACE (fndecl
);
3721 /* If we have found a stack parm before we reach the end of the
3722 area reserved for registers, skip that area. */
3725 if (reg_parm_stack_space
> 0)
3727 if (initial_offset_ptr
->var
)
3729 initial_offset_ptr
->var
3730 = size_binop (MAX_EXPR
, ARGS_SIZE_TREE (*initial_offset_ptr
),
3731 ssize_int (reg_parm_stack_space
));
3732 initial_offset_ptr
->constant
= 0;
3734 else if (initial_offset_ptr
->constant
< reg_parm_stack_space
)
3735 initial_offset_ptr
->constant
= reg_parm_stack_space
;
3738 #endif /* REG_PARM_STACK_SPACE */
3740 part_size_in_regs
= (reg_parm_stack_space
== 0 ? partial
: 0);
3743 = type
? size_in_bytes (type
) : size_int (GET_MODE_SIZE (passed_mode
));
3744 where_pad
= FUNCTION_ARG_PADDING (passed_mode
, type
);
3745 boundary
= targetm
.calls
.function_arg_boundary (passed_mode
, type
);
3746 locate
->where_pad
= where_pad
;
3748 /* Alignment can't exceed MAX_SUPPORTED_STACK_ALIGNMENT. */
3749 if (boundary
> MAX_SUPPORTED_STACK_ALIGNMENT
)
3750 boundary
= MAX_SUPPORTED_STACK_ALIGNMENT
;
3752 locate
->boundary
= boundary
;
3754 if (SUPPORTS_STACK_ALIGNMENT
)
3756 /* stack_alignment_estimated can't change after stack has been
3758 if (crtl
->stack_alignment_estimated
< boundary
)
3760 if (!crtl
->stack_realign_processed
)
3761 crtl
->stack_alignment_estimated
= boundary
;
3764 /* If stack is realigned and stack alignment value
3765 hasn't been finalized, it is OK not to increase
3766 stack_alignment_estimated. The bigger alignment
3767 requirement is recorded in stack_alignment_needed
3769 gcc_assert (!crtl
->stack_realign_finalized
3770 && crtl
->stack_realign_needed
);
3775 /* Remember if the outgoing parameter requires extra alignment on the
3776 calling function side. */
3777 if (crtl
->stack_alignment_needed
< boundary
)
3778 crtl
->stack_alignment_needed
= boundary
;
3779 if (crtl
->preferred_stack_boundary
< boundary
)
3780 crtl
->preferred_stack_boundary
= boundary
;
3782 #ifdef ARGS_GROW_DOWNWARD
3783 locate
->slot_offset
.constant
= -initial_offset_ptr
->constant
;
3784 if (initial_offset_ptr
->var
)
3785 locate
->slot_offset
.var
= size_binop (MINUS_EXPR
, ssize_int (0),
3786 initial_offset_ptr
->var
);
3790 if (where_pad
!= none
3791 && (!host_integerp (sizetree
, 1)
3792 || (tree_low_cst (sizetree
, 1) * BITS_PER_UNIT
) % PARM_BOUNDARY
))
3793 s2
= round_up (s2
, PARM_BOUNDARY
/ BITS_PER_UNIT
);
3794 SUB_PARM_SIZE (locate
->slot_offset
, s2
);
3797 locate
->slot_offset
.constant
+= part_size_in_regs
;
3800 #ifdef REG_PARM_STACK_SPACE
3801 || REG_PARM_STACK_SPACE (fndecl
) > 0
3804 pad_to_arg_alignment (&locate
->slot_offset
, boundary
,
3805 &locate
->alignment_pad
);
3807 locate
->size
.constant
= (-initial_offset_ptr
->constant
3808 - locate
->slot_offset
.constant
);
3809 if (initial_offset_ptr
->var
)
3810 locate
->size
.var
= size_binop (MINUS_EXPR
,
3811 size_binop (MINUS_EXPR
,
3813 initial_offset_ptr
->var
),
3814 locate
->slot_offset
.var
);
3816 /* Pad_below needs the pre-rounded size to know how much to pad
3818 locate
->offset
= locate
->slot_offset
;
3819 if (where_pad
== downward
)
3820 pad_below (&locate
->offset
, passed_mode
, sizetree
);
3822 #else /* !ARGS_GROW_DOWNWARD */
3824 #ifdef REG_PARM_STACK_SPACE
3825 || REG_PARM_STACK_SPACE (fndecl
) > 0
3828 pad_to_arg_alignment (initial_offset_ptr
, boundary
,
3829 &locate
->alignment_pad
);
3830 locate
->slot_offset
= *initial_offset_ptr
;
3832 #ifdef PUSH_ROUNDING
3833 if (passed_mode
!= BLKmode
)
3834 sizetree
= size_int (PUSH_ROUNDING (TREE_INT_CST_LOW (sizetree
)));
3837 /* Pad_below needs the pre-rounded size to know how much to pad below
3838 so this must be done before rounding up. */
3839 locate
->offset
= locate
->slot_offset
;
3840 if (where_pad
== downward
)
3841 pad_below (&locate
->offset
, passed_mode
, sizetree
);
3843 if (where_pad
!= none
3844 && (!host_integerp (sizetree
, 1)
3845 || (tree_low_cst (sizetree
, 1) * BITS_PER_UNIT
) % PARM_BOUNDARY
))
3846 sizetree
= round_up (sizetree
, PARM_BOUNDARY
/ BITS_PER_UNIT
);
3848 ADD_PARM_SIZE (locate
->size
, sizetree
);
3850 locate
->size
.constant
-= part_size_in_regs
;
3851 #endif /* ARGS_GROW_DOWNWARD */
3853 #ifdef FUNCTION_ARG_OFFSET
3854 locate
->offset
.constant
+= FUNCTION_ARG_OFFSET (passed_mode
, type
);
/* Round the stack offset in *OFFSET_PTR up to a multiple of BOUNDARY.
   BOUNDARY is measured in bits, but must be a multiple of a storage unit.  */

static void
pad_to_arg_alignment (struct args_size *offset_ptr, int boundary,
                      struct args_size *alignment_pad)
{
  tree save_var = NULL_TREE;
  HOST_WIDE_INT save_constant = 0;
  int boundary_in_bytes = boundary / BITS_PER_UNIT;
  HOST_WIDE_INT sp_offset = STACK_POINTER_OFFSET;

#ifdef SPARC_STACK_BOUNDARY_HACK
  /* ??? The SPARC port may claim a STACK_BOUNDARY higher than
     the real alignment of %sp.  However, when it does this, the
     alignment of %sp+STACK_POINTER_OFFSET is STACK_BOUNDARY.  */
  if (SPARC_STACK_BOUNDARY_HACK)
    sp_offset = 0;
#endif

  if (boundary > PARM_BOUNDARY)
    {
      save_var = offset_ptr->var;
      save_constant = offset_ptr->constant;
    }

  alignment_pad->var = NULL_TREE;
  alignment_pad->constant = 0;

  if (boundary > BITS_PER_UNIT)
    {
      if (offset_ptr->var)
        {
          tree sp_offset_tree = ssize_int (sp_offset);
          tree offset = size_binop (PLUS_EXPR,
                                    ARGS_SIZE_TREE (*offset_ptr),
                                    sp_offset_tree);
#ifdef ARGS_GROW_DOWNWARD
          tree rounded = round_down (offset, boundary / BITS_PER_UNIT);
#else
          tree rounded = round_up (offset, boundary / BITS_PER_UNIT);
#endif

          offset_ptr->var = size_binop (MINUS_EXPR, rounded, sp_offset_tree);
          /* ARGS_SIZE_TREE includes constant term.  */
          offset_ptr->constant = 0;
          if (boundary > PARM_BOUNDARY)
            alignment_pad->var = size_binop (MINUS_EXPR, offset_ptr->var,
                                             save_var);
        }
      else
        {
          offset_ptr->constant = -sp_offset +
#ifdef ARGS_GROW_DOWNWARD
            FLOOR_ROUND (offset_ptr->constant + sp_offset, boundary_in_bytes);
#else
            CEIL_ROUND (offset_ptr->constant + sp_offset, boundary_in_bytes);
#endif
          if (boundary > PARM_BOUNDARY)
            alignment_pad->constant = offset_ptr->constant - save_constant;
        }
    }
}
static void
pad_below (struct args_size *offset_ptr, enum machine_mode passed_mode, tree sizetree)
{
  if (passed_mode != BLKmode)
    {
      if (GET_MODE_BITSIZE (passed_mode) % PARM_BOUNDARY)
        offset_ptr->constant
          += (((GET_MODE_BITSIZE (passed_mode) + PARM_BOUNDARY - 1)
               / PARM_BOUNDARY * PARM_BOUNDARY / BITS_PER_UNIT)
              - GET_MODE_SIZE (passed_mode));
    }
  else
    {
      if (TREE_CODE (sizetree) != INTEGER_CST
          || (TREE_INT_CST_LOW (sizetree) * BITS_PER_UNIT) % PARM_BOUNDARY)
        {
          /* Round the size up to multiple of PARM_BOUNDARY bits.  */
          tree s2 = round_up (sizetree, PARM_BOUNDARY / BITS_PER_UNIT);
          /* Add it in.  */
          ADD_PARM_SIZE (*offset_ptr, s2);
          SUB_PARM_SIZE (*offset_ptr, sizetree);
        }
    }
}
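/* Worked example (hypothetical numbers): for a BLKmode argument of 6 bytes
   with PARM_BOUNDARY == 32, the size is rounded up to 8 bytes and the
   2-byte difference is added to the offset, placing the value at the far
   end of its padded slot.  */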
/* True if register REGNO was alive at a place where `setjmp' was
   called and was set more than once or is an argument.  Such regs may
   be clobbered by `longjmp'.  */

static bool
regno_clobbered_at_setjmp (bitmap setjmp_crosses, int regno)
{
  /* There appear to be cases where some local vars never reach the
     backend but have bogus regnos.  */
  if (regno >= max_reg_num ())
    return false;

  return ((REG_N_SETS (regno) > 1
           || REGNO_REG_SET_P (df_get_live_out (ENTRY_BLOCK_PTR), regno))
          && REGNO_REG_SET_P (setjmp_crosses, regno));
}
/* Walk the tree of blocks describing the binding levels within a
   function and warn about variables that might be killed by setjmp or
   vfork.  This is done after flow analysis and before register
   allocation, since that will clobber the pseudo-regs to hard
   regs.  */

static void
setjmp_vars_warning (bitmap setjmp_crosses, tree block)
{
  tree decl, sub;

  for (decl = BLOCK_VARS (block); decl; decl = DECL_CHAIN (decl))
    {
      if (TREE_CODE (decl) == VAR_DECL
          && DECL_RTL_SET_P (decl)
          && REG_P (DECL_RTL (decl))
          && regno_clobbered_at_setjmp (setjmp_crosses, REGNO (DECL_RTL (decl))))
        warning (OPT_Wclobbered, "variable %q+D might be clobbered by"
                 " %<longjmp%> or %<vfork%>", decl);
    }

  for (sub = BLOCK_SUBBLOCKS (block); sub; sub = BLOCK_CHAIN (sub))
    setjmp_vars_warning (setjmp_crosses, sub);
}
/* Do the appropriate part of setjmp_vars_warning
   but for arguments instead of local variables.  */

static void
setjmp_args_warning (bitmap setjmp_crosses)
{
  tree decl;

  for (decl = DECL_ARGUMENTS (current_function_decl);
       decl; decl = DECL_CHAIN (decl))
    if (DECL_RTL (decl) != 0
	&& REG_P (DECL_RTL (decl))
	&& regno_clobbered_at_setjmp (setjmp_crosses, REGNO (DECL_RTL (decl))))
      warning (OPT_Wclobbered,
	       "argument %q+D might be clobbered by %<longjmp%> or %<vfork%>",
	       decl);
}

/* Generate warning messages for variables live across setjmp.  */

void
generate_setjmp_warnings (void)
{
  bitmap setjmp_crosses = regstat_get_setjmp_crosses ();

  if (n_basic_blocks == NUM_FIXED_BLOCKS
      || bitmap_empty_p (setjmp_crosses))
    return;

  setjmp_vars_warning (setjmp_crosses, DECL_INITIAL (current_function_decl));
  setjmp_args_warning (setjmp_crosses);
}
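
/* As an illustration (not from the sources): in

     if (setjmp (env) == 0)
       {
	 local = compute ();   (LOCAL may be kept in a register)
	 g ();		       (g may call longjmp)
       }
     return local + arg;

   a non-volatile LOCAL that lives across the setjmp call and is set more
   than once can be clobbered by the longjmp, so the warnings above flag
   LOCAL (and likewise the argument ARG) unless they live in memory or are
   declared volatile.  */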
/* Reverse the order of elements in the fragment chain T of blocks,
   and return the new head of the chain (old last element).  */

static tree
block_fragments_nreverse (tree t)
{
  tree prev = 0, block, next;

  for (block = t; block; block = next)
    {
      next = BLOCK_FRAGMENT_CHAIN (block);
      BLOCK_FRAGMENT_CHAIN (block) = prev;
      prev = block;
    }

  return prev;
}

/* Reverse the order of elements in the chain T of blocks,
   and return the new head of the chain (old last element).
   Also do the same on subblocks and reverse the order of elements
   in BLOCK_FRAGMENT_CHAIN as well.  */

static tree
blocks_nreverse_all (tree t)
{
  tree prev = 0, block, next;

  for (block = t; block; block = next)
    {
      next = BLOCK_CHAIN (block);
      BLOCK_CHAIN (block) = prev;
      BLOCK_SUBBLOCKS (block) = blocks_nreverse_all (BLOCK_SUBBLOCKS (block));
      if (BLOCK_FRAGMENT_CHAIN (block)
	  && BLOCK_FRAGMENT_ORIGIN (block) == NULL_TREE)
	BLOCK_FRAGMENT_CHAIN (block)
	  = block_fragments_nreverse (BLOCK_FRAGMENT_CHAIN (block));
      prev = block;
    }

  return prev;
}
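
/* For example, a chain A -> B -> C (linked through BLOCK_CHAIN or
   BLOCK_FRAGMENT_CHAIN) is turned into C -> B -> A in place and C is
   returned as the new head; blocks_nreverse_all additionally recurses
   into each block's subblocks and fragment chain.  */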
/* Identify BLOCKs referenced by more than one NOTE_INSN_BLOCK_{BEG,END},
   and create duplicate blocks.  */
/* ??? Need an option to either create block fragments or to create
   abstract origin duplicates of a source block.  It really depends
   on what optimization has been performed.  */

void
reorder_blocks (void)
{
  tree block = DECL_INITIAL (current_function_decl);
  VEC(tree,heap) *block_stack;

  if (block == NULL_TREE)
    return;

  block_stack = VEC_alloc (tree, heap, 10);

  /* Reset the TREE_ASM_WRITTEN bit for all blocks.  */
  clear_block_marks (block);

  /* Prune the old trees away, so that they don't get in the way.  */
  BLOCK_SUBBLOCKS (block) = NULL_TREE;
  BLOCK_CHAIN (block) = NULL_TREE;

  /* Recreate the block tree from the note nesting.  */
  reorder_blocks_1 (get_insns (), block, &block_stack);
  BLOCK_SUBBLOCKS (block) = blocks_nreverse_all (BLOCK_SUBBLOCKS (block));

  VEC_free (tree, heap, block_stack);
}

/* Helper function for reorder_blocks.  Reset TREE_ASM_WRITTEN.  */

void
clear_block_marks (tree block)
{
  while (block)
    {
      TREE_ASM_WRITTEN (block) = 0;
      clear_block_marks (BLOCK_SUBBLOCKS (block));
      block = BLOCK_CHAIN (block);
    }
}
static void
reorder_blocks_1 (rtx insns, tree current_block, VEC(tree,heap) **p_block_stack)
{
  rtx insn;

  for (insn = insns; insn; insn = NEXT_INSN (insn))
    {
      if (NOTE_P (insn))
	{
	  if (NOTE_KIND (insn) == NOTE_INSN_BLOCK_BEG)
	    {
	      tree block = NOTE_BLOCK (insn);
	      tree origin;

	      gcc_assert (BLOCK_FRAGMENT_ORIGIN (block) == NULL_TREE);
	      origin = block;

	      /* If we have seen this block before, that means it now
		 spans multiple address regions.  Create a new fragment.  */
	      if (TREE_ASM_WRITTEN (block))
		{
		  tree new_block = copy_node (block);

		  BLOCK_FRAGMENT_ORIGIN (new_block) = origin;
		  BLOCK_FRAGMENT_CHAIN (new_block)
		    = BLOCK_FRAGMENT_CHAIN (origin);
		  BLOCK_FRAGMENT_CHAIN (origin) = new_block;

		  NOTE_BLOCK (insn) = new_block;
		  block = new_block;
		}

	      BLOCK_SUBBLOCKS (block) = 0;
	      TREE_ASM_WRITTEN (block) = 1;
	      /* When there's only one block for the entire function,
		 current_block == block and we mustn't do this, it
		 will cause infinite recursion.  */
	      if (block != current_block)
		{
		  if (block != origin)
		    gcc_assert (BLOCK_SUPERCONTEXT (origin) == current_block);

		  BLOCK_SUPERCONTEXT (block) = current_block;
		  BLOCK_CHAIN (block) = BLOCK_SUBBLOCKS (current_block);
		  BLOCK_SUBBLOCKS (current_block) = block;
		  current_block = origin;
		}
	      VEC_safe_push (tree, heap, *p_block_stack, block);
	    }
	  else if (NOTE_KIND (insn) == NOTE_INSN_BLOCK_END)
	    {
	      NOTE_BLOCK (insn) = VEC_pop (tree, *p_block_stack);
	      current_block = BLOCK_SUPERCONTEXT (current_block);
	    }
	}
    }
}
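
/* For instance, an insn stream containing

     NOTE_INSN_BLOCK_BEG (B1)
       NOTE_INSN_BLOCK_BEG (B2) ... NOTE_INSN_BLOCK_END (B2)
     NOTE_INSN_BLOCK_END (B1)

   re-links B2 as a subblock of B1 and B1 as a subblock of the outer block,
   while a second BLOCK_BEG note referring to an already-written block makes
   a fragment that is chained onto the original via BLOCK_FRAGMENT_CHAIN.  */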
/* Reverse the order of elements in the chain T of blocks,
   and return the new head of the chain (old last element).  */

tree
blocks_nreverse (tree t)
{
  tree prev = 0, block, next;

  for (block = t; block; block = next)
    {
      next = BLOCK_CHAIN (block);
      BLOCK_CHAIN (block) = prev;
      prev = block;
    }

  return prev;
}

/* Concatenate two chains of blocks (chained through BLOCK_CHAIN)
   by modifying the last node in chain 1 to point to chain 2.  */

tree
block_chainon (tree op1, tree op2)
{
  tree t1;

  if (!op1)
    return op2;
  if (!op2)
    return op1;

  for (t1 = op1; BLOCK_CHAIN (t1); t1 = BLOCK_CHAIN (t1))
    continue;
  BLOCK_CHAIN (t1) = op2;

#ifdef ENABLE_TREE_CHECKING
  {
    tree t2;
    for (t2 = op2; t2; t2 = BLOCK_CHAIN (t2))
      gcc_assert (t2 != t1);
  }
#endif

  return op1;
}
/* Count the subblocks of the list starting with BLOCK.  If VECTOR is
   non-NULL, list them all into VECTOR, in a depth-first preorder
   traversal of the block tree.  Also clear TREE_ASM_WRITTEN in all
   blocks.  */

static int
all_blocks (tree block, tree *vector)
{
  int n_blocks = 0;

  while (block)
    {
      TREE_ASM_WRITTEN (block) = 0;

      /* Record this block.  */
      if (vector)
	vector[n_blocks] = block;

      ++n_blocks;

      /* Record the subblocks, and their subblocks...  */
      n_blocks += all_blocks (BLOCK_SUBBLOCKS (block),
			      vector ? vector + n_blocks : 0);
      block = BLOCK_CHAIN (block);
    }

  return n_blocks;
}

/* Return a vector containing all the blocks rooted at BLOCK.  The
   number of elements in the vector is stored in N_BLOCKS_P.  The
   vector is dynamically allocated; it is the caller's responsibility
   to call `free' on the pointer returned.  */

static tree *
get_block_vector (tree block, int *n_blocks_p)
{
  tree *block_vector;

  *n_blocks_p = all_blocks (block, NULL);
  block_vector = XNEWVEC (tree, *n_blocks_p);
  all_blocks (block, block_vector);

  return block_vector;
}
static GTY(()) int next_block_index = 2;

/* Set BLOCK_NUMBER for all the blocks in FN.  */

void
number_blocks (tree fn)
{
  int i;
  int n_blocks;
  tree *block_vector;

  /* For SDB and XCOFF debugging output, we start numbering the blocks
     from 1 within each function, rather than keeping a running
     count.  */
#if defined (SDB_DEBUGGING_INFO) || defined (XCOFF_DEBUGGING_INFO)
  if (write_symbols == SDB_DEBUG || write_symbols == XCOFF_DEBUG)
    next_block_index = 1;
#endif

  block_vector = get_block_vector (DECL_INITIAL (fn), &n_blocks);

  /* The top-level BLOCK isn't numbered at all.  */
  for (i = 1; i < n_blocks; ++i)
    /* We number the blocks from two.  */
    BLOCK_NUMBER (block_vector[i]) = next_block_index++;

  free (block_vector);
}
/* If VAR is present in a subblock of BLOCK, return the subblock.  */

tree
debug_find_var_in_block_tree (tree var, tree block)
{
  tree t;

  for (t = BLOCK_VARS (block); t; t = TREE_CHAIN (t))
    if (t == var)
      return block;

  for (t = BLOCK_SUBBLOCKS (block); t; t = TREE_CHAIN (t))
    {
      tree ret = debug_find_var_in_block_tree (var, t);
      if (ret)
	return ret;
    }

  return NULL_TREE;
}
/* Keep track of whether we're in a dummy function context.  If we are,
   we don't want to invoke the set_current_function hook, because we'll
   get into trouble if the hook calls target_reinit () recursively or
   when the initial initialization is not yet complete.  */

static bool in_dummy_function;

/* Invoke the target hook when setting cfun.  Update the optimization options
   if the function uses different options than the default.  */

static void
invoke_set_current_function_hook (tree fndecl)
{
  if (!in_dummy_function)
    {
      tree opts = ((fndecl)
		   ? DECL_FUNCTION_SPECIFIC_OPTIMIZATION (fndecl)
		   : optimization_default_node);

      if (!opts)
	opts = optimization_default_node;

      /* Change optimization options if needed.  */
      if (optimization_current_node != opts)
	{
	  optimization_current_node = opts;
	  cl_optimization_restore (&global_options, TREE_OPTIMIZATION (opts));
	}

      targetm.set_current_function (fndecl);
    }
}
/* cfun should never be set directly; use this function.  */

void
set_cfun (struct function *new_cfun)
{
  if (cfun != new_cfun)
    {
      cfun = new_cfun;
      invoke_set_current_function_hook (new_cfun ? new_cfun->decl : NULL_TREE);
    }
}

/* Initialized with NOGC, making this poisonous to the garbage collector.  */

static VEC(function_p,heap) *cfun_stack;

/* Push the current cfun onto the stack, and set cfun to new_cfun.  */

void
push_cfun (struct function *new_cfun)
{
  VEC_safe_push (function_p, heap, cfun_stack, cfun);
  set_cfun (new_cfun);
}

/* Pop cfun from the stack.  */

void
pop_cfun (void)
{
  struct function *new_cfun = VEC_pop (function_p, cfun_stack);
  set_cfun (new_cfun);
}
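
/* Typical usage is a balanced pair around work on some other function's
   body, roughly:

     push_cfun (DECL_STRUCT_FUNCTION (other_fndecl));
     ... emit or inspect RTL for OTHER_FNDECL ...
     pop_cfun ();

   so that cfun and the target's per-function state are restored.  */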
/* Return value of funcdef and increase it.  */
int
get_next_funcdef_no (void)
{
  return funcdef_no++;
}

/* Return value of funcdef.  */
int
get_last_funcdef_no (void)
{
  return funcdef_no;
}
/* Allocate a function structure for FNDECL and set its contents
   to the defaults.  Set cfun to the newly-allocated object.
   Some of the helper functions invoked during initialization assume
   that cfun has already been set.  Therefore, assign the new object
   directly into cfun and invoke the back end hook explicitly at the
   very end, rather than initializing a temporary and calling set_cfun
   on it.

   ABSTRACT_P is true if this is a function that will never be seen by
   the middle-end.  Such functions are front-end concepts (like C++
   function templates) that do not correspond directly to functions
   placed in object files.  */

void
allocate_struct_function (tree fndecl, bool abstract_p)
{
  tree result;
  tree fntype = fndecl ? TREE_TYPE (fndecl) : NULL_TREE;

  cfun = ggc_alloc_cleared_function ();

  init_eh_for_function ();

  if (init_machine_status)
    cfun->machine = (*init_machine_status) ();

#ifdef OVERRIDE_ABI_FORMAT
  OVERRIDE_ABI_FORMAT (fndecl);
#endif

  invoke_set_current_function_hook (fndecl);

  if (fndecl != NULL_TREE)
    {
      DECL_STRUCT_FUNCTION (fndecl) = cfun;
      cfun->decl = fndecl;
      current_function_funcdef_no = get_next_funcdef_no ();

      result = DECL_RESULT (fndecl);
      if (!abstract_p && aggregate_value_p (result, fndecl))
	{
#ifdef PCC_STATIC_STRUCT_RETURN
	  cfun->returns_pcc_struct = 1;
#endif
	  cfun->returns_struct = 1;
	}

      cfun->stdarg = stdarg_p (fntype);

      /* Assume all registers in stdarg functions need to be saved.  */
      cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
      cfun->va_list_fpr_size = VA_LIST_MAX_FPR_SIZE;

      /* ??? This could be set on a per-function basis by the front-end
	 but is this worth the hassle?  */
      cfun->can_throw_non_call_exceptions = flag_non_call_exceptions;
    }
}
/* This is like allocate_struct_function, but pushes a new cfun for FNDECL
   instead of just setting it.  */

void
push_struct_function (tree fndecl)
{
  VEC_safe_push (function_p, heap, cfun_stack, cfun);
  allocate_struct_function (fndecl, false);
}

/* Reset crtl and other non-struct-function variables to defaults as
   appropriate for emitting rtl at the start of a function.  */

static void
prepare_function_start (void)
{
  gcc_assert (!crtl->emit.x_last_insn);
  init_varasm_status ();
  default_rtl_profile ();

  if (flag_stack_usage)
    {
      cfun->su = ggc_alloc_cleared_stack_usage ();
      cfun->su->static_stack_size = -1;
    }

  cse_not_expected = ! optimize;

  /* Caller save not needed yet.  */
  caller_save_needed = 0;

  /* We haven't done register allocation yet.  */
  reg_renumber = 0;

  /* Indicate that we have not instantiated virtual registers yet.  */
  virtuals_instantiated = 0;

  /* Indicate that we want CONCATs now.  */
  generating_concat_p = 1;

  /* Indicate we have no need of a frame pointer yet.  */
  frame_pointer_needed = 0;
}

/* Initialize the rtl expansion mechanism so that we can do simple things
   like generate sequences.  This is used to provide a context during global
   initialization of some passes.  You must call expand_dummy_function_end
   to exit this context.  */

void
init_dummy_function_start (void)
{
  gcc_assert (!in_dummy_function);
  in_dummy_function = true;
  push_struct_function (NULL_TREE);
  prepare_function_start ();
}
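
/* A caller that only needs a scratch RTL context can therefore do, roughly:

     init_dummy_function_start ();
     ... gen_* / emit_* calls that require cfun and the emit area ...
     expand_dummy_function_end ();

   without ever giving the dummy function a FUNCTION_DECL.  */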
/* Generate RTL for the start of the function SUBR (a FUNCTION_DECL tree node)
   and initialize static variables for generating RTL for the statements
   of the function.  */

void
init_function_start (tree subr)
{
  if (subr && DECL_STRUCT_FUNCTION (subr))
    set_cfun (DECL_STRUCT_FUNCTION (subr));
  else
    allocate_struct_function (subr, false);
  prepare_function_start ();

  /* Warn if this value is an aggregate type,
     regardless of which calling convention we are using for it.  */
  if (AGGREGATE_TYPE_P (TREE_TYPE (DECL_RESULT (subr))))
    warning (OPT_Waggregate_return, "function returns an aggregate");
}

/* Make sure all values used by the optimization passes have sane defaults.  */
unsigned int
init_function_for_compilation (void)
{
  reg_renumber = 0;
  return 0;
}

struct rtl_opt_pass pass_init_function =
{
 {
  RTL_PASS,
  "*init_function",                     /* name */
  NULL,                                 /* gate */
  init_function_for_compilation,        /* execute */
  NULL,                                 /* sub */
  NULL,                                 /* next */
  0,                                    /* static_pass_number */
  TV_NONE,                              /* tv_id */
  0,                                    /* properties_required */
  0,                                    /* properties_provided */
  0,                                    /* properties_destroyed */
  0,                                    /* todo_flags_start */
  0                                     /* todo_flags_finish */
 }
};
void
expand_main_function (void)
{
#if (defined(INVOKE__main)				\
     || (!defined(HAS_INIT_SECTION)			\
	 && !defined(INIT_SECTION_ASM_OP)		\
	 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
  emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
#endif
}

/* Expand code to initialize the stack_protect_guard.  This is invoked at
   the beginning of a function to be protected.  */

#ifndef HAVE_stack_protect_set
# define HAVE_stack_protect_set		0
# define gen_stack_protect_set(x,y)	(gcc_unreachable (), NULL_RTX)
#endif

void
stack_protect_prologue (void)
{
  tree guard_decl = targetm.stack_protect_guard ();
  rtx x, y;

  x = expand_normal (crtl->stack_protect_guard);
  y = expand_normal (guard_decl);

  /* Allow the target to copy from Y to X without leaking Y into a
     register.  */
  if (HAVE_stack_protect_set)
    {
      rtx insn = gen_stack_protect_set (x, y);
      if (insn)
	{
	  emit_insn (insn);
	  return;
	}
    }

  /* Otherwise do a straight move.  */
  emit_move_insn (x, y);
}
/* Expand code to verify the stack_protect_guard.  This is invoked at
   the end of a function to be protected.  */

#ifndef HAVE_stack_protect_test
# define HAVE_stack_protect_test		0
# define gen_stack_protect_test(x, y, z)	(gcc_unreachable (), NULL_RTX)
#endif

void
stack_protect_epilogue (void)
{
  tree guard_decl = targetm.stack_protect_guard ();
  rtx label = gen_label_rtx ();
  rtx x, y, tmp;

  x = expand_normal (crtl->stack_protect_guard);
  y = expand_normal (guard_decl);

  /* Allow the target to compare Y with X without leaking either into
     a register.  */
  switch (HAVE_stack_protect_test != 0)
    {
    case 1:
      tmp = gen_stack_protect_test (x, y, label);
      if (tmp)
	{
	  emit_insn (tmp);
	  break;
	}
      /* FALLTHRU */

    default:
      emit_cmp_and_jump_insns (x, y, EQ, NULL_RTX, ptr_mode, 1, label);
      break;
    }

  /* The noreturn predictor has been moved to the tree level.  The rtl-level
     predictors estimate this branch about 20%, which isn't enough to get
     things moved out of line.  Since this is the only extant case of adding
     a noreturn function at the rtl level, it doesn't seem worth doing anything
     except adding the prediction by hand.  */
  tmp = get_last_insn ();
  if (tmp)
    predict_insn_def (tmp, PRED_NORETURN, TAKEN);

  expand_expr_stmt (targetm.stack_protect_fail ());
  emit_label (label);
}
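
/* The emitted check is roughly equivalent to

     if (guard_on_stack == guard_value)
       goto label;
     <expand whatever targetm.stack_protect_fail provides>;
   label:

   with the comparison done either by the stack_protect_test pattern or by
   an ordinary compare-and-branch.  */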
/* Start the RTL for a new function, and set variables used for
   emitting RTL.
   SUBR is the FUNCTION_DECL node.
   PARMS_HAVE_CLEANUPS is nonzero if there are cleanups associated with
   the function's parameters, which must be run at any return statement.  */

void
expand_function_start (tree subr)
{
  /* Make sure volatile mem refs aren't considered
     valid operands of arithmetic insns.  */
  init_recog_no_volatile ();

  crtl->profile
    = (profile_flag
       && ! DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (subr));

  crtl->limit_stack
    = (stack_limit_rtx != NULL_RTX && ! DECL_NO_LIMIT_STACK (subr));

  /* Make the label for return statements to jump to.  Do not special
     case machines with special return instructions -- they will be
     handled later during jump, ifcvt, or epilogue creation.  */
  return_label = gen_label_rtx ();

  /* Initialize rtx used to return the value.  */
  /* Do this before assign_parms so that we copy the struct value address
     before any library calls that assign parms might generate.  */

  /* Decide whether to return the value in memory or in a register.  */
  if (aggregate_value_p (DECL_RESULT (subr), subr))
    {
      /* Returning something that won't go in a register.  */
      rtx value_address = 0;

#ifdef PCC_STATIC_STRUCT_RETURN
      if (cfun->returns_pcc_struct)
	{
	  int size = int_size_in_bytes (TREE_TYPE (DECL_RESULT (subr)));
	  value_address = assemble_static_space (size);
	}
      else
#endif
	{
	  rtx sv = targetm.calls.struct_value_rtx (TREE_TYPE (subr), 2);
	  /* Expect to be passed the address of a place to store the value.
	     If it is passed as an argument, assign_parms will take care of
	     it.  */
	  if (sv)
	    {
	      value_address = gen_reg_rtx (Pmode);
	      emit_move_insn (value_address, sv);
	    }
	}
      if (value_address)
	{
	  rtx x = value_address;
	  if (!DECL_BY_REFERENCE (DECL_RESULT (subr)))
	    {
	      x = gen_rtx_MEM (DECL_MODE (DECL_RESULT (subr)), x);
	      set_mem_attributes (x, DECL_RESULT (subr), 1);
	    }
	  SET_DECL_RTL (DECL_RESULT (subr), x);
	}
    }
  else if (DECL_MODE (DECL_RESULT (subr)) == VOIDmode)
    /* If return mode is void, this decl rtl should not be used.  */
    SET_DECL_RTL (DECL_RESULT (subr), NULL_RTX);
  else
    {
      /* Compute the return values into a pseudo reg, which we will copy
	 into the true return register after the cleanups are done.  */
      tree return_type = TREE_TYPE (DECL_RESULT (subr));
      if (TYPE_MODE (return_type) != BLKmode
	  && targetm.calls.return_in_msb (return_type))
	/* expand_function_end will insert the appropriate padding in
	   this case.  Use the return value's natural (unpadded) mode
	   within the function proper.  */
	SET_DECL_RTL (DECL_RESULT (subr),
		      gen_reg_rtx (TYPE_MODE (return_type)));
      else
	{
	  /* In order to figure out what mode to use for the pseudo, we
	     figure out what the mode of the eventual return register will
	     actually be, and use that.  */
	  rtx hard_reg = hard_function_value (return_type, subr, 0, 1);

	  /* Structures that are returned in registers are not
	     aggregate_value_p, so we may see a PARALLEL or a REG.  */
	  if (REG_P (hard_reg))
	    SET_DECL_RTL (DECL_RESULT (subr),
			  gen_reg_rtx (GET_MODE (hard_reg)));
	  else
	    {
	      gcc_assert (GET_CODE (hard_reg) == PARALLEL);
	      SET_DECL_RTL (DECL_RESULT (subr), gen_group_rtx (hard_reg));
	    }
	}

      /* Set DECL_REGISTER flag so that expand_function_end will copy the
	 result to the real return register(s).  */
      DECL_REGISTER (DECL_RESULT (subr)) = 1;
    }

  /* Initialize rtx for parameters and local variables.
     In some cases this requires emitting insns.  */
  assign_parms (subr);

  /* If function gets a static chain arg, store it.  */
  if (cfun->static_chain_decl)
    {
      tree parm = cfun->static_chain_decl;
      rtx local, chain, insn;

      local = gen_reg_rtx (Pmode);
      chain = targetm.calls.static_chain (current_function_decl, true);

      set_decl_incoming_rtl (parm, chain, false);
      SET_DECL_RTL (parm, local);
      mark_reg_pointer (local, TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm))));

      insn = emit_move_insn (local, chain);

      /* Mark the register as eliminable, similar to parameters.  */
      if (MEM_P (chain)
	  && reg_mentioned_p (arg_pointer_rtx, XEXP (chain, 0)))
	set_unique_reg_note (insn, REG_EQUIV, chain);
    }

  /* If the function receives a non-local goto, then store the
     bits we need to restore the frame pointer.  */
  if (cfun->nonlocal_goto_save_area)
    {
      tree t_save;
      rtx r_save;

      /* ??? We need to do this save early.  Unfortunately here is
	 before the frame variable gets declared.  Help out...  */
      tree var = TREE_OPERAND (cfun->nonlocal_goto_save_area, 0);
      if (!DECL_RTL_SET_P (var))
	expand_decl (var);

      t_save = build4 (ARRAY_REF, ptr_type_node,
		       cfun->nonlocal_goto_save_area,
		       integer_zero_node, NULL_TREE, NULL_TREE);
      r_save = expand_expr (t_save, NULL_RTX, VOIDmode, EXPAND_WRITE);
      r_save = convert_memory_address (Pmode, r_save);

      emit_move_insn (r_save, targetm.builtin_setjmp_frame_value ());
      update_nonlocal_goto_save_area ();
    }

  /* The following was moved from init_function_start.
     The move is supposed to make sdb output more accurate.  */
  /* Indicate the beginning of the function body,
     as opposed to parm setup.  */
  emit_note (NOTE_INSN_FUNCTION_BEG);

  gcc_assert (NOTE_P (get_last_insn ()));

  parm_birth_insn = get_last_insn ();

  if (crtl->profile)
    {
#ifdef PROFILE_HOOK
      PROFILE_HOOK (current_function_funcdef_no);
#endif
    }

  /* After the display initializations is where the stack checking
     probe should go.  */
  if (flag_stack_check)
    stack_check_probe_note = emit_note (NOTE_INSN_DELETED);

  /* Make sure there is a line number after the function entry setup code.  */
  force_next_line_note ();
}
/* Undo the effects of init_dummy_function_start.  */
void
expand_dummy_function_end (void)
{
  gcc_assert (in_dummy_function);

  /* End any sequences that failed to be closed due to syntax errors.  */
  while (in_sequence_p ())
    end_sequence ();

  /* Outside function body, can't compute type's actual size
     until next function's body starts.  */

  free_after_parsing (cfun);
  free_after_compilation (cfun);
  pop_cfun ();
  in_dummy_function = false;
}
/* Call DOIT for each hard register used as a return value from
   the current function.  */

void
diddle_return_value (void (*doit) (rtx, void *), void *arg)
{
  rtx outgoing = crtl->return_rtx;

  if (! outgoing)
    return;

  if (REG_P (outgoing))
    (*doit) (outgoing, arg);
  else if (GET_CODE (outgoing) == PARALLEL)
    {
      int i;

      for (i = 0; i < XVECLEN (outgoing, 0); i++)
	{
	  rtx x = XEXP (XVECEXP (outgoing, 0, i), 0);

	  if (REG_P (x) && REGNO (x) < FIRST_PSEUDO_REGISTER)
	    (*doit) (x, arg);
	}
    }
}

static void
do_clobber_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
{
  emit_clobber (reg);
}

void
clobber_return_register (void)
{
  diddle_return_value (do_clobber_return_reg, NULL);

  /* In case we do use pseudo to return value, clobber it too.  */
  if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
    {
      tree decl_result = DECL_RESULT (current_function_decl);
      rtx decl_rtl = DECL_RTL (decl_result);
      if (REG_P (decl_rtl) && REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER)
	do_clobber_return_reg (decl_rtl, NULL);
    }
}

static void
do_use_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
{
  emit_use (reg);
}

static void
use_return_register (void)
{
  diddle_return_value (do_use_return_reg, NULL);
}
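
/* For a value returned in more than one register, the target hands back a
   PARALLEL, e.g. something of the shape

     (parallel [(expr_list (reg:DI 0) (const_int 0))
		(expr_list (reg:DI 1) (const_int 8))])

   and diddle_return_value applies DOIT to each hard register it finds
   there.  */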
/* Possibly warn about unused parameters.  */
void
do_warn_unused_parameter (tree fn)
{
  tree decl;

  for (decl = DECL_ARGUMENTS (fn);
       decl; decl = DECL_CHAIN (decl))
    if (!TREE_USED (decl) && TREE_CODE (decl) == PARM_DECL
	&& DECL_NAME (decl) && !DECL_ARTIFICIAL (decl)
	&& !TREE_NO_WARNING (decl))
      warning (OPT_Wunused_parameter, "unused parameter %q+D", decl);
}

static GTY(()) rtx initial_trampoline;
/* Generate RTL for the end of the current function.  */

void
expand_function_end (void)
{
  rtx clobber_after;

  /* If arg_pointer_save_area was referenced only from a nested
     function, we will not have initialized it yet.  Do that now.  */
  if (arg_pointer_save_area && ! crtl->arg_pointer_save_area_init)
    get_arg_pointer_save_area ();

  /* If we are doing generic stack checking and this function makes calls,
     do a stack probe at the start of the function to ensure we have enough
     space for another stack frame.  */
  if (flag_stack_check == GENERIC_STACK_CHECK)
    {
      rtx insn, seq;

      for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
	if (CALL_P (insn))
	  {
	    rtx max_frame_size = GEN_INT (STACK_CHECK_MAX_FRAME_SIZE);
	    start_sequence ();
	    if (STACK_CHECK_MOVING_SP)
	      anti_adjust_stack_and_probe (max_frame_size, true);
	    else
	      probe_stack_range (STACK_OLD_CHECK_PROTECT, max_frame_size);
	    seq = get_insns ();
	    end_sequence ();
	    set_insn_locators (seq, prologue_locator);
	    emit_insn_before (seq, stack_check_probe_note);
	    break;
	  }
    }

  /* End any sequences that failed to be closed due to syntax errors.  */
  while (in_sequence_p ())
    end_sequence ();

  clear_pending_stack_adjust ();
  do_pending_stack_adjust ();

  /* Output a linenumber for the end of the function.
     SDB depends on this.  */
  force_next_line_note ();
  set_curr_insn_source_location (input_location);

  /* Before the return label (if any), clobber the return
     registers so that they are not propagated live to the rest of
     the function.  This can only happen with functions that drop
     through; if there had been a return statement, there would
     have either been a return rtx, or a jump to the return label.

     We delay actual code generation after the current_function_value_rtx
     is computed.  */
  clobber_after = get_last_insn ();

  /* Output the label for the actual return from the function.  */
  emit_label (return_label);

  if (targetm.except_unwind_info (&global_options) == UI_SJLJ)
    {
      /* Let except.c know where it should emit the call to unregister
	 the function context for sjlj exceptions.  */
      if (flag_exceptions)
	sjlj_emit_function_exit_after (get_last_insn ());
    }
  else
    {
      /* We want to ensure that instructions that may trap are not
	 moved into the epilogue by scheduling, because we don't
	 always emit unwind information for the epilogue.  */
      if (cfun->can_throw_non_call_exceptions)
	emit_insn (gen_blockage ());
    }

  /* If this is an implementation of throw, do what's necessary to
     communicate between __builtin_eh_return and the epilogue.  */
  expand_eh_return ();

  /* If scalar return value was computed in a pseudo-reg, or was a named
     return value that got dumped to the stack, copy that to the hard
     return register.  */
  if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
    {
      tree decl_result = DECL_RESULT (current_function_decl);
      rtx decl_rtl = DECL_RTL (decl_result);

      if (REG_P (decl_rtl)
	  ? REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER
	  : DECL_REGISTER (decl_result))
	{
	  rtx real_decl_rtl = crtl->return_rtx;

	  /* This should be set in assign_parms.  */
	  gcc_assert (REG_FUNCTION_VALUE_P (real_decl_rtl));

	  /* If this is a BLKmode structure being returned in registers,
	     then use the mode computed in expand_return.  Note that if
	     decl_rtl is memory, then its mode may have been changed,
	     but that crtl->return_rtx has not.  */
	  if (GET_MODE (real_decl_rtl) == BLKmode)
	    PUT_MODE (real_decl_rtl, GET_MODE (decl_rtl));

	  /* If a non-BLKmode return value should be padded at the least
	     significant end of the register, shift it left by the appropriate
	     amount.  BLKmode results are handled using the group load/store
	     machinery.  */
	  if (TYPE_MODE (TREE_TYPE (decl_result)) != BLKmode
	      && targetm.calls.return_in_msb (TREE_TYPE (decl_result)))
	    {
	      emit_move_insn (gen_rtx_REG (GET_MODE (decl_rtl),
					   REGNO (real_decl_rtl)),
			      decl_rtl);
	      shift_return_value (GET_MODE (decl_rtl), true, real_decl_rtl);
	    }
	  /* If a named return value dumped decl_return to memory, then
	     we may need to re-do the PROMOTE_MODE signed/unsigned
	     extension.  */
	  else if (GET_MODE (real_decl_rtl) != GET_MODE (decl_rtl))
	    {
	      int unsignedp = TYPE_UNSIGNED (TREE_TYPE (decl_result));
	      promote_function_mode (TREE_TYPE (decl_result),
				     GET_MODE (decl_rtl), &unsignedp,
				     TREE_TYPE (current_function_decl), 1);

	      convert_move (real_decl_rtl, decl_rtl, unsignedp);
	    }
	  else if (GET_CODE (real_decl_rtl) == PARALLEL)
	    {
	      /* If expand_function_start has created a PARALLEL for decl_rtl,
		 move the result to the real return registers.  Otherwise, do
		 a group load from decl_rtl for a named return.  */
	      if (GET_CODE (decl_rtl) == PARALLEL)
		emit_group_move (real_decl_rtl, decl_rtl);
	      else
		emit_group_load (real_decl_rtl, decl_rtl,
				 TREE_TYPE (decl_result),
				 int_size_in_bytes (TREE_TYPE (decl_result)));
	    }
	  /* In the case of complex integer modes smaller than a word, we'll
	     need to generate some non-trivial bitfield insertions.  Do that
	     on a pseudo and not the hard register.  */
	  else if (GET_CODE (decl_rtl) == CONCAT
		   && GET_MODE_CLASS (GET_MODE (decl_rtl)) == MODE_COMPLEX_INT
		   && GET_MODE_BITSIZE (GET_MODE (decl_rtl)) <= BITS_PER_WORD)
	    {
	      int old_generating_concat_p;
	      rtx tmp;

	      old_generating_concat_p = generating_concat_p;
	      generating_concat_p = 0;
	      tmp = gen_reg_rtx (GET_MODE (decl_rtl));
	      generating_concat_p = old_generating_concat_p;

	      emit_move_insn (tmp, decl_rtl);
	      emit_move_insn (real_decl_rtl, tmp);
	    }
	  else
	    emit_move_insn (real_decl_rtl, decl_rtl);
	}
    }

  /* If returning a structure, arrange to return the address of the value
     in a place where debuggers expect to find it.

     If returning a structure PCC style,
     the caller also depends on this value.
     And cfun->returns_pcc_struct is not necessarily set.  */
  if (cfun->returns_struct
      || cfun->returns_pcc_struct)
    {
      rtx value_address = DECL_RTL (DECL_RESULT (current_function_decl));
      tree type = TREE_TYPE (DECL_RESULT (current_function_decl));
      rtx outgoing;

      if (DECL_BY_REFERENCE (DECL_RESULT (current_function_decl)))
	type = TREE_TYPE (type);
      else
	value_address = XEXP (value_address, 0);

      outgoing = targetm.calls.function_value (build_pointer_type (type),
					       current_function_decl, true);

      /* Mark this as a function return value so integrate will delete the
	 assignment and USE below when inlining this function.  */
      REG_FUNCTION_VALUE_P (outgoing) = 1;

      /* The address may be ptr_mode and OUTGOING may be Pmode.  */
      value_address = convert_memory_address (GET_MODE (outgoing),
					      value_address);

      emit_move_insn (outgoing, value_address);

      /* Show return register used to hold result (in this case the address
	 of the result).  */
      crtl->return_rtx = outgoing;
    }

  /* Emit the actual code to clobber return register.  */
  {
    rtx seq;

    start_sequence ();
    clobber_return_register ();
    seq = get_insns ();
    end_sequence ();

    emit_insn_after (seq, clobber_after);
  }

  /* Output the label for the naked return from the function.  */
  if (naked_return_label)
    emit_label (naked_return_label);

  /* @@@ This is a kludge.  We want to ensure that instructions that
     may trap are not moved into the epilogue by scheduling, because
     we don't always emit unwind information for the epilogue.  */
  if (cfun->can_throw_non_call_exceptions
      && targetm.except_unwind_info (&global_options) != UI_SJLJ)
    emit_insn (gen_blockage ());

  /* If stack protection is enabled for this function, check the guard.  */
  if (crtl->stack_protect_guard)
    stack_protect_epilogue ();

  /* If we had calls to alloca, and this machine needs
     an accurate stack pointer to exit the function,
     insert some code to save and restore the stack pointer.  */
  if (! EXIT_IGNORE_STACK
      && cfun->calls_alloca)
    {
      rtx tem = 0, seq;

      start_sequence ();
      emit_stack_save (SAVE_FUNCTION, &tem);
      seq = get_insns ();
      end_sequence ();
      emit_insn_before (seq, parm_birth_insn);

      emit_stack_restore (SAVE_FUNCTION, tem);
    }

  /* ??? This should no longer be necessary since stupid is no longer with
     us, but there are some parts of the compiler (eg reload_combine, and
     sh mach_dep_reorg) that still try and compute their own lifetime info
     instead of using the general framework.  */
  use_return_register ();
}
rtx
get_arg_pointer_save_area (void)
{
  rtx ret = arg_pointer_save_area;

  if (! ret)
    {
      ret = assign_stack_local (Pmode, GET_MODE_SIZE (Pmode), 0);
      arg_pointer_save_area = ret;
    }

  if (! crtl->arg_pointer_save_area_init)
    {
      rtx seq;

      /* Save the arg pointer at the beginning of the function.  The
	 generated stack slot may not be a valid memory address, so we
	 have to check it and fix it if necessary.  */
      start_sequence ();
      emit_move_insn (validize_mem (ret),
		      crtl->args.internal_arg_pointer);
      seq = get_insns ();
      end_sequence ();

      push_topmost_sequence ();
      emit_insn_after (seq, entry_of_function ());
      pop_topmost_sequence ();

      crtl->arg_pointer_save_area_init = true;
    }

  return ret;
}
/* Add a list of INSNS to the hash HASHP, possibly allocating HASHP
   for the first time.  */

static void
record_insns (rtx insns, rtx end, htab_t *hashp)
{
  rtx tmp;
  htab_t hash = *hashp;

  if (hash == NULL)
    *hashp = hash
      = htab_create_ggc (17, htab_hash_pointer, htab_eq_pointer, NULL);

  for (tmp = insns; tmp != end; tmp = NEXT_INSN (tmp))
    {
      void **slot = htab_find_slot (hash, tmp, INSERT);
      gcc_assert (*slot == NULL);
      *slot = tmp;
    }
}

/* INSN has been duplicated or replaced by COPY, perhaps by duplicating a
   basic block, splitting or peepholes.  If INSN is a prologue or epilogue
   insn, then record COPY as well.  */

void
maybe_copy_prologue_epilogue_insn (rtx insn, rtx copy)
{
  htab_t hash;
  void **slot;

  hash = epilogue_insn_hash;
  if (!hash || !htab_find (hash, insn))
    {
      hash = prologue_insn_hash;
      if (!hash || !htab_find (hash, insn))
	return;
    }

  slot = htab_find_slot (hash, copy, INSERT);
  gcc_assert (*slot == NULL);
  *slot = copy;
}
/* Set the locator of the insn chain starting at INSN to LOC.  */
static void
set_insn_locators (rtx insn, int loc)
{
  while (insn != NULL_RTX)
    {
      INSN_LOCATOR (insn) = loc;
      insn = NEXT_INSN (insn);
    }
}

/* Determine if any INSNs in HASH are, or are part of, INSN.  Because
   we can be running after reorg, SEQUENCE rtl is possible.  */

static bool
contains (const_rtx insn, htab_t hash)
{
  if (hash == NULL)
    return false;

  if (NONJUMP_INSN_P (insn) && GET_CODE (PATTERN (insn)) == SEQUENCE)
    {
      int i;
      for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
	if (htab_find (hash, XVECEXP (PATTERN (insn), 0, i)))
	  return true;
      return false;
    }

  return htab_find (hash, insn) != NULL;
}

int
prologue_epilogue_contains (const_rtx insn)
{
  if (contains (insn, prologue_insn_hash))
    return 1;
  if (contains (insn, epilogue_insn_hash))
    return 1;
  return 0;
}
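
/* After delay-slot filling a prologue or epilogue insn may sit inside a
   SEQUENCE, so contains () checks each element of the SEQUENCE as well as
   the insn itself; prologue_epilogue_contains is the wrapper other passes
   can use to ask whether an insn belongs to either of them.  */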
#ifdef HAVE_return

/* Insert use of return register before the end of BB.  */

static void
emit_use_return_register_into_block (basic_block bb)
{
  rtx seq;

  start_sequence ();
  use_return_register ();
  seq = get_insns ();
  end_sequence ();
  emit_insn_before (seq, BB_END (bb));
}

/* Insert gen_return at the end of block BB.  This also means updating
   block_for_insn appropriately.  */

static void
emit_return_into_block (basic_block bb)
{
  emit_jump_insn_after (gen_return (), BB_END (bb));
}
#endif /* HAVE_return */
/* Generate the prologue and epilogue RTL if the machine supports it.  Thread
   this into place with notes indicating where the prologue ends and where
   the epilogue begins.  Update the basic block information when possible.  */

static void
thread_prologue_and_epilogue_insns (void)
{
  bool inserted;
  rtx seq ATTRIBUTE_UNUSED, epilogue_end ATTRIBUTE_UNUSED;
  edge entry_edge, e;
  edge_iterator ei;

  rtl_profile_for_bb (ENTRY_BLOCK_PTR);

  inserted = false;
  epilogue_end = NULL_RTX;

  /* Can't deal with multiple successors of the entry block at the
     moment.  Function should always have at least one entry
     point.  */
  gcc_assert (single_succ_p (ENTRY_BLOCK_PTR));
  entry_edge = single_succ_edge (ENTRY_BLOCK_PTR);

  if (flag_split_stack
      && (lookup_attribute ("no_split_stack", DECL_ATTRIBUTES (cfun->decl))
	  == NULL))
    {
#ifndef HAVE_split_stack_prologue
      gcc_unreachable ();
#else
      gcc_assert (HAVE_split_stack_prologue);

      start_sequence ();
      emit_insn (gen_split_stack_prologue ());
      seq = get_insns ();
      end_sequence ();

      record_insns (seq, NULL, &prologue_insn_hash);
      set_insn_locators (seq, prologue_locator);

      insert_insn_on_edge (seq, entry_edge);
      inserted = true;
#endif
    }

#ifdef HAVE_prologue
  if (HAVE_prologue)
    {
      start_sequence ();
      seq = gen_prologue ();
      emit_insn (seq);

      /* Insert an explicit USE for the frame pointer
	 if the profiling is on and the frame pointer is required.  */
      if (crtl->profile && frame_pointer_needed)
	emit_use (hard_frame_pointer_rtx);

      /* Retain a map of the prologue insns.  */
      record_insns (seq, NULL, &prologue_insn_hash);
      emit_note (NOTE_INSN_PROLOGUE_END);

      /* Ensure that instructions are not moved into the prologue when
	 profiling is on.  The call to the profiling routine can be
	 emitted within the live range of a call-clobbered register.  */
      if (!targetm.profile_before_prologue () && crtl->profile)
	emit_insn (gen_blockage ());

      seq = get_insns ();
      end_sequence ();
      set_insn_locators (seq, prologue_locator);

      insert_insn_on_edge (seq, entry_edge);
      inserted = true;
    }
#endif

  /* If the exit block has no non-fake predecessors, we don't need
     an epilogue.  */
  FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
    if ((e->flags & EDGE_FAKE) == 0)
      break;
  if (e == NULL)
    goto epilogue_done;

  rtl_profile_for_bb (EXIT_BLOCK_PTR);
#ifdef HAVE_return
  if (optimize && HAVE_return)
    {
      /* If we're allowed to generate a simple return instruction,
	 then by definition we don't need a full epilogue.  Examine
	 the block that falls through to EXIT.   If it does not
	 contain any code, examine its predecessors and try to
	 emit (conditional) return instructions.  */

      basic_block last;
      rtx label;

      e = find_fallthru_edge (EXIT_BLOCK_PTR->preds);
      if (e == NULL)
	goto epilogue_done;
      last = e->src;

      /* Verify that there are no active instructions in the last block.  */
      label = BB_END (last);
      while (label && !LABEL_P (label))
	{
	  if (active_insn_p (label))
	    break;
	  label = PREV_INSN (label);
	}

      if (BB_HEAD (last) == label && LABEL_P (label))
	{
	  edge_iterator ei2;

	  for (ei2 = ei_start (last->preds); (e = ei_safe_edge (ei2)); )
	    {
	      basic_block bb = e->src;
	      rtx jump;

	      if (bb == ENTRY_BLOCK_PTR)
		{
		  ei_next (&ei2);
		  continue;
		}

	      jump = BB_END (bb);
	      if (!JUMP_P (jump) || JUMP_LABEL (jump) != label)
		{
		  ei_next (&ei2);
		  continue;
		}

	      /* If we have an unconditional jump, we can replace that
		 with a simple return instruction.  */
	      if (simplejump_p (jump))
		{
		  /* The use of the return register might be present in the exit
		     fallthru block.  Either:
		     - removing the use is safe, and we should remove the use in
		       the exit fallthru block, or
		     - removing the use is not safe, and we should add it here.
		     For now, we conservatively choose the latter.  Either of the
		     2 helps in crossjumping.  */
		  emit_use_return_register_into_block (bb);

		  emit_return_into_block (bb);
		  delete_insn (jump);
		}

	      /* If we have a conditional jump, we can try to replace
		 that with a conditional return instruction.  */
	      else if (condjump_p (jump))
		{
		  if (! redirect_jump (jump, 0, 0))
		    {
		      ei_next (&ei2);
		      continue;
		    }

		  /* See comment in simple_jump_p case above.  */
		  emit_use_return_register_into_block (bb);

		  /* If this block has only one successor, it both jumps
		     and falls through to the fallthru block, so we can't
		     delete the edge.  */
		  if (single_succ_p (bb))
		    {
		      ei_next (&ei2);
		      continue;
		    }
		}
	      else
		{
		  ei_next (&ei2);
		  continue;
		}

	      /* Fix up the CFG for the successful change we just made.  */
	      redirect_edge_succ (e, EXIT_BLOCK_PTR);
	    }

	  /* Emit a return insn for the exit fallthru block.  Whether
	     this is still reachable will be determined later.  */

	  emit_barrier_after (BB_END (last));
	  emit_return_into_block (last);
	  epilogue_end = BB_END (last);
	  single_succ_edge (last)->flags &= ~EDGE_FALLTHRU;
	  goto epilogue_done;
	}
    }
#endif

  /* A small fib -- epilogue is not yet completed, but we wish to re-use
     this marker for the splits of EH_RETURN patterns, and nothing else
     uses the flag in the meantime.  */
  epilogue_completed = 1;

#ifdef HAVE_eh_return
  /* Find non-fallthru edges that end with EH_RETURN instructions.  On
     some targets, these get split to a special version of the epilogue
     code.  In order to be able to properly annotate these with unwind
     info, try to split them now.  If we get a valid split, drop an
     EPILOGUE_BEG note and mark the insns as epilogue insns.  */
  FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
    {
      rtx prev, last, trial;

      if (e->flags & EDGE_FALLTHRU)
	continue;
      last = BB_END (e->src);
      if (!eh_returnjump_p (last))
	continue;

      prev = PREV_INSN (last);
      trial = try_split (PATTERN (last), last, 1);
      if (trial == last)
	continue;

      record_insns (NEXT_INSN (prev), NEXT_INSN (trial), &epilogue_insn_hash);
      emit_note_after (NOTE_INSN_EPILOGUE_BEG, prev);
    }
#endif

  /* Find the edge that falls through to EXIT.  Other edges may exist
     due to RETURN instructions, but those don't need epilogues.
     There really shouldn't be a mixture -- either all should have
     been converted or none, however...  */

  e = find_fallthru_edge (EXIT_BLOCK_PTR->preds);
  if (e == NULL)
    goto epilogue_done;

#ifdef HAVE_epilogue
  if (HAVE_epilogue)
    {
      start_sequence ();
      epilogue_end = emit_note (NOTE_INSN_EPILOGUE_BEG);
      seq = gen_epilogue ();
      if (seq)
	emit_jump_insn (seq);

      /* Retain a map of the epilogue insns.  */
      record_insns (seq, NULL, &epilogue_insn_hash);
      set_insn_locators (seq, epilogue_locator);

      seq = get_insns ();
      end_sequence ();

      insert_insn_on_edge (seq, e);
      inserted = true;
    }
  else
#endif
    {
      basic_block cur_bb;

      if (! next_active_insn (BB_END (e->src)))
	goto epilogue_done;
      /* We have a fall-through edge to the exit block, the source is not
	 at the end of the function, and there will be an assembler epilogue
	 at the end of the function.
	 We can't use force_nonfallthru here, because that would try to
	 use return.  Inserting a jump 'by hand' is extremely messy, so
	 we take advantage of cfg_layout_finalize using
	 fixup_fallthru_exit_predecessor.  */
      cfg_layout_initialize (0);
      FOR_EACH_BB (cur_bb)
	if (cur_bb->index >= NUM_FIXED_BLOCKS
	    && cur_bb->next_bb->index >= NUM_FIXED_BLOCKS)
	  cur_bb->aux = cur_bb->next_bb;
      cfg_layout_finalize ();
    }

epilogue_done:
  default_rtl_profile ();

  if (inserted)
    {
      sbitmap blocks;

      commit_edge_insertions ();

      /* Look for basic blocks within the prologue insns.  */
      blocks = sbitmap_alloc (last_basic_block);
      sbitmap_zero (blocks);
      SET_BIT (blocks, entry_edge->dest->index);
      find_many_sub_basic_blocks (blocks);
      sbitmap_free (blocks);

      /* The epilogue insns we inserted may cause the exit edge to no longer
	 be fallthru.  */
      FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
	if (((e->flags & EDGE_FALLTHRU) != 0)
	    && returnjump_p (BB_END (e->src)))
	  e->flags &= ~EDGE_FALLTHRU;
    }

#ifdef HAVE_sibcall_epilogue
  /* Emit sibling epilogues before any sibling call sites.  */
  for (ei = ei_start (EXIT_BLOCK_PTR->preds); (e = ei_safe_edge (ei)); )
    {
      basic_block bb = e->src;
      rtx insn = BB_END (bb);

      if (!CALL_P (insn)
	  || ! SIBLING_CALL_P (insn))
	{
	  ei_next (&ei);
	  continue;
	}

      start_sequence ();
      emit_note (NOTE_INSN_EPILOGUE_BEG);
      emit_insn (gen_sibcall_epilogue ());
      seq = get_insns ();
      end_sequence ();

      /* Retain a map of the epilogue insns.  Used in life analysis to
	 avoid getting rid of sibcall epilogue insns.  Do this before we
	 actually emit the sequence.  */
      record_insns (seq, NULL, &epilogue_insn_hash);
      set_insn_locators (seq, epilogue_locator);

      emit_insn_before (seq, insn);
      ei_next (&ei);
    }
#endif

#ifdef HAVE_epilogue
  if (epilogue_end)
    {
      rtx insn, next;

      /* Similarly, move any line notes that appear after the epilogue.
	 There is no need, however, to be quite so anal about the existence
	 of such a note.  Also possibly move
	 NOTE_INSN_FUNCTION_BEG notes, as those can be relevant for debug
	 info generation.  */
      for (insn = epilogue_end; insn; insn = next)
	{
	  next = NEXT_INSN (insn);
	  if (NOTE_P (insn)
	      && (NOTE_KIND (insn) == NOTE_INSN_FUNCTION_BEG))
	    reorder_insns (insn, insn, PREV_INSN (epilogue_end));
	}
    }
#endif

  /* Threading the prologue and epilogue changes the artificial refs
     in the entry and exit blocks.  */
  epilogue_completed = 1;
  df_update_entry_exit_and_calls ();
}
/* Reposition the prologue-end and epilogue-begin notes after
   instruction scheduling.  */

void
reposition_prologue_and_epilogue_notes (void)
{
#if defined (HAVE_prologue) || defined (HAVE_epilogue) \
    || defined (HAVE_sibcall_epilogue)
  /* Since the hash table is created on demand, the fact that it is
     non-null is a signal that it is non-empty.  */
  if (prologue_insn_hash != NULL)
    {
      size_t len = htab_elements (prologue_insn_hash);
      rtx insn, last = NULL, note = NULL;

      /* Scan from the beginning until we reach the last prologue insn.  */
      /* ??? While we do have the CFG intact, there are two problems:
	 (1) The prologue can contain loops (typically probing the stack),
	     which means that the end of the prologue isn't in the first bb.
	 (2) Sometimes the PROLOGUE_END note gets pushed into the next bb.  */
      for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
	{
	  if (NOTE_P (insn))
	    {
	      if (NOTE_KIND (insn) == NOTE_INSN_PROLOGUE_END)
		note = insn;
	    }
	  else if (contains (insn, prologue_insn_hash))
	    {
	      last = insn;
	      if (--len == 0)
		break;
	    }
	}

      if (last)
	{
	  if (note == NULL)
	    {
	      /* Scan forward looking for the PROLOGUE_END note.  It should
		 be right at the beginning of the block, possibly with other
		 insn notes that got moved there.  */
	      for (note = NEXT_INSN (last); ; note = NEXT_INSN (note))
		{
		  if (NOTE_P (note)
		      && NOTE_KIND (note) == NOTE_INSN_PROLOGUE_END)
		    break;
		}
	    }

	  /* Avoid placing note between CODE_LABEL and BASIC_BLOCK note.  */
	  if (LABEL_P (last))
	    last = NEXT_INSN (last);
	  reorder_insns (note, note, last);
	}
    }

  if (epilogue_insn_hash != NULL)
    {
      edge_iterator ei;
      edge e;

      FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
	{
	  rtx insn, first = NULL, note = NULL;
	  basic_block bb = e->src;

	  /* Scan from the beginning until we reach the first epilogue insn.  */
	  FOR_BB_INSNS (bb, insn)
	    {
	      if (NOTE_P (insn))
		{
		  if (NOTE_KIND (insn) == NOTE_INSN_EPILOGUE_BEG)
		    {
		      note = insn;
		      if (first != NULL)
			break;
		    }
		}
	      else if (first == NULL && contains (insn, epilogue_insn_hash))
		{
		  first = insn;
		  if (note != NULL)
		    break;
		}
	    }

	  if (note)
	    {
	      /* If the function has a single basic block, and no real
		 epilogue insns (e.g. sibcall with no cleanup), the
		 epilogue note can get scheduled before the prologue
		 note.  If we have frame related prologue insns, having
		 them scanned during the epilogue will result in a crash.
		 In this case re-order the epilogue note to just before
		 the last insn in the block.  */
	      if (first == NULL)
		first = BB_END (bb);

	      if (PREV_INSN (first) != note)
		reorder_insns (note, note, PREV_INSN (first));
	    }
	}
    }
#endif /* HAVE_prologue or HAVE_epilogue */
}
/* Returns the name of the current function.  */
const char *
current_function_name (void)
{
  if (cfun == NULL)
    return "<none>";
  return lang_hooks.decl_printable_name (cfun->decl, 2);
}


static unsigned int
rest_of_handle_check_leaf_regs (void)
{
#ifdef LEAF_REGISTERS
  current_function_uses_only_leaf_regs
    = optimize > 0 && only_leaf_regs_used () && leaf_function_p ();
#endif
  return 0;
}
/* Insert a TYPE into the used types hash table of CFUN.  */

static void
used_types_insert_helper (tree type, struct function *func)
{
  if (type != NULL && func != NULL)
    {
      void **slot;

      if (func->used_types_hash == NULL)
	func->used_types_hash = htab_create_ggc (37, htab_hash_pointer,
						 htab_eq_pointer, NULL);
      slot = htab_find_slot (func->used_types_hash, type, INSERT);
      if (*slot == NULL)
	*slot = type;
    }
}

/* Given a type, insert it into the used hash table in cfun.  */
void
used_types_insert (tree t)
{
  while (POINTER_TYPE_P (t) || TREE_CODE (t) == ARRAY_TYPE)
    t = TREE_TYPE (t);

  if (TREE_CODE (t) == ERROR_MARK)
    return;
  if (TYPE_NAME (t) == NULL_TREE
      || TYPE_NAME (t) == TYPE_NAME (TYPE_MAIN_VARIANT (t)))
    t = TYPE_MAIN_VARIANT (t);
  if (debug_info_level > DINFO_LEVEL_NONE)
    {
      if (cfun)
	used_types_insert_helper (t, cfun);
      else
	/* So this might be a type referenced by a global variable.
	   Record that type so that we can later decide to emit its debug
	   information.  */
	VEC_safe_push (tree, gc, types_used_by_cur_var_decl, t);
    }
}
/* Helper to hash a struct types_used_by_vars_entry.  */

static hashval_t
hash_types_used_by_vars_entry (const struct types_used_by_vars_entry *entry)
{
  gcc_assert (entry && entry->var_decl && entry->type);

  return iterative_hash_object (entry->type,
				iterative_hash_object (entry->var_decl, 0));
}

/* Hash function of the types_used_by_vars_entry hash table.  */

hashval_t
types_used_by_vars_do_hash (const void *x)
{
  const struct types_used_by_vars_entry *entry =
    (const struct types_used_by_vars_entry *) x;

  return hash_types_used_by_vars_entry (entry);
}

/* Equality function of the types_used_by_vars_entry hash table.  */

int
types_used_by_vars_eq (const void *x1, const void *x2)
{
  const struct types_used_by_vars_entry *e1 =
    (const struct types_used_by_vars_entry *) x1;
  const struct types_used_by_vars_entry *e2 =
    (const struct types_used_by_vars_entry *) x2;

  return (e1->var_decl == e2->var_decl && e1->type == e2->type);
}
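
/* The pair (types_used_by_vars_do_hash, types_used_by_vars_eq) keys the
   hash table on the (var_decl, type) pair: two entries hash and compare
   equal only when both fields match, as the hashtab callbacks require.  */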
/* Inserts an entry into the types_used_by_vars_hash hash table.  */

void
types_used_by_var_decl_insert (tree type, tree var_decl)
{
  if (type != NULL && var_decl != NULL)
    {
      void **slot;
      struct types_used_by_vars_entry e;
      e.var_decl = var_decl;
      e.type = type;
      if (types_used_by_vars_hash == NULL)
	types_used_by_vars_hash =
	  htab_create_ggc (37, types_used_by_vars_do_hash,
			   types_used_by_vars_eq, NULL);
      slot = htab_find_slot_with_hash (types_used_by_vars_hash, &e,
				       hash_types_used_by_vars_entry (&e),
				       INSERT);
      if (*slot == NULL)
	{
	  struct types_used_by_vars_entry *entry;
	  entry = ggc_alloc_types_used_by_vars_entry ();
	  entry->type = type;
	  entry->var_decl = var_decl;
	  *slot = entry;
	}
    }
}
struct rtl_opt_pass pass_leaf_regs =
{
 {
  RTL_PASS,
  "*leaf_regs",                         /* name */
  NULL,                                 /* gate */
  rest_of_handle_check_leaf_regs,       /* execute */
  NULL,                                 /* sub */
  NULL,                                 /* next */
  0,                                    /* static_pass_number */
  TV_NONE,                              /* tv_id */
  0,                                    /* properties_required */
  0,                                    /* properties_provided */
  0,                                    /* properties_destroyed */
  0,                                    /* todo_flags_start */
  0                                     /* todo_flags_finish */
 }
};

static unsigned int
rest_of_handle_thread_prologue_and_epilogue (void)
{
  if (optimize)
    cleanup_cfg (CLEANUP_EXPENSIVE);

  /* On some machines, the prologue and epilogue code, or parts thereof,
     can be represented as RTL.  Doing so lets us schedule insns between
     it and the rest of the code and also allows delayed branch
     scheduling to operate in the epilogue.  */
  thread_prologue_and_epilogue_insns ();

  /* The stack usage info is finalized during prologue expansion.  */
  if (flag_stack_usage)
    output_stack_usage ();

  return 0;
}

struct rtl_opt_pass pass_thread_prologue_and_epilogue =
{
 {
  RTL_PASS,
  "pro_and_epilogue",                   /* name */
  NULL,                                 /* gate */
  rest_of_handle_thread_prologue_and_epilogue, /* execute */
  NULL,                                 /* sub */
  NULL,                                 /* next */
  0,                                    /* static_pass_number */
  TV_THREAD_PROLOGUE_AND_EPILOGUE,      /* tv_id */
  0,                                    /* properties_required */
  0,                                    /* properties_provided */
  0,                                    /* properties_destroyed */
  TODO_verify_flow,                     /* todo_flags_start */
  TODO_df_finish | TODO_verify_rtl_sharing |
  TODO_ggc_collect                      /* todo_flags_finish */
 }
};
/* This mini-pass fixes fall-out from SSA in asm statements that have
   in-out constraints.  Say you start with

     asm ("": "+mr" (inout));

   which is transformed very early to use explicit output and match operands:

     asm ("": "=mr" (inout) : "0" (inout));

   Or, after SSA and copyprop,

     asm ("": "=mr" (inout_2) : "0" (inout_1));

   Clearly inout_2 and inout_1 can't be coalesced easily anymore, as
   they represent two separate values, so they will get different pseudo
   registers during expansion.  Then, since the two operands need to match
   per the constraints, but use different pseudo registers, reload can
   only register a reload for these operands.  But reloads can only be
   satisfied by hardregs, not by memory, so we need a register for this
   reload, just because we are presented with non-matching operands.
   So, even though we allow memory for this operand, no memory can be
   used for it, just because the two operands don't match.  This can
   cause reload failures on register-starved targets.

   So it's a symptom of reload not being able to use memory for reloads
   or, alternatively it's also a symptom of both operands not coming into
   reload as matching (in which case the pseudo could go to memory just
   fine, as the alternative allows it, and no reload would be necessary).
   We fix the latter problem here, by transforming

     asm ("": "=mr" (inout_2) : "0" (inout_1));

   back to

     inout_2 = inout_1;
     asm ("": "=mr" (inout_2) : "0" (inout_2));  */
static void
match_asm_constraints_1 (rtx insn, rtx *p_sets, int noutputs)
{
  int i;
  bool changed = false;
  rtx op = SET_SRC (p_sets[0]);
  int ninputs = ASM_OPERANDS_INPUT_LENGTH (op);
  rtvec inputs = ASM_OPERANDS_INPUT_VEC (op);
  bool *output_matched = XALLOCAVEC (bool, noutputs);

  memset (output_matched, 0, noutputs * sizeof (bool));
  for (i = 0; i < ninputs; i++)
    {
      rtx input, output, insns;
      const char *constraint = ASM_OPERANDS_INPUT_CONSTRAINT (op, i);
      char *end;
      int match, j;

      if (*constraint == '%')
	constraint++;

      match = strtoul (constraint, &end, 10);
      if (end == constraint)
	continue;

      gcc_assert (match < noutputs);
      output = SET_DEST (p_sets[match]);
      input = RTVEC_ELT (inputs, i);
      /* Only do the transformation for pseudos.  */
      if (! REG_P (output)
	  || rtx_equal_p (output, input)
	  || (GET_MODE (input) != VOIDmode
	      && GET_MODE (input) != GET_MODE (output)))
	continue;

      /* We can't do anything if the output is also used as input,
	 as we're going to overwrite it.  */
      for (j = 0; j < ninputs; j++)
	if (reg_overlap_mentioned_p (output, RTVEC_ELT (inputs, j)))
	  break;
      if (j != ninputs)
	continue;

      /* Avoid changing the same input several times.  For
	 asm ("" : "=mr" (out1), "=mr" (out2) : "0" (in), "1" (in));
	 only change in once (to out1), rather than changing it
	 first to out1 and afterwards to out2.  */
      if (i > 0)
	{
	  for (j = 0; j < noutputs; j++)
	    if (output_matched[j] && input == SET_DEST (p_sets[j]))
	      break;
	  if (j != noutputs)
	    continue;
	}
      output_matched[match] = true;

      start_sequence ();
      emit_move_insn (output, input);
      insns = get_insns ();
      end_sequence ();
      emit_insn_before (insns, insn);

      /* Now replace all mentions of the input with output.  We can't
	 just replace the occurrence in inputs[i], as the register might
	 also be used in some other input (or even in an address of an
	 output), which would mean possibly increasing the number of
	 inputs by one (namely 'output' in addition), which might pose
	 a too complicated problem for reload to solve.  E.g. this situation:

	   asm ("" : "=r" (output), "=m" (input) : "0" (input))

	 Here 'input' is used in two occurrences as input (once for the
	 input operand, once for the address in the second output operand).
	 If we would replace only the occurrence of the input operand (to
	 make the matching) we would be left with this:

	   output = input
	   asm ("" : "=r" (output), "=m" (input) : "0" (output))

	 Now we suddenly have two different input values (containing the same
	 value, but different pseudos) where we formerly had only one.
	 With more complicated asms this might lead to reload failures
	 which wouldn't have happened without this pass.  So, iterate over
	 all operands and replace all occurrences of the register used.  */
      for (j = 0; j < noutputs; j++)
	if (!rtx_equal_p (SET_DEST (p_sets[j]), input)
	    && reg_overlap_mentioned_p (input, SET_DEST (p_sets[j])))
	  SET_DEST (p_sets[j]) = replace_rtx (SET_DEST (p_sets[j]),
					      input, output);

      for (j = 0; j < ninputs; j++)
	if (reg_overlap_mentioned_p (input, RTVEC_ELT (inputs, j)))
	  RTVEC_ELT (inputs, j) = replace_rtx (RTVEC_ELT (inputs, j),
					       input, output);

      changed = true;
    }

  if (changed)
    df_insn_rescan (insn);
}
static unsigned int
rest_of_match_asm_constraints (void)
{
  basic_block bb;
  rtx insn, pat, *p_sets;
  int noutputs;

  if (!crtl->has_asm_statement)
    return 0;

  df_set_flags (DF_DEFER_INSN_RESCAN);
  FOR_EACH_BB (bb)
    {
      FOR_BB_INSNS (bb, insn)
	{
	  if (!INSN_P (insn))
	    continue;

	  pat = PATTERN (insn);
	  if (GET_CODE (pat) == PARALLEL)
	    p_sets = &XVECEXP (pat, 0, 0), noutputs = XVECLEN (pat, 0);
	  else if (GET_CODE (pat) == SET)
	    p_sets = &PATTERN (insn), noutputs = 1;
	  else
	    continue;

	  if (GET_CODE (*p_sets) == SET
	      && GET_CODE (SET_SRC (*p_sets)) == ASM_OPERANDS)
	    match_asm_constraints_1 (insn, p_sets, noutputs);
	}
    }

  return TODO_df_finish;
}

struct rtl_opt_pass pass_match_asm_constraints =
{
 {
  RTL_PASS,
  "asmcons",                            /* name */
  NULL,                                 /* gate */
  rest_of_match_asm_constraints,        /* execute */
  NULL,                                 /* sub */
  NULL,                                 /* next */
  0,                                    /* static_pass_number */
  TV_NONE,                              /* tv_id */
  0,                                    /* properties_required */
  0,                                    /* properties_provided */
  0,                                    /* properties_destroyed */
  0,                                    /* todo_flags_start */
  TODO_dump_func                        /* todo_flags_finish */
 }
};


#include "gt-function.h"