1 /* Expands front end tree to back end RTL for GCC.
2 Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997,
3 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008
4 Free Software Foundation, Inc.
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 3, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 /* This file handles the generation of rtl code from tree structure
23 at the level of the function as a whole.
24 It creates the rtl expressions for parameters and auto variables
25 and has full responsibility for allocating stack slots.
27 `expand_function_start' is called at the beginning of a function,
28 before the function body is parsed, and `expand_function_end' is
29 called after parsing the body.
31 Call `assign_stack_local' to allocate a stack slot for a local variable.
32 This is usually done during the RTL generation for the function body,
33 but it can also be done in the reload pass when a pseudo-register does
34 not get a hard register. */
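/* For illustration only (a rough sketch, not an interface defined in
   this comment): expansion code that needs a word of scratch stack
   memory might write

       rtx slot = assign_stack_local (SImode, GET_MODE_SIZE (SImode), 0);
       emit_move_insn (slot, reg);

   where REG is some pseudo-register of the caller's, and an ALIGN
   argument of 0 asks for the default alignment of the mode, as
   documented at assign_stack_local below.  */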
36 #include "config.h"
37 #include "system.h"
38 #include "coretypes.h"
39 #include "tm.h"
40 #include "rtl.h"
41 #include "tree.h"
42 #include "flags.h"
43 #include "except.h"
44 #include "function.h"
45 #include "expr.h"
46 #include "optabs.h"
47 #include "libfuncs.h"
48 #include "regs.h"
49 #include "hard-reg-set.h"
50 #include "insn-config.h"
51 #include "recog.h"
52 #include "output.h"
53 #include "basic-block.h"
54 #include "toplev.h"
55 #include "hashtab.h"
56 #include "ggc.h"
57 #include "tm_p.h"
58 #include "integrate.h"
59 #include "langhooks.h"
60 #include "target.h"
61 #include "cfglayout.h"
62 #include "tree-gimple.h"
63 #include "tree-pass.h"
64 #include "predict.h"
65 #include "df.h"
66 #include "timevar.h"
67 #include "vecprim.h"
68 #include "cgraph.h"
70 /* So we can assign to cfun in this file. */
71 #undef cfun
73 #ifndef STACK_ALIGNMENT_NEEDED
74 #define STACK_ALIGNMENT_NEEDED 1
75 #endif
77 #define STACK_BYTES (STACK_BOUNDARY / BITS_PER_UNIT)
79 /* Some systems use __main in a way incompatible with its use in gcc; in these
80 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
81 give the same symbol without quotes for an alternative entry point. You
82 must define both, or neither. */
83 #ifndef NAME__MAIN
84 #define NAME__MAIN "__main"
85 #endif
87 /* Round a value down to the largest multiple of the required alignment
88 that does not exceed it. Avoid using division in case the value is
89 negative. Assume the alignment is a power of two. */
90 #define FLOOR_ROUND(VALUE,ALIGN) ((VALUE) & ~((ALIGN) - 1))
92 /* Similar, but round up to the next multiple of the required
93 alignment. */
94 #define CEIL_ROUND(VALUE,ALIGN) (((VALUE) + (ALIGN) - 1) & ~((ALIGN) - 1))
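/* For example, with an 8-byte alignment and two's complement arithmetic:
     FLOOR_ROUND (-13, 8) == -16    FLOOR_ROUND (16, 8) == 16
     CEIL_ROUND  ( 13, 8) ==  16    CEIL_ROUND  (16, 8) == 16
   as long as ALIGN is a power of two, per the assumption above.  */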
96 /* Nonzero if function being compiled doesn't contain any calls
97 (ignoring the prologue and epilogue). This is set prior to
98 local register allocation and is valid for the remaining
99 compiler passes. */
100 int current_function_is_leaf;
102 /* Nonzero if function being compiled doesn't modify the stack pointer
103 (ignoring the prologue and epilogue). This is only valid after
104 pass_stack_ptr_mod has run. */
105 int current_function_sp_is_unchanging;
107 /* Nonzero if the function being compiled is a leaf function which only
108 uses leaf registers. This is valid after reload (specifically after
109 sched2) and is useful only if the port defines LEAF_REGISTERS. */
110 int current_function_uses_only_leaf_regs;
112 /* Nonzero once virtual register instantiation has been done.
113 assign_stack_local uses frame_pointer_rtx when this is nonzero.
114 calls.c:emit_library_call_value_1 uses it to set up
115 post-instantiation libcalls. */
116 int virtuals_instantiated;
118 /* Assign unique numbers to labels generated for profiling, debugging, etc. */
119 static GTY(()) int funcdef_no;
121 /* This variable holds a pointer to the function used to create
122 target specific, per-function data structures. */
123 struct machine_function * (*init_machine_status) (void);
125 /* The currently compiled function. */
126 struct function *cfun = 0;
128 /* These arrays record the INSN_UIDs of the prologue and epilogue insns. */
129 static VEC(int,heap) *prologue;
130 static VEC(int,heap) *epilogue;
132 /* Array holding the INSN_UIDs of each sibcall epilogue
133 in this function. */
134 static VEC(int,heap) *sibcall_epilogue;
136 /* In order to evaluate some expressions, such as function calls returning
137 structures in memory, we need to temporarily allocate stack locations.
138 We record each allocated temporary in the following structure.
140 Associated with each temporary slot is a nesting level. When we pop up
141 one level, all temporaries associated with the previous level are freed.
142 Normally, all temporaries are freed after the execution of the statement
143 in which they were created. However, if we are inside a ({...}) grouping,
144 the result may be in a temporary and hence must be preserved. If the
145 result could be in a temporary, we preserve it if we can determine which
146 one it is in. If we cannot determine which temporary may contain the
147 result, all temporaries are preserved. A temporary is preserved by
148 pretending it was allocated at the previous nesting level.
150 Automatic variables are also assigned temporary slots, at the nesting
151 level where they are defined. They are marked as "kept" so that
152 free_temp_slots will not free them. */
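/* A minimal sketch of how the nesting interface below is typically used
   by expansion code (illustrative only; TEMP and RESULT are placeholder
   rtx values of the caller's):

       push_temp_slots ();
       temp = assign_stack_temp (DImode, GET_MODE_SIZE (DImode), 0);
       ... emit code that computes into TEMP ...
       preserve_temp_slots (result);
       free_temp_slots ();
       pop_temp_slots ();

   where preserve_temp_slots is needed only when RESULT may itself live
   in one of the temporaries of the current level.  */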
154 struct temp_slot GTY(())
156 /* Points to next temporary slot. */
157 struct temp_slot *next;
158 /* Points to previous temporary slot. */
159 struct temp_slot *prev;
161 /* The rtx used to reference the slot. */
162 rtx slot;
163 /* The rtx used to represent the address if not the address of the
164 slot above. May be an EXPR_LIST if multiple addresses exist. */
165 rtx address;
166 /* The alignment (in bits) of the slot. */
167 unsigned int align;
168 /* The size, in units, of the slot. */
169 HOST_WIDE_INT size;
170 /* The type of the object in the slot, or zero if it doesn't correspond
171 to a type. We use this to determine whether a slot can be reused.
172 It can be reused if objects of the type of the new slot will always
173 conflict with objects of the type of the old slot. */
174 tree type;
175 /* Nonzero if this temporary is currently in use. */
176 char in_use;
177 /* Nonzero if this temporary has its address taken. */
178 char addr_taken;
179 /* Nesting level at which this slot is being used. */
180 int level;
181 /* Nonzero if this should survive a call to free_temp_slots. */
182 int keep;
183 /* The offset of the slot from the frame_pointer, including extra space
184 for alignment. This info is for combine_temp_slots. */
185 HOST_WIDE_INT base_offset;
186 /* The size of the slot, including extra space for alignment. This
187 info is for combine_temp_slots. */
188 HOST_WIDE_INT full_size;
191 /* Forward declarations. */
193 static struct temp_slot *find_temp_slot_from_address (rtx);
194 static void pad_to_arg_alignment (struct args_size *, int, struct args_size *);
195 static void pad_below (struct args_size *, enum machine_mode, tree);
196 static void reorder_blocks_1 (rtx, tree, VEC(tree,heap) **);
197 static int all_blocks (tree, tree *);
198 static tree *get_block_vector (tree, int *);
199 extern tree debug_find_var_in_block_tree (tree, tree);
200 /* We always define `record_insns' even if it's not used so that we
201 can always export `prologue_epilogue_contains'. */
202 static void record_insns (rtx, VEC(int,heap) **) ATTRIBUTE_UNUSED;
203 static int contains (const_rtx, VEC(int,heap) **);
204 #ifdef HAVE_return
205 static void emit_return_into_block (basic_block);
206 #endif
207 static void prepare_function_start (void);
208 static void do_clobber_return_reg (rtx, void *);
209 static void do_use_return_reg (rtx, void *);
210 static void set_insn_locators (rtx, int) ATTRIBUTE_UNUSED;
212 /* Pointer to chain of `struct function' for containing functions. */
213 struct function *outer_function_chain;
215 /* Given a function decl for a containing function,
216 return the `struct function' for it. */
218 struct function *
219 find_function_data (tree decl)
221 struct function *p;
223 for (p = outer_function_chain; p; p = p->outer)
224 if (p->decl == decl)
225 return p;
227 gcc_unreachable ();
230 /* Save the current context for compilation of a nested function.
231 This is called from language-specific code. */
233 void
234 push_function_context (void)
236 if (cfun == 0)
237 allocate_struct_function (NULL, false);
239 cfun->outer = outer_function_chain;
240 outer_function_chain = cfun;
241 set_cfun (NULL);
244 /* Restore the last saved context, at the end of a nested function.
245 This function is called from language-specific code. */
247 void
248 pop_function_context (void)
250 struct function *p = outer_function_chain;
252 set_cfun (p);
253 outer_function_chain = p->outer;
254 current_function_decl = p->decl;
256 /* Reset variables that have known state during rtx generation. */
257 virtuals_instantiated = 0;
258 generating_concat_p = 1;
261 /* Clear out all parts of the state in F that can safely be discarded
262 after the function has been parsed, but not compiled, to let
263 garbage collection reclaim the memory. */
265 void
266 free_after_parsing (struct function *f)
268 f->language = 0;
271 /* Clear out all parts of the state in F that can safely be discarded
272 after the function has been compiled, to let garbage collection
273 reclaim the memory. */
275 void
276 free_after_compilation (struct function *f)
278 VEC_free (int, heap, prologue);
279 VEC_free (int, heap, epilogue);
280 VEC_free (int, heap, sibcall_epilogue);
281 if (crtl->emit.regno_pointer_align)
282 free (crtl->emit.regno_pointer_align);
284 memset (crtl, 0, sizeof (struct rtl_data));
285 f->eh = NULL;
286 f->machine = NULL;
287 f->cfg = NULL;
289 regno_reg_rtx = NULL;
292 /* Return size needed for stack frame based on slots so far allocated.
293 This size counts from zero. It is not rounded to PREFERRED_STACK_BOUNDARY;
294 the caller may have to do that. */
296 HOST_WIDE_INT
297 get_frame_size (void)
299 if (FRAME_GROWS_DOWNWARD)
300 return -frame_offset;
301 else
302 return frame_offset;
305 /* Issue an error message and return TRUE if frame OFFSET overflows in
306 the signed target pointer arithmetic for function FUNC. Otherwise
307 return FALSE. */
309 bool
310 frame_offset_overflow (HOST_WIDE_INT offset, tree func)
312 unsigned HOST_WIDE_INT size = FRAME_GROWS_DOWNWARD ? -offset : offset;
314 if (size > ((unsigned HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (Pmode) - 1))
315 /* Leave room for the fixed part of the frame. */
316 - 64 * UNITS_PER_WORD)
318 error ("%Jtotal size of local objects too large", func);
319 return TRUE;
322 return FALSE;
325 /* Return stack slot alignment in bits for TYPE and MODE. */
327 static unsigned int
328 get_stack_local_alignment (tree type, enum machine_mode mode)
330 unsigned int alignment;
332 if (mode == BLKmode)
333 alignment = BIGGEST_ALIGNMENT;
334 else
335 alignment = GET_MODE_ALIGNMENT (mode);
337 /* Allow the front-end to (possibly) increase the alignment of this
338 stack slot. */
339 if (! type)
340 type = lang_hooks.types.type_for_mode (mode, 0);
342 return STACK_SLOT_ALIGNMENT (type, mode, alignment);
345 /* Allocate a stack slot of SIZE bytes and return a MEM rtx for it
346 with machine mode MODE.
348 ALIGN controls the amount of alignment for the address of the slot:
349 0 means according to MODE,
350 -1 means use BIGGEST_ALIGNMENT and round size to multiple of that,
351 -2 means use BITS_PER_UNIT,
352 positive specifies alignment boundary in bits.
354 We do not round to stack_boundary here. */
356 rtx
357 assign_stack_local (enum machine_mode mode, HOST_WIDE_INT size, int align)
359 rtx x, addr;
360 int bigend_correction = 0;
361 unsigned int alignment, alignment_in_bits;
362 int frame_off, frame_alignment, frame_phase;
364 if (align == 0)
366 alignment = get_stack_local_alignment (NULL, mode);
367 alignment /= BITS_PER_UNIT;
369 else if (align == -1)
371 alignment = BIGGEST_ALIGNMENT / BITS_PER_UNIT;
372 size = CEIL_ROUND (size, alignment);
374 else if (align == -2)
375 alignment = 1; /* BITS_PER_UNIT / BITS_PER_UNIT */
376 else
377 alignment = align / BITS_PER_UNIT;
379 if (FRAME_GROWS_DOWNWARD)
380 frame_offset -= size;
382 /* Ignore alignment we cannot honor given the expected alignment of the stack boundary. */
383 if (alignment * BITS_PER_UNIT > PREFERRED_STACK_BOUNDARY)
384 alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
386 alignment_in_bits = alignment * BITS_PER_UNIT;
388 if (crtl->stack_alignment_needed < alignment_in_bits)
389 crtl->stack_alignment_needed = alignment_in_bits;
391 /* Calculate how many bytes the start of local variables is off from
392 stack alignment. */
393 frame_alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
394 frame_off = STARTING_FRAME_OFFSET % frame_alignment;
395 frame_phase = frame_off ? frame_alignment - frame_off : 0;
397 /* Round the frame offset to the specified alignment. The default is
398 to always honor requests to align the stack but a port may choose to
399 do its own stack alignment by defining STACK_ALIGNMENT_NEEDED. */
400 if (STACK_ALIGNMENT_NEEDED
401 || mode != BLKmode
402 || size != 0)
404 /* We must be careful here, since FRAME_OFFSET might be negative and
405 division with a negative dividend isn't as well defined as we might
406 like. So we instead assume that ALIGNMENT is a power of two and
407 use logical operations which are unambiguous. */
408 if (FRAME_GROWS_DOWNWARD)
409 frame_offset
410 = (FLOOR_ROUND (frame_offset - frame_phase,
411 (unsigned HOST_WIDE_INT) alignment)
412 + frame_phase);
413 else
414 frame_offset
415 = (CEIL_ROUND (frame_offset - frame_phase,
416 (unsigned HOST_WIDE_INT) alignment)
417 + frame_phase);
420 /* On a big-endian machine, if we are allocating more space than we will use,
421 use the least significant bytes of those that are allocated. */
422 if (BYTES_BIG_ENDIAN && mode != BLKmode && GET_MODE_SIZE (mode) < size)
423 bigend_correction = size - GET_MODE_SIZE (mode);
425 /* If we have already instantiated virtual registers, return the actual
426 address relative to the frame pointer. */
427 if (virtuals_instantiated)
428 addr = plus_constant (frame_pointer_rtx,
429 trunc_int_for_mode
430 (frame_offset + bigend_correction
431 + STARTING_FRAME_OFFSET, Pmode));
432 else
433 addr = plus_constant (virtual_stack_vars_rtx,
434 trunc_int_for_mode
435 (frame_offset + bigend_correction,
436 Pmode));
438 if (!FRAME_GROWS_DOWNWARD)
439 frame_offset += size;
441 x = gen_rtx_MEM (mode, addr);
442 set_mem_align (x, alignment_in_bits);
443 MEM_NOTRAP_P (x) = 1;
445 stack_slot_list
446 = gen_rtx_EXPR_LIST (VOIDmode, x, stack_slot_list);
448 if (frame_offset_overflow (frame_offset, current_function_decl))
449 frame_offset = 0;
451 return x;
454 /* Removes temporary slot TEMP from LIST. */
456 static void
457 cut_slot_from_list (struct temp_slot *temp, struct temp_slot **list)
459 if (temp->next)
460 temp->next->prev = temp->prev;
461 if (temp->prev)
462 temp->prev->next = temp->next;
463 else
464 *list = temp->next;
466 temp->prev = temp->next = NULL;
469 /* Inserts temporary slot TEMP to LIST. */
471 static void
472 insert_slot_to_list (struct temp_slot *temp, struct temp_slot **list)
474 temp->next = *list;
475 if (*list)
476 (*list)->prev = temp;
477 temp->prev = NULL;
478 *list = temp;
481 /* Returns the list of used temp slots at LEVEL. */
483 static struct temp_slot **
484 temp_slots_at_level (int level)
486 if (level >= (int) VEC_length (temp_slot_p, used_temp_slots))
487 VEC_safe_grow_cleared (temp_slot_p, gc, used_temp_slots, level + 1);
489 return &(VEC_address (temp_slot_p, used_temp_slots)[level]);
492 /* Returns the maximal temporary slot level. */
494 static int
495 max_slot_level (void)
497 if (!used_temp_slots)
498 return -1;
500 return VEC_length (temp_slot_p, used_temp_slots) - 1;
503 /* Moves temporary slot TEMP to LEVEL. */
505 static void
506 move_slot_to_level (struct temp_slot *temp, int level)
508 cut_slot_from_list (temp, temp_slots_at_level (temp->level));
509 insert_slot_to_list (temp, temp_slots_at_level (level));
510 temp->level = level;
513 /* Make temporary slot TEMP available. */
515 static void
516 make_slot_available (struct temp_slot *temp)
518 cut_slot_from_list (temp, temp_slots_at_level (temp->level));
519 insert_slot_to_list (temp, &avail_temp_slots);
520 temp->in_use = 0;
521 temp->level = -1;
524 /* Allocate a temporary stack slot and record it for possible later
525 reuse.
527 MODE is the machine mode to be given to the returned rtx.
529 SIZE is the size in units of the space required. We do no rounding here
530 since assign_stack_local will do any required rounding.
532 KEEP is 1 if this slot is to be retained after a call to
533 free_temp_slots. Automatic variables for a block are allocated
534 with this flag. KEEP values of 2 or 3 were needed respectively
535 for variables whose lifetime is controlled by CLEANUP_POINT_EXPRs
536 or for SAVE_EXPRs, but they are now unused.
538 TYPE is the type that will be used for the stack slot. */
540 rtx
541 assign_stack_temp_for_type (enum machine_mode mode, HOST_WIDE_INT size,
542 int keep, tree type)
544 unsigned int align;
545 struct temp_slot *p, *best_p = 0, *selected = NULL, **pp;
546 rtx slot;
548 /* If SIZE is -1 it means that somebody tried to allocate a temporary
549 of a variable size. */
550 gcc_assert (size != -1);
552 /* These are now unused. */
553 gcc_assert (keep <= 1);
555 align = get_stack_local_alignment (type, mode);
557 /* Try to find an available, already-allocated temporary of the proper
558 mode which meets the size and alignment requirements. Choose the
559 smallest one with the closest alignment.
561 If assign_stack_temp is called outside of the tree->rtl expansion,
562 we cannot reuse the stack slots (that may still refer to
563 VIRTUAL_STACK_VARS_REGNUM). */
564 if (!virtuals_instantiated)
566 for (p = avail_temp_slots; p; p = p->next)
568 if (p->align >= align && p->size >= size
569 && GET_MODE (p->slot) == mode
570 && objects_must_conflict_p (p->type, type)
571 && (best_p == 0 || best_p->size > p->size
572 || (best_p->size == p->size && best_p->align > p->align)))
574 if (p->align == align && p->size == size)
576 selected = p;
577 cut_slot_from_list (selected, &avail_temp_slots);
578 best_p = 0;
579 break;
581 best_p = p;
586 /* Make our best, if any, the one to use. */
587 if (best_p)
589 selected = best_p;
590 cut_slot_from_list (selected, &avail_temp_slots);
592 /* If there are enough aligned bytes left over, make them into a new
593 temp_slot so that the extra bytes don't get wasted. Do this only
594 for BLKmode slots, so that we can be sure of the alignment. */
595 if (GET_MODE (best_p->slot) == BLKmode)
597 int alignment = best_p->align / BITS_PER_UNIT;
598 HOST_WIDE_INT rounded_size = CEIL_ROUND (size, alignment);
600 if (best_p->size - rounded_size >= alignment)
602 p = ggc_alloc (sizeof (struct temp_slot));
603 p->in_use = p->addr_taken = 0;
604 p->size = best_p->size - rounded_size;
605 p->base_offset = best_p->base_offset + rounded_size;
606 p->full_size = best_p->full_size - rounded_size;
607 p->slot = adjust_address_nv (best_p->slot, BLKmode, rounded_size);
608 p->align = best_p->align;
609 p->address = 0;
610 p->type = best_p->type;
611 insert_slot_to_list (p, &avail_temp_slots);
613 stack_slot_list = gen_rtx_EXPR_LIST (VOIDmode, p->slot,
614 stack_slot_list);
616 best_p->size = rounded_size;
617 best_p->full_size = rounded_size;
622 /* If we still didn't find one, make a new temporary. */
623 if (selected == 0)
625 HOST_WIDE_INT frame_offset_old = frame_offset;
627 p = ggc_alloc (sizeof (struct temp_slot));
629 /* We are passing an explicit alignment request to assign_stack_local.
630 One side effect of that is assign_stack_local will not round SIZE
631 to ensure the frame offset remains suitably aligned.
633 So for requests which depended on the rounding of SIZE, we go ahead
634 and round it now. We also make sure ALIGNMENT is at least
635 BIGGEST_ALIGNMENT. */
636 gcc_assert (mode != BLKmode || align == BIGGEST_ALIGNMENT);
637 p->slot = assign_stack_local (mode,
638 (mode == BLKmode
639 ? CEIL_ROUND (size, (int) align / BITS_PER_UNIT)
640 : size),
641 align);
643 p->align = align;
645 /* The following slot size computation is necessary because we don't
646 know the actual size of the temporary slot until assign_stack_local
647 has performed all the frame alignment and size rounding for the
648 requested temporary. Note that extra space added for alignment
649 can be either above or below this stack slot depending on which
650 way the frame grows. We include the extra space if and only if it
651 is above this slot. */
652 if (FRAME_GROWS_DOWNWARD)
653 p->size = frame_offset_old - frame_offset;
654 else
655 p->size = size;
657 /* Now define the fields used by combine_temp_slots. */
658 if (FRAME_GROWS_DOWNWARD)
660 p->base_offset = frame_offset;
661 p->full_size = frame_offset_old - frame_offset;
663 else
665 p->base_offset = frame_offset_old;
666 p->full_size = frame_offset - frame_offset_old;
668 p->address = 0;
670 selected = p;
673 p = selected;
674 p->in_use = 1;
675 p->addr_taken = 0;
676 p->type = type;
677 p->level = temp_slot_level;
678 p->keep = keep;
680 pp = temp_slots_at_level (p->level);
681 insert_slot_to_list (p, pp);
683 /* Create a new MEM rtx to avoid clobbering MEM flags of old slots. */
684 slot = gen_rtx_MEM (mode, XEXP (p->slot, 0));
685 stack_slot_list = gen_rtx_EXPR_LIST (VOIDmode, slot, stack_slot_list);
687 /* If we know the alias set for the memory that will be used, use
688 it. If there's no TYPE, then we don't know anything about the
689 alias set for the memory. */
690 set_mem_alias_set (slot, type ? get_alias_set (type) : 0);
691 set_mem_align (slot, align);
693 /* If a type is specified, set the relevant flags. */
694 if (type != 0)
696 MEM_VOLATILE_P (slot) = TYPE_VOLATILE (type);
697 MEM_SET_IN_STRUCT_P (slot, (AGGREGATE_TYPE_P (type)
698 || TREE_CODE (type) == COMPLEX_TYPE));
700 MEM_NOTRAP_P (slot) = 1;
702 return slot;
705 /* Allocate a temporary stack slot and record it for possible later
706 reuse. First three arguments are same as in preceding function. */
708 rtx
709 assign_stack_temp (enum machine_mode mode, HOST_WIDE_INT size, int keep)
711 return assign_stack_temp_for_type (mode, size, keep, NULL_TREE);
714 /* Assign a temporary.
715 If TYPE_OR_DECL is a decl, then we are doing it on behalf of the decl
716 and so that should be used in error messages. In either case, we
717 allocate space of the given type.
718 KEEP is as for assign_stack_temp.
719 MEMORY_REQUIRED is 1 if the result must be addressable stack memory;
720 it is 0 if a register is OK.
721 DONT_PROMOTE is 1 if we should not promote values in register
722 to wider modes. */
724 rtx
725 assign_temp (tree type_or_decl, int keep, int memory_required,
726 int dont_promote ATTRIBUTE_UNUSED)
728 tree type, decl;
729 enum machine_mode mode;
730 #ifdef PROMOTE_MODE
731 int unsignedp;
732 #endif
734 if (DECL_P (type_or_decl))
735 decl = type_or_decl, type = TREE_TYPE (decl);
736 else
737 decl = NULL, type = type_or_decl;
739 mode = TYPE_MODE (type);
740 #ifdef PROMOTE_MODE
741 unsignedp = TYPE_UNSIGNED (type);
742 #endif
744 if (mode == BLKmode || memory_required)
746 HOST_WIDE_INT size = int_size_in_bytes (type);
747 rtx tmp;
749 /* Zero-sized arrays are a GNU C extension. Set size to 1 to avoid
750 problems with allocating the stack space. */
751 if (size == 0)
752 size = 1;
754 /* Unfortunately, we don't yet know how to allocate variable-sized
755 temporaries. However, sometimes we can find a fixed upper limit on
756 the size, so try that instead. */
757 else if (size == -1)
758 size = max_int_size_in_bytes (type);
760 /* The size of the temporary may be too large to fit into an integer. */
761 /* ??? Not sure this should happen except for user silliness, so limit
762 this to things that aren't compiler-generated temporaries. The
763 rest of the time we'll die in assign_stack_temp_for_type. */
764 if (decl && size == -1
765 && TREE_CODE (TYPE_SIZE_UNIT (type)) == INTEGER_CST)
767 error ("size of variable %q+D is too large", decl);
768 size = 1;
771 tmp = assign_stack_temp_for_type (mode, size, keep, type);
772 return tmp;
775 #ifdef PROMOTE_MODE
776 if (! dont_promote)
777 mode = promote_mode (type, mode, &unsignedp, 0);
778 #endif
780 return gen_reg_rtx (mode);
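/* As an illustrative call (not taken from this file): a caller that
   needs an addressable temporary for TYPE, even if TYPE would otherwise
   fit in a register, might write

       rtx mem = assign_temp (type, 0, 1, 0);

   i.e. KEEP == 0, MEMORY_REQUIRED == 1 and DONT_PROMOTE == 0, following
   the parameter description above.  */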
783 /* Combine temporary stack slots which are adjacent on the stack.
785 This allows for better use of already allocated stack space. This is only
786 done for BLKmode slots because we can be sure that we won't have alignment
787 problems in this case. */
789 static void
790 combine_temp_slots (void)
792 struct temp_slot *p, *q, *next, *next_q;
793 int num_slots;
795 /* We can't combine slots, because the information about which slot
796 is in which alias set will be lost. */
797 if (flag_strict_aliasing)
798 return;
800 /* If there are a lot of temp slots, don't do anything unless
801 high levels of optimization are enabled. */
802 if (! flag_expensive_optimizations)
803 for (p = avail_temp_slots, num_slots = 0; p; p = p->next, num_slots++)
804 if (num_slots > 100 || (num_slots > 10 && optimize == 0))
805 return;
807 for (p = avail_temp_slots; p; p = next)
809 int delete_p = 0;
811 next = p->next;
813 if (GET_MODE (p->slot) != BLKmode)
814 continue;
816 for (q = p->next; q; q = next_q)
818 int delete_q = 0;
820 next_q = q->next;
822 if (GET_MODE (q->slot) != BLKmode)
823 continue;
825 if (p->base_offset + p->full_size == q->base_offset)
827 /* Q comes after P; combine Q into P. */
828 p->size += q->size;
829 p->full_size += q->full_size;
830 delete_q = 1;
832 else if (q->base_offset + q->full_size == p->base_offset)
834 /* P comes after Q; combine P into Q. */
835 q->size += p->size;
836 q->full_size += p->full_size;
837 delete_p = 1;
838 break;
840 if (delete_q)
841 cut_slot_from_list (q, &avail_temp_slots);
844 /* Either delete P or advance past it. */
845 if (delete_p)
846 cut_slot_from_list (p, &avail_temp_slots);
850 /* Find the temp slot corresponding to the object at address X. */
852 static struct temp_slot *
853 find_temp_slot_from_address (rtx x)
855 struct temp_slot *p;
856 rtx next;
857 int i;
859 for (i = max_slot_level (); i >= 0; i--)
860 for (p = *temp_slots_at_level (i); p; p = p->next)
862 if (XEXP (p->slot, 0) == x
863 || p->address == x
864 || (GET_CODE (x) == PLUS
865 && XEXP (x, 0) == virtual_stack_vars_rtx
866 && GET_CODE (XEXP (x, 1)) == CONST_INT
867 && INTVAL (XEXP (x, 1)) >= p->base_offset
868 && INTVAL (XEXP (x, 1)) < p->base_offset + p->full_size))
869 return p;
871 else if (p->address != 0 && GET_CODE (p->address) == EXPR_LIST)
872 for (next = p->address; next; next = XEXP (next, 1))
873 if (XEXP (next, 0) == x)
874 return p;
877 /* If we have a sum involving a register, see if it points to a temp
878 slot. */
879 if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 0))
880 && (p = find_temp_slot_from_address (XEXP (x, 0))) != 0)
881 return p;
882 else if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 1))
883 && (p = find_temp_slot_from_address (XEXP (x, 1))) != 0)
884 return p;
886 return 0;
889 /* Indicate that NEW is an alternate way of referring to the temp slot
890 that previously was known by OLD. */
892 void
893 update_temp_slot_address (rtx old, rtx new)
895 struct temp_slot *p;
897 if (rtx_equal_p (old, new))
898 return;
900 p = find_temp_slot_from_address (old);
902 /* If we didn't find one, see if OLD is a PLUS. If so, and NEW
903 is a register, see if one operand of the PLUS is a temporary
904 location. If so, NEW points into it. Otherwise, if both OLD and
905 NEW are a PLUS and there is a register in common between them,
906 try a recursive call on those values. */
907 if (p == 0)
909 if (GET_CODE (old) != PLUS)
910 return;
912 if (REG_P (new))
914 update_temp_slot_address (XEXP (old, 0), new);
915 update_temp_slot_address (XEXP (old, 1), new);
916 return;
918 else if (GET_CODE (new) != PLUS)
919 return;
921 if (rtx_equal_p (XEXP (old, 0), XEXP (new, 0)))
922 update_temp_slot_address (XEXP (old, 1), XEXP (new, 1));
923 else if (rtx_equal_p (XEXP (old, 1), XEXP (new, 0)))
924 update_temp_slot_address (XEXP (old, 0), XEXP (new, 1));
925 else if (rtx_equal_p (XEXP (old, 0), XEXP (new, 1)))
926 update_temp_slot_address (XEXP (old, 1), XEXP (new, 0));
927 else if (rtx_equal_p (XEXP (old, 1), XEXP (new, 1)))
928 update_temp_slot_address (XEXP (old, 0), XEXP (new, 0));
930 return;
933 /* Otherwise add an alias for the temp's address. */
934 else if (p->address == 0)
935 p->address = new;
936 else
938 if (GET_CODE (p->address) != EXPR_LIST)
939 p->address = gen_rtx_EXPR_LIST (VOIDmode, p->address, NULL_RTX);
941 p->address = gen_rtx_EXPR_LIST (VOIDmode, new, p->address);
945 /* If X could be a reference to a temporary slot, mark the fact that its
946 address was taken. */
948 void
949 mark_temp_addr_taken (rtx x)
951 struct temp_slot *p;
953 if (x == 0)
954 return;
956 /* If X is not in memory or is at a constant address, it cannot be in
957 a temporary slot. */
958 if (!MEM_P (x) || CONSTANT_P (XEXP (x, 0)))
959 return;
961 p = find_temp_slot_from_address (XEXP (x, 0));
962 if (p != 0)
963 p->addr_taken = 1;
966 /* If X could be a reference to a temporary slot, mark that slot as
967 belonging to the level one higher than the current level. If X
968 matched one of our slots, just mark that one. Otherwise, we can't
969 easily predict which it is, so upgrade all of them. Kept slots
970 need not be touched.
972 This is called when an ({...}) construct occurs and a statement
973 returns a value in memory. */
975 void
976 preserve_temp_slots (rtx x)
978 struct temp_slot *p = 0, *next;
980 /* If there is no result, we still might have some objects whose address
981 was taken, so we need to make sure they stay around. */
982 if (x == 0)
984 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
986 next = p->next;
988 if (p->addr_taken)
989 move_slot_to_level (p, temp_slot_level - 1);
992 return;
995 /* If X is a register that is being used as a pointer, see if we have
996 a temporary slot we know it points to. To be consistent with
997 the code below, we really should preserve all non-kept slots
998 if we can't find a match, but that seems to be much too costly. */
999 if (REG_P (x) && REG_POINTER (x))
1000 p = find_temp_slot_from_address (x);
1002 /* If X is not in memory or is at a constant address, it cannot be in
1003 a temporary slot, but it can contain something whose address was
1004 taken. */
1005 if (p == 0 && (!MEM_P (x) || CONSTANT_P (XEXP (x, 0))))
1007 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1009 next = p->next;
1011 if (p->addr_taken)
1012 move_slot_to_level (p, temp_slot_level - 1);
1015 return;
1018 /* First see if we can find a match. */
1019 if (p == 0)
1020 p = find_temp_slot_from_address (XEXP (x, 0));
1022 if (p != 0)
1024 /* Move everything at our level whose address was taken to our new
1025 level in case we used its address. */
1026 struct temp_slot *q;
1028 if (p->level == temp_slot_level)
1030 for (q = *temp_slots_at_level (temp_slot_level); q; q = next)
1032 next = q->next;
1034 if (p != q && q->addr_taken)
1035 move_slot_to_level (q, temp_slot_level - 1);
1038 move_slot_to_level (p, temp_slot_level - 1);
1039 p->addr_taken = 0;
1041 return;
1044 /* Otherwise, preserve all non-kept slots at this level. */
1045 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1047 next = p->next;
1049 if (!p->keep)
1050 move_slot_to_level (p, temp_slot_level - 1);
1054 /* Free all temporaries used so far. This is normally called at the
1055 end of generating code for a statement. */
1057 void
1058 free_temp_slots (void)
1060 struct temp_slot *p, *next;
1062 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1064 next = p->next;
1066 if (!p->keep)
1067 make_slot_available (p);
1070 combine_temp_slots ();
1073 /* Push deeper into the nesting level for stack temporaries. */
1075 void
1076 push_temp_slots (void)
1078 temp_slot_level++;
1081 /* Pop a temporary nesting level. All slots in use in the current level
1082 are freed. */
1084 void
1085 pop_temp_slots (void)
1087 struct temp_slot *p, *next;
1089 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1091 next = p->next;
1092 make_slot_available (p);
1095 combine_temp_slots ();
1097 temp_slot_level--;
1100 /* Initialize temporary slots. */
1102 void
1103 init_temp_slots (void)
1105 /* We have not allocated any temporaries yet. */
1106 avail_temp_slots = 0;
1107 used_temp_slots = 0;
1108 temp_slot_level = 0;
1111 /* These routines are responsible for converting virtual register references
1112 to the actual hard register references once RTL generation is complete.
1114 The following five variables are used for communication between the
1115 routines. They contain the offsets of the virtual registers from their
1116 respective hard registers. */
1118 static int in_arg_offset;
1119 static int var_offset;
1120 static int dynamic_offset;
1121 static int out_arg_offset;
1122 static int cfa_offset;
1124 /* In most machines, the stack pointer register is equivalent to the bottom
1125 of the stack. */
1127 #ifndef STACK_POINTER_OFFSET
1128 #define STACK_POINTER_OFFSET 0
1129 #endif
1131 /* If not defined, pick an appropriate default for the offset of dynamically
1132 allocated memory depending on the value of ACCUMULATE_OUTGOING_ARGS,
1133 REG_PARM_STACK_SPACE, and OUTGOING_REG_PARM_STACK_SPACE. */
1135 #ifndef STACK_DYNAMIC_OFFSET
1137 /* The bottom of the stack points to the actual arguments. If
1138 REG_PARM_STACK_SPACE is defined, this includes the space for the register
1139 parameters. However, if OUTGOING_REG_PARM_STACK_SPACE is not defined,
1140 stack space for register parameters is not pushed by the caller, but is
1141 rather part of the fixed stack areas and hence not included in
1142 `crtl->outgoing_args_size'. Nevertheless, we must allow
1143 for it when allocating stack dynamic objects. */
1145 #if defined(REG_PARM_STACK_SPACE)
1146 #define STACK_DYNAMIC_OFFSET(FNDECL) \
1147 ((ACCUMULATE_OUTGOING_ARGS \
1148 ? (crtl->outgoing_args_size \
1149 + (OUTGOING_REG_PARM_STACK_SPACE ((!(FNDECL) ? NULL_TREE : TREE_TYPE (FNDECL))) ? 0 \
1150 : REG_PARM_STACK_SPACE (FNDECL))) \
1151 : 0) + (STACK_POINTER_OFFSET))
1152 #else
1153 #define STACK_DYNAMIC_OFFSET(FNDECL) \
1154 ((ACCUMULATE_OUTGOING_ARGS ? crtl->outgoing_args_size : 0) \
1155 + (STACK_POINTER_OFFSET))
1156 #endif
1157 #endif
1160 /* Given a piece of RTX and a pointer to a HOST_WIDE_INT, if the RTX
1161 is a virtual register, return the equivalent hard register and set the
1162 offset indirectly through the pointer. Otherwise, return 0. */
1164 static rtx
1165 instantiate_new_reg (rtx x, HOST_WIDE_INT *poffset)
1167 rtx new;
1168 HOST_WIDE_INT offset;
1170 if (x == virtual_incoming_args_rtx)
1171 new = arg_pointer_rtx, offset = in_arg_offset;
1172 else if (x == virtual_stack_vars_rtx)
1173 new = frame_pointer_rtx, offset = var_offset;
1174 else if (x == virtual_stack_dynamic_rtx)
1175 new = stack_pointer_rtx, offset = dynamic_offset;
1176 else if (x == virtual_outgoing_args_rtx)
1177 new = stack_pointer_rtx, offset = out_arg_offset;
1178 else if (x == virtual_cfa_rtx)
1180 #ifdef FRAME_POINTER_CFA_OFFSET
1181 new = frame_pointer_rtx;
1182 #else
1183 new = arg_pointer_rtx;
1184 #endif
1185 offset = cfa_offset;
1187 else
1188 return NULL_RTX;
1190 *poffset = offset;
1191 return new;
1194 /* A subroutine of instantiate_virtual_regs, called via for_each_rtx.
1195 Instantiate any virtual registers present inside of *LOC. The expression
1196 is simplified, as much as possible, but is not to be considered "valid"
1197 in any sense implied by the target. If any change is made, set CHANGED
1198 to true. */
1200 static int
1201 instantiate_virtual_regs_in_rtx (rtx *loc, void *data)
1203 HOST_WIDE_INT offset;
1204 bool *changed = (bool *) data;
1205 rtx x, new;
1207 x = *loc;
1208 if (x == 0)
1209 return 0;
1211 switch (GET_CODE (x))
1213 case REG:
1214 new = instantiate_new_reg (x, &offset);
1215 if (new)
1217 *loc = plus_constant (new, offset);
1218 if (changed)
1219 *changed = true;
1221 return -1;
1223 case PLUS:
1224 new = instantiate_new_reg (XEXP (x, 0), &offset);
1225 if (new)
1227 new = plus_constant (new, offset);
1228 *loc = simplify_gen_binary (PLUS, GET_MODE (x), new, XEXP (x, 1));
1229 if (changed)
1230 *changed = true;
1231 return -1;
1234 /* FIXME -- from old code */
1235 /* If we have (plus (subreg (virtual-reg)) (const_int)), we know
1236 we can commute the PLUS and SUBREG because pointers into the
1237 frame are well-behaved. */
1238 break;
1240 default:
1241 break;
1244 return 0;
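/* To illustrate the rewrite performed above (a sketch; var_offset is
   computed in instantiate_virtual_regs below): an address such as

       (plus (reg virtual-stack-vars) (const_int 8))

   becomes, once simplify_gen_binary has folded the constants,

       (plus (reg frame-pointer) (const_int var_offset + 8))

   and a bare (reg virtual-stack-vars) operand becomes
   (plus (reg frame-pointer) (const_int var_offset)).  */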
1247 /* A subroutine of instantiate_virtual_regs_in_insn. Return true if X
1248 matches the predicate for insn CODE operand OPERAND. */
1250 static int
1251 safe_insn_predicate (int code, int operand, rtx x)
1253 const struct insn_operand_data *op_data;
1255 if (code < 0)
1256 return true;
1258 op_data = &insn_data[code].operand[operand];
1259 if (op_data->predicate == NULL)
1260 return true;
1262 return op_data->predicate (x, op_data->mode);
1265 /* A subroutine of instantiate_virtual_regs. Instantiate any virtual
1266 registers present inside of insn. The result will be a valid insn. */
1268 static void
1269 instantiate_virtual_regs_in_insn (rtx insn)
1271 HOST_WIDE_INT offset;
1272 int insn_code, i;
1273 bool any_change = false;
1274 rtx set, new, x, seq;
1276 /* There are some special cases to be handled first. */
1277 set = single_set (insn);
1278 if (set)
1280 /* We're allowed to assign to a virtual register. This is interpreted
1281 to mean that the underlying register gets assigned the inverse
1282 transformation. This is used, for example, in the handling of
1283 non-local gotos. */
1284 new = instantiate_new_reg (SET_DEST (set), &offset);
1285 if (new)
1287 start_sequence ();
1289 for_each_rtx (&SET_SRC (set), instantiate_virtual_regs_in_rtx, NULL);
1290 x = simplify_gen_binary (PLUS, GET_MODE (new), SET_SRC (set),
1291 GEN_INT (-offset));
1292 x = force_operand (x, new);
1293 if (x != new)
1294 emit_move_insn (new, x);
1296 seq = get_insns ();
1297 end_sequence ();
1299 emit_insn_before (seq, insn);
1300 delete_insn (insn);
1301 return;
1304 /* Handle a straight copy from a virtual register by generating a
1305 new add insn. The difference between this and falling through
1306 to the generic case is avoiding a new pseudo and eliminating a
1307 move insn in the initial rtl stream. */
1308 new = instantiate_new_reg (SET_SRC (set), &offset);
1309 if (new && offset != 0
1310 && REG_P (SET_DEST (set))
1311 && REGNO (SET_DEST (set)) > LAST_VIRTUAL_REGISTER)
1313 start_sequence ();
1315 x = expand_simple_binop (GET_MODE (SET_DEST (set)), PLUS,
1316 new, GEN_INT (offset), SET_DEST (set),
1317 1, OPTAB_LIB_WIDEN);
1318 if (x != SET_DEST (set))
1319 emit_move_insn (SET_DEST (set), x);
1321 seq = get_insns ();
1322 end_sequence ();
1324 emit_insn_before (seq, insn);
1325 delete_insn (insn);
1326 return;
1329 extract_insn (insn);
1330 insn_code = INSN_CODE (insn);
1332 /* Handle a plus involving a virtual register by determining if the
1333 operands remain valid if they're modified in place. */
1334 if (GET_CODE (SET_SRC (set)) == PLUS
1335 && recog_data.n_operands >= 3
1336 && recog_data.operand_loc[1] == &XEXP (SET_SRC (set), 0)
1337 && recog_data.operand_loc[2] == &XEXP (SET_SRC (set), 1)
1338 && GET_CODE (recog_data.operand[2]) == CONST_INT
1339 && (new = instantiate_new_reg (recog_data.operand[1], &offset)))
1341 offset += INTVAL (recog_data.operand[2]);
1343 /* If the sum is zero, then replace with a plain move. */
1344 if (offset == 0
1345 && REG_P (SET_DEST (set))
1346 && REGNO (SET_DEST (set)) > LAST_VIRTUAL_REGISTER)
1348 start_sequence ();
1349 emit_move_insn (SET_DEST (set), new);
1350 seq = get_insns ();
1351 end_sequence ();
1353 emit_insn_before (seq, insn);
1354 delete_insn (insn);
1355 return;
1358 x = gen_int_mode (offset, recog_data.operand_mode[2]);
1360 /* Using validate_change and apply_change_group here leaves
1361 recog_data in an invalid state. Since we know exactly what
1362 we want to check, do those two by hand. */
1363 if (safe_insn_predicate (insn_code, 1, new)
1364 && safe_insn_predicate (insn_code, 2, x))
1366 *recog_data.operand_loc[1] = recog_data.operand[1] = new;
1367 *recog_data.operand_loc[2] = recog_data.operand[2] = x;
1368 any_change = true;
1370 /* Fall through into the regular operand fixup loop in
1371 order to take care of operands other than 1 and 2. */
1375 else
1377 extract_insn (insn);
1378 insn_code = INSN_CODE (insn);
1381 /* In the general case, we expect virtual registers to appear only in
1382 operands, and then only as either bare registers or inside memories. */
1383 for (i = 0; i < recog_data.n_operands; ++i)
1385 x = recog_data.operand[i];
1386 switch (GET_CODE (x))
1388 case MEM:
1390 rtx addr = XEXP (x, 0);
1391 bool changed = false;
1393 for_each_rtx (&addr, instantiate_virtual_regs_in_rtx, &changed);
1394 if (!changed)
1395 continue;
1397 start_sequence ();
1398 x = replace_equiv_address (x, addr);
1399 /* It may happen that the address with the virtual reg
1400 was valid (e.g. based on the virtual stack reg, which might
1401 be acceptable to the predicates with all offsets), whereas
1402 the address now isn't anymore, for instance when the address
1403 is still offsetted, but the base reg isn't virtual-stack-reg
1404 anymore. Below we would do a force_reg on the whole operand,
1405 but this insn might actually only accept memory. Hence,
1406 before doing that last resort, try to reload the address into
1407 a register, so this operand stays a MEM. */
1408 if (!safe_insn_predicate (insn_code, i, x))
1410 addr = force_reg (GET_MODE (addr), addr);
1411 x = replace_equiv_address (x, addr);
1413 seq = get_insns ();
1414 end_sequence ();
1415 if (seq)
1416 emit_insn_before (seq, insn);
1418 break;
1420 case REG:
1421 new = instantiate_new_reg (x, &offset);
1422 if (new == NULL)
1423 continue;
1424 if (offset == 0)
1425 x = new;
1426 else
1428 start_sequence ();
1430 /* Careful, special mode predicates may have stuff in
1431 insn_data[insn_code].operand[i].mode that isn't useful
1432 to us for computing a new value. */
1433 /* ??? Recognize address_operand and/or "p" constraints
1434 to see if (plus new offset) is a valid address before we put
1435 this through expand_simple_binop. */
1436 x = expand_simple_binop (GET_MODE (x), PLUS, new,
1437 GEN_INT (offset), NULL_RTX,
1438 1, OPTAB_LIB_WIDEN);
1439 seq = get_insns ();
1440 end_sequence ();
1441 emit_insn_before (seq, insn);
1443 break;
1445 case SUBREG:
1446 new = instantiate_new_reg (SUBREG_REG (x), &offset);
1447 if (new == NULL)
1448 continue;
1449 if (offset != 0)
1451 start_sequence ();
1452 new = expand_simple_binop (GET_MODE (new), PLUS, new,
1453 GEN_INT (offset), NULL_RTX,
1454 1, OPTAB_LIB_WIDEN);
1455 seq = get_insns ();
1456 end_sequence ();
1457 emit_insn_before (seq, insn);
1459 x = simplify_gen_subreg (recog_data.operand_mode[i], new,
1460 GET_MODE (new), SUBREG_BYTE (x));
1461 break;
1463 default:
1464 continue;
1467 /* At this point, X contains the new value for the operand.
1468 Validate the new value vs the insn predicate. Note that
1469 asm insns will have insn_code -1 here. */
1470 if (!safe_insn_predicate (insn_code, i, x))
1472 start_sequence ();
1473 x = force_reg (insn_data[insn_code].operand[i].mode, x);
1474 seq = get_insns ();
1475 end_sequence ();
1476 if (seq)
1477 emit_insn_before (seq, insn);
1480 *recog_data.operand_loc[i] = recog_data.operand[i] = x;
1481 any_change = true;
1484 if (any_change)
1486 /* Propagate operand changes into the duplicates. */
1487 for (i = 0; i < recog_data.n_dups; ++i)
1488 *recog_data.dup_loc[i]
1489 = copy_rtx (recog_data.operand[(unsigned)recog_data.dup_num[i]]);
1491 /* Force re-recognition of the instruction for validation. */
1492 INSN_CODE (insn) = -1;
1495 if (asm_noperands (PATTERN (insn)) >= 0)
1497 if (!check_asm_operands (PATTERN (insn)))
1499 error_for_asm (insn, "impossible constraint in %<asm%>");
1500 delete_insn (insn);
1503 else
1505 if (recog_memoized (insn) < 0)
1506 fatal_insn_not_found (insn);
1510 /* Subroutine of instantiate_decls. Given RTL representing a decl,
1511 do any instantiation required. */
1513 void
1514 instantiate_decl_rtl (rtx x)
1516 rtx addr;
1518 if (x == 0)
1519 return;
1521 /* If this is a CONCAT, recurse for the pieces. */
1522 if (GET_CODE (x) == CONCAT)
1524 instantiate_decl_rtl (XEXP (x, 0));
1525 instantiate_decl_rtl (XEXP (x, 1));
1526 return;
1529 /* If this is not a MEM, no need to do anything. Similarly if the
1530 address is a constant or a register that is not a virtual register. */
1531 if (!MEM_P (x))
1532 return;
1534 addr = XEXP (x, 0);
1535 if (CONSTANT_P (addr)
1536 || (REG_P (addr)
1537 && (REGNO (addr) < FIRST_VIRTUAL_REGISTER
1538 || REGNO (addr) > LAST_VIRTUAL_REGISTER)))
1539 return;
1541 for_each_rtx (&XEXP (x, 0), instantiate_virtual_regs_in_rtx, NULL);
1544 /* Helper for instantiate_decls called via walk_tree: Process all decls
1545 in the given DECL_VALUE_EXPR. */
1547 static tree
1548 instantiate_expr (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
1550 tree t = *tp;
1551 if (! EXPR_P (t) && ! GIMPLE_STMT_P (t))
1553 *walk_subtrees = 0;
1554 if (DECL_P (t) && DECL_RTL_SET_P (t))
1555 instantiate_decl_rtl (DECL_RTL (t));
1557 return NULL;
1560 /* Subroutine of instantiate_decls: Process all decls in the given
1561 BLOCK node and all its subblocks. */
1563 static void
1564 instantiate_decls_1 (tree let)
1566 tree t;
1568 for (t = BLOCK_VARS (let); t; t = TREE_CHAIN (t))
1570 if (DECL_RTL_SET_P (t))
1571 instantiate_decl_rtl (DECL_RTL (t));
1572 if (TREE_CODE (t) == VAR_DECL && DECL_HAS_VALUE_EXPR_P (t))
1574 tree v = DECL_VALUE_EXPR (t);
1575 walk_tree (&v, instantiate_expr, NULL, NULL);
1579 /* Process all subblocks. */
1580 for (t = BLOCK_SUBBLOCKS (let); t; t = BLOCK_CHAIN (t))
1581 instantiate_decls_1 (t);
1584 /* Scan all decls in FNDECL (both variables and parameters) and instantiate
1585 all virtual registers in their DECL_RTL's. */
1587 static void
1588 instantiate_decls (tree fndecl)
1590 tree decl;
1592 /* Process all parameters of the function. */
1593 for (decl = DECL_ARGUMENTS (fndecl); decl; decl = TREE_CHAIN (decl))
1595 instantiate_decl_rtl (DECL_RTL (decl));
1596 instantiate_decl_rtl (DECL_INCOMING_RTL (decl));
1597 if (DECL_HAS_VALUE_EXPR_P (decl))
1599 tree v = DECL_VALUE_EXPR (decl);
1600 walk_tree (&v, instantiate_expr, NULL, NULL);
1604 /* Now process all variables defined in the function or its subblocks. */
1605 instantiate_decls_1 (DECL_INITIAL (fndecl));
1608 /* Pass through the INSNS of function FNDECL and convert virtual register
1609 references to hard register references. */
1611 static unsigned int
1612 instantiate_virtual_regs (void)
1614 rtx insn;
1616 /* Compute the offsets to use for this function. */
1617 in_arg_offset = FIRST_PARM_OFFSET (current_function_decl);
1618 var_offset = STARTING_FRAME_OFFSET;
1619 dynamic_offset = STACK_DYNAMIC_OFFSET (current_function_decl);
1620 out_arg_offset = STACK_POINTER_OFFSET;
1621 #ifdef FRAME_POINTER_CFA_OFFSET
1622 cfa_offset = FRAME_POINTER_CFA_OFFSET (current_function_decl);
1623 #else
1624 cfa_offset = ARG_POINTER_CFA_OFFSET (current_function_decl);
1625 #endif
1627 /* Initialize recognition, indicating that volatile is OK. */
1628 init_recog ();
1630 /* Scan through all the insns, instantiating every virtual register still
1631 present. */
1632 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
1633 if (INSN_P (insn))
1635 /* These patterns in the instruction stream can never be recognized.
1636 Fortunately, they shouldn't contain virtual registers either. */
1637 if (GET_CODE (PATTERN (insn)) == USE
1638 || GET_CODE (PATTERN (insn)) == CLOBBER
1639 || GET_CODE (PATTERN (insn)) == ADDR_VEC
1640 || GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC
1641 || GET_CODE (PATTERN (insn)) == ASM_INPUT)
1642 continue;
1644 instantiate_virtual_regs_in_insn (insn);
1646 if (INSN_DELETED_P (insn))
1647 continue;
1649 for_each_rtx (&REG_NOTES (insn), instantiate_virtual_regs_in_rtx, NULL);
1651 /* Instantiate any virtual registers in CALL_INSN_FUNCTION_USAGE. */
1652 if (GET_CODE (insn) == CALL_INSN)
1653 for_each_rtx (&CALL_INSN_FUNCTION_USAGE (insn),
1654 instantiate_virtual_regs_in_rtx, NULL);
1657 /* Instantiate the virtual registers in the DECLs for debugging purposes. */
1658 instantiate_decls (current_function_decl);
1660 targetm.instantiate_decls ();
1662 /* Indicate that, from now on, assign_stack_local should use
1663 frame_pointer_rtx. */
1664 virtuals_instantiated = 1;
1665 return 0;
1668 struct rtl_opt_pass pass_instantiate_virtual_regs =
1671 RTL_PASS,
1672 "vregs", /* name */
1673 NULL, /* gate */
1674 instantiate_virtual_regs, /* execute */
1675 NULL, /* sub */
1676 NULL, /* next */
1677 0, /* static_pass_number */
1678 0, /* tv_id */
1679 0, /* properties_required */
1680 0, /* properties_provided */
1681 0, /* properties_destroyed */
1682 0, /* todo_flags_start */
1683 TODO_dump_func /* todo_flags_finish */
1688 /* Return 1 if EXP is an aggregate type (or a value with aggregate type).
1689 This means a type for which function calls must pass an address to the
1690 function or get an address back from the function.
1691 EXP may be a type node or an expression (whose type is tested). */
1693 int
1694 aggregate_value_p (const_tree exp, const_tree fntype)
1696 int i, regno, nregs;
1697 rtx reg;
1699 const_tree type = (TYPE_P (exp)) ? exp : TREE_TYPE (exp);
1701 /* DECL node associated with FNTYPE when relevant, which we might need to
1702 check for by-invisible-reference returns, typically for CALL_EXPR input
1703 EXPressions. */
1704 const_tree fndecl = NULL_TREE;
1706 if (fntype)
1707 switch (TREE_CODE (fntype))
1709 case CALL_EXPR:
1710 fndecl = get_callee_fndecl (fntype);
1711 fntype = fndecl ? TREE_TYPE (fndecl) : 0;
1712 break;
1713 case FUNCTION_DECL:
1714 fndecl = fntype;
1715 fntype = TREE_TYPE (fndecl);
1716 break;
1717 case FUNCTION_TYPE:
1718 case METHOD_TYPE:
1719 break;
1720 case IDENTIFIER_NODE:
1721 fntype = 0;
1722 break;
1723 default:
1724 /* We don't expect other tree codes here. */
1725 gcc_unreachable ();
1728 if (TREE_CODE (type) == VOID_TYPE)
1729 return 0;
1731 /* If the front end has decided that this needs to be passed by
1732 reference, do so. */
1733 if ((TREE_CODE (exp) == PARM_DECL || TREE_CODE (exp) == RESULT_DECL)
1734 && DECL_BY_REFERENCE (exp))
1735 return 1;
1737 /* If the EXPression is a CALL_EXPR, honor DECL_BY_REFERENCE set on the
1738 called function RESULT_DECL, meaning the function returns in memory by
1739 invisible reference. This check lets front-ends not set TREE_ADDRESSABLE
1740 on the function type, which used to be the way to request such a return
1741 mechanism but might now be causing troubles at gimplification time if
1742 temporaries with the function type need to be created. */
1743 if (TREE_CODE (exp) == CALL_EXPR && fndecl && DECL_RESULT (fndecl)
1744 && DECL_BY_REFERENCE (DECL_RESULT (fndecl)))
1745 return 1;
1747 if (targetm.calls.return_in_memory (type, fntype))
1748 return 1;
1749 /* Types that are TREE_ADDRESSABLE must be constructed in memory,
1750 and thus can't be returned in registers. */
1751 if (TREE_ADDRESSABLE (type))
1752 return 1;
1753 if (flag_pcc_struct_return && AGGREGATE_TYPE_P (type))
1754 return 1;
1755 /* Make sure we have suitable call-clobbered regs to return
1756 the value in; if not, we must return it in memory. */
1757 reg = hard_function_value (type, 0, fntype, 0);
1759 /* If we have something other than a REG (e.g. a PARALLEL), then assume
1760 it is OK. */
1761 if (!REG_P (reg))
1762 return 0;
1764 regno = REGNO (reg);
1765 nregs = hard_regno_nregs[regno][TYPE_MODE (type)];
1766 for (i = 0; i < nregs; i++)
1767 if (! call_used_regs[regno + i])
1768 return 1;
1769 return 0;
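/* As used later in this file (see assign_parms_augmented_arg_list), a
   typical query is

       if (aggregate_value_p (DECL_RESULT (fndecl), fndecl))
         ... arrange for a hidden return-slot pointer argument ...

   so, for example, a structure the target cannot return in registers
   answers 1, while a plain scalar normally answers 0.  */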
1772 /* Return true if we should assign DECL a pseudo register; false if it
1773 should live on the local stack. */
1775 bool
1776 use_register_for_decl (const_tree decl)
1778 if (!targetm.calls.allocate_stack_slots_for_args())
1779 return true;
1781 /* Honor volatile. */
1782 if (TREE_SIDE_EFFECTS (decl))
1783 return false;
1785 /* Honor addressability. */
1786 if (TREE_ADDRESSABLE (decl))
1787 return false;
1789 /* Only register-like things go in registers. */
1790 if (DECL_MODE (decl) == BLKmode)
1791 return false;
1793 /* If -ffloat-store specified, don't put explicit float variables
1794 into registers. */
1795 /* ??? This should be checked after DECL_ARTIFICIAL, but tree-ssa
1796 propagates values across these stores, and it probably shouldn't. */
1797 if (flag_float_store && FLOAT_TYPE_P (TREE_TYPE (decl)))
1798 return false;
1800 /* If we're not interested in tracking debugging information for
1801 this decl, then we can certainly put it in a register. */
1802 if (DECL_IGNORED_P (decl))
1803 return true;
1805 return (optimize || DECL_REGISTER (decl));
1808 /* Return true if TYPE should be passed by invisible reference. */
1810 bool
1811 pass_by_reference (CUMULATIVE_ARGS *ca, enum machine_mode mode,
1812 tree type, bool named_arg)
1814 if (type)
1816 /* If this type contains non-trivial constructors, then it is
1817 forbidden for the middle-end to create any new copies. */
1818 if (TREE_ADDRESSABLE (type))
1819 return true;
1821 /* GCC post 3.4 passes *all* variable sized types by reference. */
1822 if (!TYPE_SIZE (type) || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
1823 return true;
1826 return targetm.calls.pass_by_reference (ca, mode, type, named_arg);
1829 /* Return true if TYPE, which is passed by reference, should be callee
1830 copied instead of caller copied. */
1832 bool
1833 reference_callee_copied (CUMULATIVE_ARGS *ca, enum machine_mode mode,
1834 tree type, bool named_arg)
1836 if (type && TREE_ADDRESSABLE (type))
1837 return false;
1838 return targetm.calls.callee_copies (ca, mode, type, named_arg);
1841 /* Structures to communicate between the subroutines of assign_parms.
1842 The first holds data persistent across all parameters, the second
1843 is cleared out for each parameter. */
1845 struct assign_parm_data_all
1847 CUMULATIVE_ARGS args_so_far;
1848 struct args_size stack_args_size;
1849 tree function_result_decl;
1850 tree orig_fnargs;
1851 rtx first_conversion_insn;
1852 rtx last_conversion_insn;
1853 HOST_WIDE_INT pretend_args_size;
1854 HOST_WIDE_INT extra_pretend_bytes;
1855 int reg_parm_stack_space;
1858 struct assign_parm_data_one
1860 tree nominal_type;
1861 tree passed_type;
1862 rtx entry_parm;
1863 rtx stack_parm;
1864 enum machine_mode nominal_mode;
1865 enum machine_mode passed_mode;
1866 enum machine_mode promoted_mode;
1867 struct locate_and_pad_arg_data locate;
1868 int partial;
1869 BOOL_BITFIELD named_arg : 1;
1870 BOOL_BITFIELD passed_pointer : 1;
1871 BOOL_BITFIELD on_stack : 1;
1872 BOOL_BITFIELD loaded_in_reg : 1;
1875 /* A subroutine of assign_parms. Initialize ALL. */
1877 static void
1878 assign_parms_initialize_all (struct assign_parm_data_all *all)
1880 tree fntype;
1882 memset (all, 0, sizeof (*all));
1884 fntype = TREE_TYPE (current_function_decl);
1886 #ifdef INIT_CUMULATIVE_INCOMING_ARGS
1887 INIT_CUMULATIVE_INCOMING_ARGS (all->args_so_far, fntype, NULL_RTX);
1888 #else
1889 INIT_CUMULATIVE_ARGS (all->args_so_far, fntype, NULL_RTX,
1890 current_function_decl, -1);
1891 #endif
1893 #ifdef REG_PARM_STACK_SPACE
1894 all->reg_parm_stack_space = REG_PARM_STACK_SPACE (current_function_decl);
1895 #endif
1898 /* If ARGS contains entries with complex types, split the entry into two
1899 entries of the component type. Return a new list if substitutions are
1900 needed, else the old list. */
1902 static tree
1903 split_complex_args (tree args)
1905 tree p;
1907 /* Before allocating memory, check for the common case of no complex args. */
1908 for (p = args; p; p = TREE_CHAIN (p))
1910 tree type = TREE_TYPE (p);
1911 if (TREE_CODE (type) == COMPLEX_TYPE
1912 && targetm.calls.split_complex_arg (type))
1913 goto found;
1915 return args;
1917 found:
1918 args = copy_list (args);
1920 for (p = args; p; p = TREE_CHAIN (p))
1922 tree type = TREE_TYPE (p);
1923 if (TREE_CODE (type) == COMPLEX_TYPE
1924 && targetm.calls.split_complex_arg (type))
1926 tree decl;
1927 tree subtype = TREE_TYPE (type);
1928 bool addressable = TREE_ADDRESSABLE (p);
1930 /* Rewrite the PARM_DECL's type with its component. */
1931 TREE_TYPE (p) = subtype;
1932 DECL_ARG_TYPE (p) = TREE_TYPE (DECL_ARG_TYPE (p));
1933 DECL_MODE (p) = VOIDmode;
1934 DECL_SIZE (p) = NULL;
1935 DECL_SIZE_UNIT (p) = NULL;
1936 /* If this arg must go in memory, put it in a pseudo here.
1937 We can't allow it to go in memory as per normal parms,
1938 because the usual place might not have the imag part
1939 adjacent to the real part. */
1940 DECL_ARTIFICIAL (p) = addressable;
1941 DECL_IGNORED_P (p) = addressable;
1942 TREE_ADDRESSABLE (p) = 0;
1943 layout_decl (p, 0);
1945 /* Build a second synthetic decl. */
1946 decl = build_decl (PARM_DECL, NULL_TREE, subtype);
1947 DECL_ARG_TYPE (decl) = DECL_ARG_TYPE (p);
1948 DECL_ARTIFICIAL (decl) = addressable;
1949 DECL_IGNORED_P (decl) = addressable;
1950 layout_decl (decl, 0);
1952 /* Splice it in; skip the new decl. */
1953 TREE_CHAIN (decl) = TREE_CHAIN (p);
1954 TREE_CHAIN (p) = decl;
1955 p = decl;
1959 return args;
1962 /* A subroutine of assign_parms. Adjust the parameter list to incorporate
1963 the hidden struct return argument, and (abi willing) complex args.
1964 Return the new parameter list. */
1966 static tree
1967 assign_parms_augmented_arg_list (struct assign_parm_data_all *all)
1969 tree fndecl = current_function_decl;
1970 tree fntype = TREE_TYPE (fndecl);
1971 tree fnargs = DECL_ARGUMENTS (fndecl);
1973 /* If struct value address is treated as the first argument, make it so. */
1974 if (aggregate_value_p (DECL_RESULT (fndecl), fndecl)
1975 && ! cfun->returns_pcc_struct
1976 && targetm.calls.struct_value_rtx (TREE_TYPE (fndecl), 1) == 0)
1978 tree type = build_pointer_type (TREE_TYPE (fntype));
1979 tree decl;
1981 decl = build_decl (PARM_DECL, NULL_TREE, type);
1982 DECL_ARG_TYPE (decl) = type;
1983 DECL_ARTIFICIAL (decl) = 1;
1984 DECL_IGNORED_P (decl) = 1;
1986 TREE_CHAIN (decl) = fnargs;
1987 fnargs = decl;
1988 all->function_result_decl = decl;
1991 all->orig_fnargs = fnargs;
1993 /* If the target wants to split complex arguments into scalars, do so. */
1994 if (targetm.calls.split_complex_arg)
1995 fnargs = split_complex_args (fnargs);
1997 return fnargs;
2000 /* A subroutine of assign_parms. Examine PARM and pull out type and mode
2001 data for the parameter. Incorporate ABI specifics such as pass-by-
2002 reference and type promotion. */
2004 static void
2005 assign_parm_find_data_types (struct assign_parm_data_all *all, tree parm,
2006 struct assign_parm_data_one *data)
2008 tree nominal_type, passed_type;
2009 enum machine_mode nominal_mode, passed_mode, promoted_mode;
2011 memset (data, 0, sizeof (*data));
2014   /* NAMED_ARG is a misnomer.  We really mean 'non-variadic'.  */
2014   if (!cfun->stdarg)
2015     data->named_arg = 1;  /* No variadic parms.  */
2016   else if (TREE_CHAIN (parm))
2017     data->named_arg = 1;  /* Not the last non-variadic parm.  */
2018   else if (targetm.calls.strict_argument_naming (&all->args_so_far))
2019     data->named_arg = 1;  /* Only variadic ones are unnamed.  */
2020   else
2021     data->named_arg = 0;  /* Treat as variadic.  */
2023 nominal_type = TREE_TYPE (parm);
2024 passed_type = DECL_ARG_TYPE (parm);
2026 /* Look out for errors propagating this far. Also, if the parameter's
2027 type is void then its value doesn't matter. */
2028 if (TREE_TYPE (parm) == error_mark_node
2029 /* This can happen after weird syntax errors
2030 or if an enum type is defined among the parms. */
2031 || TREE_CODE (parm) != PARM_DECL
2032 || passed_type == NULL
2033 || VOID_TYPE_P (nominal_type))
2035 nominal_type = passed_type = void_type_node;
2036 nominal_mode = passed_mode = promoted_mode = VOIDmode;
2037 goto egress;
2040 /* Find mode of arg as it is passed, and mode of arg as it should be
2041 during execution of this function. */
2042 passed_mode = TYPE_MODE (passed_type);
2043 nominal_mode = TYPE_MODE (nominal_type);
2045 /* If the parm is to be passed as a transparent union, use the type of
2046 the first field for the tests below. We have already verified that
2047 the modes are the same. */
2048 if (TREE_CODE (passed_type) == UNION_TYPE
2049 && TYPE_TRANSPARENT_UNION (passed_type))
2050 passed_type = TREE_TYPE (TYPE_FIELDS (passed_type));
2052 /* See if this arg was passed by invisible reference. */
2053 if (pass_by_reference (&all->args_so_far, passed_mode,
2054 passed_type, data->named_arg))
2056 passed_type = nominal_type = build_pointer_type (passed_type);
2057 data->passed_pointer = true;
2058 passed_mode = nominal_mode = Pmode;
2061 /* Find mode as it is passed by the ABI. */
2062 promoted_mode = passed_mode;
2063 if (targetm.calls.promote_function_args (TREE_TYPE (current_function_decl)))
2065 int unsignedp = TYPE_UNSIGNED (passed_type);
2066 promoted_mode = promote_mode (passed_type, promoted_mode,
2067 &unsignedp, 1);
2070 egress:
2071 data->nominal_type = nominal_type;
2072 data->passed_type = passed_type;
2073 data->nominal_mode = nominal_mode;
2074 data->passed_mode = passed_mode;
2075 data->promoted_mode = promoted_mode;
2078 /* A subroutine of assign_parms. Invoke setup_incoming_varargs. */
2080 static void
2081 assign_parms_setup_varargs (struct assign_parm_data_all *all,
2082 struct assign_parm_data_one *data, bool no_rtl)
2084 int varargs_pretend_bytes = 0;
2086 targetm.calls.setup_incoming_varargs (&all->args_so_far,
2087 data->promoted_mode,
2088 data->passed_type,
2089 &varargs_pretend_bytes, no_rtl);
2091 /* If the back-end has requested extra stack space, record how much is
2092 needed. Do not change pretend_args_size otherwise since it may be
2093 nonzero from an earlier partial argument. */
2094 if (varargs_pretend_bytes > 0)
2095 all->pretend_args_size = varargs_pretend_bytes;
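     /* A concrete sketch of the numbers involved (hypothetical target, not a
        statement about any particular port): if the ABI passes the first six
        integer arguments in registers and the named arguments of a stdarg
        function consume two of them, the hook may ask for the remaining four
        register slots to be dumped to the stack, i.e.

            varargs_pretend_bytes == 4 * UNITS_PER_WORD

        so that the unnamed arguments can then be walked contiguously in
        memory.  */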
2098 /* A subroutine of assign_parms. Set DATA->ENTRY_PARM corresponding to
2099 the incoming location of the current parameter. */
2101 static void
2102 assign_parm_find_entry_rtl (struct assign_parm_data_all *all,
2103 struct assign_parm_data_one *data)
2105 HOST_WIDE_INT pretend_bytes = 0;
2106 rtx entry_parm;
2107 bool in_regs;
2109 if (data->promoted_mode == VOIDmode)
2111 data->entry_parm = data->stack_parm = const0_rtx;
2112 return;
2115 #ifdef FUNCTION_INCOMING_ARG
2116 entry_parm = FUNCTION_INCOMING_ARG (all->args_so_far, data->promoted_mode,
2117 data->passed_type, data->named_arg);
2118 #else
2119 entry_parm = FUNCTION_ARG (all->args_so_far, data->promoted_mode,
2120 data->passed_type, data->named_arg);
2121 #endif
2123 if (entry_parm == 0)
2124 data->promoted_mode = data->passed_mode;
2126 /* Determine parm's home in the stack, in case it arrives in the stack
2127 or we should pretend it did. Compute the stack position and rtx where
2128 the argument arrives and its size.
2130 There is one complexity here: If this was a parameter that would
2131 have been passed in registers, but wasn't only because it is
2132 __builtin_va_alist, we want locate_and_pad_parm to treat it as if
2133 it came in a register so that REG_PARM_STACK_SPACE isn't skipped.
2134 In this case, we call FUNCTION_ARG with NAMED set to 1 instead of 0
2135 as it was the previous time. */
2136 in_regs = entry_parm != 0;
2137 #ifdef STACK_PARMS_IN_REG_PARM_AREA
2138 in_regs = true;
2139 #endif
2140 if (!in_regs && !data->named_arg)
2142 if (targetm.calls.pretend_outgoing_varargs_named (&all->args_so_far))
2144 rtx tem;
2145 #ifdef FUNCTION_INCOMING_ARG
2146 tem = FUNCTION_INCOMING_ARG (all->args_so_far, data->promoted_mode,
2147 data->passed_type, true);
2148 #else
2149 tem = FUNCTION_ARG (all->args_so_far, data->promoted_mode,
2150 data->passed_type, true);
2151 #endif
2152 in_regs = tem != NULL;
2156 /* If this parameter was passed both in registers and in the stack, use
2157 the copy on the stack. */
2158 if (targetm.calls.must_pass_in_stack (data->promoted_mode,
2159 data->passed_type))
2160 entry_parm = 0;
2162 if (entry_parm)
2164 int partial;
2166 partial = targetm.calls.arg_partial_bytes (&all->args_so_far,
2167 data->promoted_mode,
2168 data->passed_type,
2169 data->named_arg);
2170 data->partial = partial;
2172 /* The caller might already have allocated stack space for the
2173 register parameters. */
2174 if (partial != 0 && all->reg_parm_stack_space == 0)
2176 /* Part of this argument is passed in registers and part
2177 is passed on the stack. Ask the prologue code to extend
2178 the stack part so that we can recreate the full value.
2180 PRETEND_BYTES is the size of the registers we need to store.
2181 CURRENT_FUNCTION_PRETEND_ARGS_SIZE is the amount of extra
2182 stack space that the prologue should allocate.
2184 Internally, gcc assumes that the argument pointer is aligned
2185 to STACK_BOUNDARY bits. This is used both for alignment
2186 optimizations (see init_emit) and to locate arguments that are
2187 aligned to more than PARM_BOUNDARY bits. We must preserve this
2188 invariant by rounding CURRENT_FUNCTION_PRETEND_ARGS_SIZE up to
2189 a stack boundary. */
2191 /* We assume at most one partial arg, and it must be the first
2192 argument on the stack. */
2193 gcc_assert (!all->extra_pretend_bytes && !all->pretend_args_size);
2195 pretend_bytes = partial;
2196 all->pretend_args_size = CEIL_ROUND (pretend_bytes, STACK_BYTES);
2198 /* We want to align relative to the actual stack pointer, so
2199 don't include this in the stack size until later. */
2200 all->extra_pretend_bytes = all->pretend_args_size;
2204 locate_and_pad_parm (data->promoted_mode, data->passed_type, in_regs,
2205 entry_parm ? data->partial : 0, current_function_decl,
2206 &all->stack_args_size, &data->locate);
2208 /* Adjust offsets to include the pretend args. */
2209 pretend_bytes = all->extra_pretend_bytes - pretend_bytes;
2210 data->locate.slot_offset.constant += pretend_bytes;
2211 data->locate.offset.constant += pretend_bytes;
2213 data->entry_parm = entry_parm;
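   /* A minimal worked example of the rounding above (hypothetical numbers):
      with UNITS_PER_WORD == 4 and STACK_BOUNDARY == 64 (so STACK_BYTES == 8),
      an argument whose first 12 bytes arrive in registers gives

          pretend_bytes          == 12
          all->pretend_args_size == CEIL_ROUND (12, 8)
                                 == (12 + 8 - 1) & ~(8 - 1) == 16

      so the prologue allocates 16 bytes of pretend args, preserving the
      STACK_BOUNDARY alignment of the argument pointer even though only 12
      bytes are needed to reconstruct the register part.  */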
2216 /* A subroutine of assign_parms. If there is actually space on the stack
2217 for this parm, count it in stack_args_size and return true. */
2219 static bool
2220 assign_parm_is_stack_parm (struct assign_parm_data_all *all,
2221 struct assign_parm_data_one *data)
2223 /* Trivially true if we've no incoming register. */
2224 if (data->entry_parm == NULL)
2226 /* Also true if we're partially in registers and partially not,
2227 since we've arranged to drop the entire argument on the stack. */
2228 else if (data->partial != 0)
2230 /* Also true if the target says that it's passed in both registers
2231 and on the stack. */
2232 else if (GET_CODE (data->entry_parm) == PARALLEL
2233 && XEXP (XVECEXP (data->entry_parm, 0, 0), 0) == NULL_RTX)
2235 /* Also true if the target says that there's stack allocated for
2236 all register parameters. */
2237 else if (all->reg_parm_stack_space > 0)
2239 /* Otherwise, no, this parameter has no ABI defined stack slot. */
2240 else
2241 return false;
2243 all->stack_args_size.constant += data->locate.size.constant;
2244 if (data->locate.size.var)
2245 ADD_PARM_SIZE (all->stack_args_size, data->locate.size.var);
2247 return true;
2250 /* A subroutine of assign_parms. Given that this parameter is allocated
2251 stack space by the ABI, find it. */
2253 static void
2254 assign_parm_find_stack_rtl (tree parm, struct assign_parm_data_one *data)
2256 rtx offset_rtx, stack_parm;
2257 unsigned int align, boundary;
2259 /* If we're passing this arg using a reg, make its stack home the
2260 aligned stack slot. */
2261 if (data->entry_parm)
2262 offset_rtx = ARGS_SIZE_RTX (data->locate.slot_offset);
2263 else
2264 offset_rtx = ARGS_SIZE_RTX (data->locate.offset);
2266 stack_parm = crtl->args.internal_arg_pointer;
2267 if (offset_rtx != const0_rtx)
2268 stack_parm = gen_rtx_PLUS (Pmode, stack_parm, offset_rtx);
2269 stack_parm = gen_rtx_MEM (data->promoted_mode, stack_parm);
2271 set_mem_attributes (stack_parm, parm, 1);
2273 boundary = data->locate.boundary;
2274 align = BITS_PER_UNIT;
2276 /* If we're padding upward, we know that the alignment of the slot
2277 is FUNCTION_ARG_BOUNDARY. If we're using slot_offset, we're
2278 intentionally forcing upward padding. Otherwise we have to come
2279 up with a guess at the alignment based on OFFSET_RTX. */
2280 if (data->locate.where_pad != downward || data->entry_parm)
2281 align = boundary;
2282 else if (GET_CODE (offset_rtx) == CONST_INT)
2284 align = INTVAL (offset_rtx) * BITS_PER_UNIT | boundary;
2285 align = align & -align;
2287 set_mem_align (stack_parm, align);
2289 if (data->entry_parm)
2290 set_reg_attrs_for_parm (data->entry_parm, stack_parm);
2292 data->stack_parm = stack_parm;
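   /* A short worked example of the alignment guess above (hypothetical
      values): with BOUNDARY == 64 bits and OFFSET_RTX == (const_int 4),

          align = 4 * BITS_PER_UNIT | 64  ==  32 | 64  ==  96
          align = align & -align          ==  32

      i.e. the strongest alignment that both the boundary and the byte
      offset can guarantee is the lowest set bit of their combination,
      here 32 bits.  */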
2295 /* A subroutine of assign_parms. Adjust DATA->ENTRY_RTL such that it's
2296 always valid and contiguous. */
2298 static void
2299 assign_parm_adjust_entry_rtl (struct assign_parm_data_one *data)
2301 rtx entry_parm = data->entry_parm;
2302 rtx stack_parm = data->stack_parm;
2304 /* If this parm was passed part in regs and part in memory, pretend it
2305 arrived entirely in memory by pushing the register-part onto the stack.
2306 In the special case of a DImode or DFmode that is split, we could put
2307 it together in a pseudoreg directly, but for now that's not worth
2308 bothering with. */
2309 if (data->partial != 0)
2311 /* Handle calls that pass values in multiple non-contiguous
2312 locations. The Irix 6 ABI has examples of this. */
2313 if (GET_CODE (entry_parm) == PARALLEL)
2314 emit_group_store (validize_mem (stack_parm), entry_parm,
2315 data->passed_type,
2316 int_size_in_bytes (data->passed_type));
2317 else
2319 gcc_assert (data->partial % UNITS_PER_WORD == 0);
2320 move_block_from_reg (REGNO (entry_parm), validize_mem (stack_parm),
2321 data->partial / UNITS_PER_WORD);
2324 entry_parm = stack_parm;
2327 /* If we didn't decide this parm came in a register, by default it came
2328 on the stack. */
2329 else if (entry_parm == NULL)
2330 entry_parm = stack_parm;
2332 /* When an argument is passed in multiple locations, we can't make use
2333 of this information, but we can save some copying if the whole argument
2334 is passed in a single register. */
2335 else if (GET_CODE (entry_parm) == PARALLEL
2336 && data->nominal_mode != BLKmode
2337 && data->passed_mode != BLKmode)
2339 size_t i, len = XVECLEN (entry_parm, 0);
2341 for (i = 0; i < len; i++)
2342 if (XEXP (XVECEXP (entry_parm, 0, i), 0) != NULL_RTX
2343 && REG_P (XEXP (XVECEXP (entry_parm, 0, i), 0))
2344 && (GET_MODE (XEXP (XVECEXP (entry_parm, 0, i), 0))
2345 == data->passed_mode)
2346 && INTVAL (XEXP (XVECEXP (entry_parm, 0, i), 1)) == 0)
2348 entry_parm = XEXP (XVECEXP (entry_parm, 0, i), 0);
2349 break;
2353 data->entry_parm = entry_parm;
2356 /* A subroutine of assign_parms. Adjust DATA->STACK_RTL such that it's
2357 always valid and properly aligned. */
2359 static void
2360 assign_parm_adjust_stack_rtl (struct assign_parm_data_one *data)
2362 rtx stack_parm = data->stack_parm;
2364 /* If we can't trust the parm stack slot to be aligned enough for its
2365 ultimate type, don't use that slot after entry. We'll make another
2366 stack slot, if we need one. */
2367 if (stack_parm
2368 && ((STRICT_ALIGNMENT
2369 && GET_MODE_ALIGNMENT (data->nominal_mode) > MEM_ALIGN (stack_parm))
2370 || (data->nominal_type
2371 && TYPE_ALIGN (data->nominal_type) > MEM_ALIGN (stack_parm)
2372 && MEM_ALIGN (stack_parm) < PREFERRED_STACK_BOUNDARY)))
2373 stack_parm = NULL;
2375 /* If parm was passed in memory, and we need to convert it on entry,
2376 don't store it back in that same slot. */
2377 else if (data->entry_parm == stack_parm
2378 && data->nominal_mode != BLKmode
2379 && data->nominal_mode != data->passed_mode)
2380 stack_parm = NULL;
2382 /* If stack protection is in effect for this function, don't leave any
2383 pointers in their passed stack slots. */
2384 else if (crtl->stack_protect_guard
2385 && (flag_stack_protect == 2
2386 || data->passed_pointer
2387 || POINTER_TYPE_P (data->nominal_type)))
2388 stack_parm = NULL;
2390 data->stack_parm = stack_parm;
2393 /* A subroutine of assign_parms. Return true if the current parameter
2394 should be stored as a BLKmode in the current frame. */
2396 static bool
2397 assign_parm_setup_block_p (struct assign_parm_data_one *data)
2399 if (data->nominal_mode == BLKmode)
2400 return true;
2401 if (GET_CODE (data->entry_parm) == PARALLEL)
2402 return true;
2404 #ifdef BLOCK_REG_PADDING
2405 /* Only assign_parm_setup_block knows how to deal with register arguments
2406 that are padded at the least significant end. */
2407 if (REG_P (data->entry_parm)
2408 && GET_MODE_SIZE (data->promoted_mode) < UNITS_PER_WORD
2409 && (BLOCK_REG_PADDING (data->passed_mode, data->passed_type, 1)
2410 == (BYTES_BIG_ENDIAN ? upward : downward)))
2411 return true;
2412 #endif
2414 return false;
2417 /* A subroutine of assign_parms. Arrange for the parameter to be
2418 present and valid in DATA->STACK_RTL. */
2420 static void
2421 assign_parm_setup_block (struct assign_parm_data_all *all,
2422 tree parm, struct assign_parm_data_one *data)
2424 rtx entry_parm = data->entry_parm;
2425 rtx stack_parm = data->stack_parm;
2426 HOST_WIDE_INT size;
2427 HOST_WIDE_INT size_stored;
2428 rtx orig_entry_parm = entry_parm;
2430 if (GET_CODE (entry_parm) == PARALLEL)
2431 entry_parm = emit_group_move_into_temps (entry_parm);
2433 /* If we've a non-block object that's nevertheless passed in parts,
2434 reconstitute it in register operations rather than on the stack. */
2435 if (GET_CODE (entry_parm) == PARALLEL
2436 && data->nominal_mode != BLKmode)
2438 rtx elt0 = XEXP (XVECEXP (orig_entry_parm, 0, 0), 0);
2440 if ((XVECLEN (entry_parm, 0) > 1
2441 || hard_regno_nregs[REGNO (elt0)][GET_MODE (elt0)] > 1)
2442 && use_register_for_decl (parm))
2444 rtx parmreg = gen_reg_rtx (data->nominal_mode);
2446 push_to_sequence2 (all->first_conversion_insn,
2447 all->last_conversion_insn);
2449 /* For values returned in multiple registers, handle possible
2450 incompatible calls to emit_group_store.
2452 For example, the following would be invalid, and would have to
2453 be fixed by the conditional below:
2455 emit_group_store ((reg:SF), (parallel:DF))
2456 emit_group_store ((reg:SI), (parallel:DI))
2458         An example of this is doubles in e500 v2:
2459 (parallel:DF (expr_list (reg:SI) (const_int 0))
2460 (expr_list (reg:SI) (const_int 4))). */
2461 if (data->nominal_mode != data->passed_mode)
2463 rtx t = gen_reg_rtx (GET_MODE (entry_parm));
2464 emit_group_store (t, entry_parm, NULL_TREE,
2465 GET_MODE_SIZE (GET_MODE (entry_parm)));
2466 convert_move (parmreg, t, 0);
2468 else
2469 emit_group_store (parmreg, entry_parm, data->nominal_type,
2470 int_size_in_bytes (data->nominal_type));
2472 all->first_conversion_insn = get_insns ();
2473 all->last_conversion_insn = get_last_insn ();
2474 end_sequence ();
2476 SET_DECL_RTL (parm, parmreg);
2477 return;
2481 size = int_size_in_bytes (data->passed_type);
2482 size_stored = CEIL_ROUND (size, UNITS_PER_WORD);
2483 if (stack_parm == 0)
2485 DECL_ALIGN (parm) = MAX (DECL_ALIGN (parm), BITS_PER_WORD);
2486 stack_parm = assign_stack_local (BLKmode, size_stored,
2487 DECL_ALIGN (parm));
2488 if (GET_MODE_SIZE (GET_MODE (entry_parm)) == size)
2489 PUT_MODE (stack_parm, GET_MODE (entry_parm));
2490 set_mem_attributes (stack_parm, parm, 1);
2493 /* If a BLKmode arrives in registers, copy it to a stack slot. Handle
2494 calls that pass values in multiple non-contiguous locations. */
2495 if (REG_P (entry_parm) || GET_CODE (entry_parm) == PARALLEL)
2497 rtx mem;
2499 /* Note that we will be storing an integral number of words.
2500 So we have to be careful to ensure that we allocate an
2501 integral number of words. We do this above when we call
2502 assign_stack_local if space was not allocated in the argument
2503 list. If it was, this will not work if PARM_BOUNDARY is not
2504 a multiple of BITS_PER_WORD. It isn't clear how to fix this
2505 if it becomes a problem. Exception is when BLKmode arrives
2506 with arguments not conforming to word_mode. */
2508 if (data->stack_parm == 0)
2510 else if (GET_CODE (entry_parm) == PARALLEL)
2512 else
2513 gcc_assert (!size || !(PARM_BOUNDARY % BITS_PER_WORD));
2515 mem = validize_mem (stack_parm);
2517 /* Handle values in multiple non-contiguous locations. */
2518 if (GET_CODE (entry_parm) == PARALLEL)
2520 push_to_sequence2 (all->first_conversion_insn,
2521 all->last_conversion_insn);
2522 emit_group_store (mem, entry_parm, data->passed_type, size);
2523 all->first_conversion_insn = get_insns ();
2524 all->last_conversion_insn = get_last_insn ();
2525 end_sequence ();
2528 else if (size == 0)
2531 /* If SIZE is that of a mode no bigger than a word, just use
2532 that mode's store operation. */
2533 else if (size <= UNITS_PER_WORD)
2535 enum machine_mode mode
2536 = mode_for_size (size * BITS_PER_UNIT, MODE_INT, 0);
2538 if (mode != BLKmode
2539 #ifdef BLOCK_REG_PADDING
2540 && (size == UNITS_PER_WORD
2541 || (BLOCK_REG_PADDING (mode, data->passed_type, 1)
2542 != (BYTES_BIG_ENDIAN ? upward : downward)))
2543 #endif
2546 rtx reg;
2548 /* We are really truncating a word_mode value containing
2549 SIZE bytes into a value of mode MODE. If such an
2550 operation requires no actual instructions, we can refer
2551 to the value directly in mode MODE, otherwise we must
2552 start with the register in word_mode and explicitly
2553 convert it. */
2554 if (TRULY_NOOP_TRUNCATION (size * BITS_PER_UNIT, BITS_PER_WORD))
2555 reg = gen_rtx_REG (mode, REGNO (entry_parm));
2556 else
2558 reg = gen_rtx_REG (word_mode, REGNO (entry_parm));
2559 reg = convert_to_mode (mode, copy_to_reg (reg), 1);
2561 emit_move_insn (change_address (mem, mode, 0), reg);
2564 /* Blocks smaller than a word on a BYTES_BIG_ENDIAN
2565 machine must be aligned to the left before storing
2566 to memory. Note that the previous test doesn't
2567 handle all cases (e.g. SIZE == 3). */
2568 else if (size != UNITS_PER_WORD
2569 #ifdef BLOCK_REG_PADDING
2570 && (BLOCK_REG_PADDING (mode, data->passed_type, 1)
2571 == downward)
2572 #else
2573 && BYTES_BIG_ENDIAN
2574 #endif
2577 rtx tem, x;
2578 int by = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
2579 rtx reg = gen_rtx_REG (word_mode, REGNO (entry_parm));
2581 x = expand_shift (LSHIFT_EXPR, word_mode, reg,
2582 build_int_cst (NULL_TREE, by),
2583 NULL_RTX, 1);
2584 tem = change_address (mem, word_mode, 0);
2585 emit_move_insn (tem, x);
2587 else
2588 move_block_from_reg (REGNO (entry_parm), mem,
2589 size_stored / UNITS_PER_WORD);
2591 else
2592 move_block_from_reg (REGNO (entry_parm), mem,
2593 size_stored / UNITS_PER_WORD);
2595 else if (data->stack_parm == 0)
2597 push_to_sequence2 (all->first_conversion_insn, all->last_conversion_insn);
2598 emit_block_move (stack_parm, data->entry_parm, GEN_INT (size),
2599 BLOCK_OP_NORMAL);
2600 all->first_conversion_insn = get_insns ();
2601 all->last_conversion_insn = get_last_insn ();
2602 end_sequence ();
2605 data->stack_parm = stack_parm;
2606 SET_DECL_RTL (parm, stack_parm);
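   /* As an illustration of the left-alignment case above (hypothetical
      values): a 3-byte BLKmode argument arriving in a register on a
      big-endian target with UNITS_PER_WORD == 4 is shifted left by

          by == (UNITS_PER_WORD - size) * BITS_PER_UNIT == (4 - 3) * 8 == 8

      bits before the whole word is stored, so the three data bytes end up
      at the start (lowest addresses) of the stack slot rather than behind
      a byte of padding.  */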
2609 /* A subroutine of assign_parms. Allocate a pseudo to hold the current
2610 parameter. Get it there. Perform all ABI specified conversions. */
2612 static void
2613 assign_parm_setup_reg (struct assign_parm_data_all *all, tree parm,
2614 struct assign_parm_data_one *data)
2616 rtx parmreg;
2617 enum machine_mode promoted_nominal_mode;
2618 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (parm));
2619 bool did_conversion = false;
2621 /* Store the parm in a pseudoregister during the function, but we may
2622 need to do it in a wider mode. */
2624   /* This is not really promoting for a call.  However, we need to be
2625 consistent with assign_parm_find_data_types and expand_expr_real_1. */
2626 promoted_nominal_mode
2627 = promote_mode (data->nominal_type, data->nominal_mode, &unsignedp, 1);
2629 parmreg = gen_reg_rtx (promoted_nominal_mode);
2631 if (!DECL_ARTIFICIAL (parm))
2632 mark_user_reg (parmreg);
2634 /* If this was an item that we received a pointer to,
2635 set DECL_RTL appropriately. */
2636 if (data->passed_pointer)
2638 rtx x = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (data->passed_type)), parmreg);
2639 set_mem_attributes (x, parm, 1);
2640 SET_DECL_RTL (parm, x);
2642 else
2643 SET_DECL_RTL (parm, parmreg);
2645 /* Copy the value into the register. */
2646 if (data->nominal_mode != data->passed_mode
2647 || promoted_nominal_mode != data->promoted_mode)
2649 int save_tree_used;
2651 /* ENTRY_PARM has been converted to PROMOTED_MODE, its
2652 mode, by the caller. We now have to convert it to
2653 NOMINAL_MODE, if different. However, PARMREG may be in
2654 a different mode than NOMINAL_MODE if it is being stored
2655 promoted.
2657 If ENTRY_PARM is a hard register, it might be in a register
2658 not valid for operating in its mode (e.g., an odd-numbered
2659 register for a DFmode). In that case, moves are the only
2660 thing valid, so we can't do a convert from there. This
2661      occurs when the calling sequence allows such misaligned
2662 usages.
2664 In addition, the conversion may involve a call, which could
2665 clobber parameters which haven't been copied to pseudo
2666 registers yet. Therefore, we must first copy the parm to
2667 a pseudo reg here, and save the conversion until after all
2668 parameters have been moved. */
2670 rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm));
2672 emit_move_insn (tempreg, validize_mem (data->entry_parm));
2674 push_to_sequence2 (all->first_conversion_insn, all->last_conversion_insn);
2675 tempreg = convert_to_mode (data->nominal_mode, tempreg, unsignedp);
2677 if (GET_CODE (tempreg) == SUBREG
2678 && GET_MODE (tempreg) == data->nominal_mode
2679 && REG_P (SUBREG_REG (tempreg))
2680 && data->nominal_mode == data->passed_mode
2681 && GET_MODE (SUBREG_REG (tempreg)) == GET_MODE (data->entry_parm)
2682 && GET_MODE_SIZE (GET_MODE (tempreg))
2683 < GET_MODE_SIZE (GET_MODE (data->entry_parm)))
2685 /* The argument is already sign/zero extended, so note it
2686 into the subreg. */
2687 SUBREG_PROMOTED_VAR_P (tempreg) = 1;
2688 SUBREG_PROMOTED_UNSIGNED_SET (tempreg, unsignedp);
2691 /* TREE_USED gets set erroneously during expand_assignment. */
2692 save_tree_used = TREE_USED (parm);
2693 expand_assignment (parm, make_tree (data->nominal_type, tempreg), false);
2694 TREE_USED (parm) = save_tree_used;
2695 all->first_conversion_insn = get_insns ();
2696 all->last_conversion_insn = get_last_insn ();
2697 end_sequence ();
2699 did_conversion = true;
2701 else
2702 emit_move_insn (parmreg, validize_mem (data->entry_parm));
2704 /* If we were passed a pointer but the actual value can safely live
2705 in a register, put it in one. */
2706 if (data->passed_pointer
2707 && TYPE_MODE (TREE_TYPE (parm)) != BLKmode
2708 /* If by-reference argument was promoted, demote it. */
2709 && (TYPE_MODE (TREE_TYPE (parm)) != GET_MODE (DECL_RTL (parm))
2710 || use_register_for_decl (parm)))
2712 /* We can't use nominal_mode, because it will have been set to
2713 Pmode above. We must use the actual mode of the parm. */
2714 parmreg = gen_reg_rtx (TYPE_MODE (TREE_TYPE (parm)));
2715 mark_user_reg (parmreg);
2717 if (GET_MODE (parmreg) != GET_MODE (DECL_RTL (parm)))
2719 rtx tempreg = gen_reg_rtx (GET_MODE (DECL_RTL (parm)));
2720 int unsigned_p = TYPE_UNSIGNED (TREE_TYPE (parm));
2722 push_to_sequence2 (all->first_conversion_insn,
2723 all->last_conversion_insn);
2724 emit_move_insn (tempreg, DECL_RTL (parm));
2725 tempreg = convert_to_mode (GET_MODE (parmreg), tempreg, unsigned_p);
2726 emit_move_insn (parmreg, tempreg);
2727 all->first_conversion_insn = get_insns ();
2728 all->last_conversion_insn = get_last_insn ();
2729 end_sequence ();
2731 did_conversion = true;
2733 else
2734 emit_move_insn (parmreg, DECL_RTL (parm));
2736 SET_DECL_RTL (parm, parmreg);
2738 /* STACK_PARM is the pointer, not the parm, and PARMREG is
2739 now the parm. */
2740 data->stack_parm = NULL;
2743 /* Mark the register as eliminable if we did no conversion and it was
2744 copied from memory at a fixed offset, and the arg pointer was not
2745 copied to a pseudo-reg. If the arg pointer is a pseudo reg or the
2746 offset formed an invalid address, such memory-equivalences as we
2747 make here would screw up life analysis for it. */
2748 if (data->nominal_mode == data->passed_mode
2749 && !did_conversion
2750 && data->stack_parm != 0
2751 && MEM_P (data->stack_parm)
2752 && data->locate.offset.var == 0
2753 && reg_mentioned_p (virtual_incoming_args_rtx,
2754 XEXP (data->stack_parm, 0)))
2756 rtx linsn = get_last_insn ();
2757 rtx sinsn, set;
2759 /* Mark complex types separately. */
2760 if (GET_CODE (parmreg) == CONCAT)
2762 enum machine_mode submode
2763 = GET_MODE_INNER (GET_MODE (parmreg));
2764 int regnor = REGNO (XEXP (parmreg, 0));
2765 int regnoi = REGNO (XEXP (parmreg, 1));
2766 rtx stackr = adjust_address_nv (data->stack_parm, submode, 0);
2767 rtx stacki = adjust_address_nv (data->stack_parm, submode,
2768 GET_MODE_SIZE (submode));
2770 /* Scan backwards for the set of the real and
2771 imaginary parts. */
2772 for (sinsn = linsn; sinsn != 0;
2773 sinsn = prev_nonnote_insn (sinsn))
2775 set = single_set (sinsn);
2776 if (set == 0)
2777 continue;
2779 if (SET_DEST (set) == regno_reg_rtx [regnoi])
2780 set_unique_reg_note (sinsn, REG_EQUIV, stacki);
2781 else if (SET_DEST (set) == regno_reg_rtx [regnor])
2782 set_unique_reg_note (sinsn, REG_EQUIV, stackr);
2785 else if ((set = single_set (linsn)) != 0
2786 && SET_DEST (set) == parmreg)
2787 set_unique_reg_note (linsn, REG_EQUIV, data->stack_parm);
2790 /* For pointer data type, suggest pointer register. */
2791 if (POINTER_TYPE_P (TREE_TYPE (parm)))
2792 mark_reg_pointer (parmreg,
2793 TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm))));
2796 /* A subroutine of assign_parms. Allocate stack space to hold the current
2797 parameter. Get it there. Perform all ABI specified conversions. */
2799 static void
2800 assign_parm_setup_stack (struct assign_parm_data_all *all, tree parm,
2801 struct assign_parm_data_one *data)
2803 /* Value must be stored in the stack slot STACK_PARM during function
2804 execution. */
2805 bool to_conversion = false;
2807 if (data->promoted_mode != data->nominal_mode)
2809 /* Conversion is required. */
2810 rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm));
2812 emit_move_insn (tempreg, validize_mem (data->entry_parm));
2814 push_to_sequence2 (all->first_conversion_insn, all->last_conversion_insn);
2815 to_conversion = true;
2817 data->entry_parm = convert_to_mode (data->nominal_mode, tempreg,
2818 TYPE_UNSIGNED (TREE_TYPE (parm)));
2820 if (data->stack_parm)
2821 /* ??? This may need a big-endian conversion on sparc64. */
2822 data->stack_parm
2823 = adjust_address (data->stack_parm, data->nominal_mode, 0);
2826 if (data->entry_parm != data->stack_parm)
2828 rtx src, dest;
2830 if (data->stack_parm == 0)
2832 data->stack_parm
2833 = assign_stack_local (GET_MODE (data->entry_parm),
2834 GET_MODE_SIZE (GET_MODE (data->entry_parm)),
2835 TYPE_ALIGN (data->passed_type));
2836 set_mem_attributes (data->stack_parm, parm, 1);
2839 dest = validize_mem (data->stack_parm);
2840 src = validize_mem (data->entry_parm);
2842 if (MEM_P (src))
2844 /* Use a block move to handle potentially misaligned entry_parm. */
2845 if (!to_conversion)
2846 push_to_sequence2 (all->first_conversion_insn,
2847 all->last_conversion_insn);
2848 to_conversion = true;
2850 emit_block_move (dest, src,
2851 GEN_INT (int_size_in_bytes (data->passed_type)),
2852 BLOCK_OP_NORMAL);
2854 else
2855 emit_move_insn (dest, src);
2858 if (to_conversion)
2860 all->first_conversion_insn = get_insns ();
2861 all->last_conversion_insn = get_last_insn ();
2862 end_sequence ();
2865 SET_DECL_RTL (parm, data->stack_parm);
2868 /* A subroutine of assign_parms. If the ABI splits complex arguments, then
2869 undo the frobbing that we did in assign_parms_augmented_arg_list. */
2871 static void
2872 assign_parms_unsplit_complex (struct assign_parm_data_all *all, tree fnargs)
2874 tree parm;
2875 tree orig_fnargs = all->orig_fnargs;
2877 for (parm = orig_fnargs; parm; parm = TREE_CHAIN (parm))
2879 if (TREE_CODE (TREE_TYPE (parm)) == COMPLEX_TYPE
2880 && targetm.calls.split_complex_arg (TREE_TYPE (parm)))
2882 rtx tmp, real, imag;
2883 enum machine_mode inner = GET_MODE_INNER (DECL_MODE (parm));
2885 real = DECL_RTL (fnargs);
2886 imag = DECL_RTL (TREE_CHAIN (fnargs));
2887 if (inner != GET_MODE (real))
2889 real = gen_lowpart_SUBREG (inner, real);
2890 imag = gen_lowpart_SUBREG (inner, imag);
2893 if (TREE_ADDRESSABLE (parm))
2895 rtx rmem, imem;
2896 HOST_WIDE_INT size = int_size_in_bytes (TREE_TYPE (parm));
2898 /* split_complex_arg put the real and imag parts in
2899 pseudos. Move them to memory. */
2900 tmp = assign_stack_local (DECL_MODE (parm), size,
2901 TYPE_ALIGN (TREE_TYPE (parm)));
2902 set_mem_attributes (tmp, parm, 1);
2903 rmem = adjust_address_nv (tmp, inner, 0);
2904 imem = adjust_address_nv (tmp, inner, GET_MODE_SIZE (inner));
2905 push_to_sequence2 (all->first_conversion_insn,
2906 all->last_conversion_insn);
2907 emit_move_insn (rmem, real);
2908 emit_move_insn (imem, imag);
2909 all->first_conversion_insn = get_insns ();
2910 all->last_conversion_insn = get_last_insn ();
2911 end_sequence ();
2913 else
2914 tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag);
2915 SET_DECL_RTL (parm, tmp);
2917 real = DECL_INCOMING_RTL (fnargs);
2918 imag = DECL_INCOMING_RTL (TREE_CHAIN (fnargs));
2919 if (inner != GET_MODE (real))
2921 real = gen_lowpart_SUBREG (inner, real);
2922 imag = gen_lowpart_SUBREG (inner, imag);
2924 tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag);
2925 set_decl_incoming_rtl (parm, tmp, false);
2926 fnargs = TREE_CHAIN (fnargs);
2928 else
2930 SET_DECL_RTL (parm, DECL_RTL (fnargs));
2931 set_decl_incoming_rtl (parm, DECL_INCOMING_RTL (fnargs), false);
2933 /* Set MEM_EXPR to the original decl, i.e. to PARM,
2934 instead of the copy of decl, i.e. FNARGS. */
2935 if (DECL_INCOMING_RTL (parm) && MEM_P (DECL_INCOMING_RTL (parm)))
2936 set_mem_expr (DECL_INCOMING_RTL (parm), parm);
2939 fnargs = TREE_CHAIN (fnargs);
2943 /* Assign RTL expressions to the function's parameters. This may involve
2944 copying them into registers and using those registers as the DECL_RTL. */
2946 static void
2947 assign_parms (tree fndecl)
2949 struct assign_parm_data_all all;
2950 tree fnargs, parm;
2952 crtl->args.internal_arg_pointer
2953 = targetm.calls.internal_arg_pointer ();
2955 assign_parms_initialize_all (&all);
2956 fnargs = assign_parms_augmented_arg_list (&all);
2958 for (parm = fnargs; parm; parm = TREE_CHAIN (parm))
2960 struct assign_parm_data_one data;
2962 /* Extract the type of PARM; adjust it according to ABI. */
2963 assign_parm_find_data_types (&all, parm, &data);
2965 /* Early out for errors and void parameters. */
2966 if (data.passed_mode == VOIDmode)
2968 SET_DECL_RTL (parm, const0_rtx);
2969 DECL_INCOMING_RTL (parm) = DECL_RTL (parm);
2970 continue;
2973 if (cfun->stdarg && !TREE_CHAIN (parm))
2974 assign_parms_setup_varargs (&all, &data, false);
2976 /* Find out where the parameter arrives in this function. */
2977 assign_parm_find_entry_rtl (&all, &data);
2979 /* Find out where stack space for this parameter might be. */
2980 if (assign_parm_is_stack_parm (&all, &data))
2982 assign_parm_find_stack_rtl (parm, &data);
2983 assign_parm_adjust_entry_rtl (&data);
2986 /* Record permanently how this parm was passed. */
2987 set_decl_incoming_rtl (parm, data.entry_parm, data.passed_pointer);
2989 /* Update info on where next arg arrives in registers. */
2990 FUNCTION_ARG_ADVANCE (all.args_so_far, data.promoted_mode,
2991 data.passed_type, data.named_arg);
2993 assign_parm_adjust_stack_rtl (&data);
2995 if (assign_parm_setup_block_p (&data))
2996 assign_parm_setup_block (&all, parm, &data);
2997 else if (data.passed_pointer || use_register_for_decl (parm))
2998 assign_parm_setup_reg (&all, parm, &data);
2999 else
3000 assign_parm_setup_stack (&all, parm, &data);
3003 if (targetm.calls.split_complex_arg && fnargs != all.orig_fnargs)
3004 assign_parms_unsplit_complex (&all, fnargs);
3006 /* Output all parameter conversion instructions (possibly including calls)
3007 now that all parameters have been copied out of hard registers. */
3008 emit_insn (all.first_conversion_insn);
3010 /* If we are receiving a struct value address as the first argument, set up
3011 the RTL for the function result. As this might require code to convert
3012 the transmitted address to Pmode, we do this here to ensure that possible
3013 preliminary conversions of the address have been emitted already. */
3014 if (all.function_result_decl)
3016 tree result = DECL_RESULT (current_function_decl);
3017 rtx addr = DECL_RTL (all.function_result_decl);
3018 rtx x;
3020 if (DECL_BY_REFERENCE (result))
3021 x = addr;
3022 else
3024 addr = convert_memory_address (Pmode, addr);
3025 x = gen_rtx_MEM (DECL_MODE (result), addr);
3026 set_mem_attributes (x, result, 1);
3028 SET_DECL_RTL (result, x);
3031 /* We have aligned all the args, so add space for the pretend args. */
3032 crtl->args.pretend_args_size = all.pretend_args_size;
3033 all.stack_args_size.constant += all.extra_pretend_bytes;
3034 crtl->args.size = all.stack_args_size.constant;
3036 /* Adjust function incoming argument size for alignment and
3037 minimum length. */
3039 #ifdef REG_PARM_STACK_SPACE
3040 crtl->args.size = MAX (crtl->args.size,
3041 REG_PARM_STACK_SPACE (fndecl));
3042 #endif
3044 crtl->args.size = CEIL_ROUND (crtl->args.size,
3045 PARM_BOUNDARY / BITS_PER_UNIT);
3047 #ifdef ARGS_GROW_DOWNWARD
3048 crtl->args.arg_offset_rtx
3049 = (all.stack_args_size.var == 0 ? GEN_INT (-all.stack_args_size.constant)
3050 : expand_expr (size_diffop (all.stack_args_size.var,
3051 size_int (-all.stack_args_size.constant)),
3052 NULL_RTX, VOIDmode, 0));
3053 #else
3054 crtl->args.arg_offset_rtx = ARGS_SIZE_RTX (all.stack_args_size);
3055 #endif
3057 /* See how many bytes, if any, of its args a function should try to pop
3058 on return. */
3060 crtl->args.pops_args = RETURN_POPS_ARGS (fndecl, TREE_TYPE (fndecl),
3061 crtl->args.size);
3063   /* For a stdarg.h function, save info about
3064 regs and stack space used by the named args. */
3066 crtl->args.info = all.args_so_far;
3068 /* Set the rtx used for the function return value. Put this in its
3069 own variable so any optimizers that need this information don't have
3070 to include tree.h. Do this here so it gets done when an inlined
3071 function gets output. */
3073 crtl->return_rtx
3074 = (DECL_RTL_SET_P (DECL_RESULT (fndecl))
3075 ? DECL_RTL (DECL_RESULT (fndecl)) : NULL_RTX);
3077 /* If scalar return value was computed in a pseudo-reg, or was a named
3078 return value that got dumped to the stack, copy that to the hard
3079 return register. */
3080 if (DECL_RTL_SET_P (DECL_RESULT (fndecl)))
3082 tree decl_result = DECL_RESULT (fndecl);
3083 rtx decl_rtl = DECL_RTL (decl_result);
3085 if (REG_P (decl_rtl)
3086 ? REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER
3087 : DECL_REGISTER (decl_result))
3089 rtx real_decl_rtl;
3091 real_decl_rtl = targetm.calls.function_value (TREE_TYPE (decl_result),
3092 fndecl, true);
3093 REG_FUNCTION_VALUE_P (real_decl_rtl) = 1;
3094 /* The delay slot scheduler assumes that crtl->return_rtx
3095 holds the hard register containing the return value, not a
3096 temporary pseudo. */
3097 crtl->return_rtx = real_decl_rtl;
3102 /* A subroutine of gimplify_parameters, invoked via walk_tree.
3103 For all seen types, gimplify their sizes. */
3105 static tree
3106 gimplify_parm_type (tree *tp, int *walk_subtrees, void *data)
3108 tree t = *tp;
3110 *walk_subtrees = 0;
3111 if (TYPE_P (t))
3113 if (POINTER_TYPE_P (t))
3114 *walk_subtrees = 1;
3115 else if (TYPE_SIZE (t) && !TREE_CONSTANT (TYPE_SIZE (t))
3116 && !TYPE_SIZES_GIMPLIFIED (t))
3118 gimplify_type_sizes (t, (tree *) data);
3119 *walk_subtrees = 1;
3123 return NULL;
3126 /* Gimplify the parameter list for current_function_decl. This involves
3127 evaluating SAVE_EXPRs of variable sized parameters and generating code
3128 to implement callee-copies reference parameters. Returns a list of
3129 statements to add to the beginning of the function, or NULL if nothing
3130 to do. */
3132 tree
3133 gimplify_parameters (void)
3135 struct assign_parm_data_all all;
3136 tree fnargs, parm, stmts = NULL;
3138 assign_parms_initialize_all (&all);
3139 fnargs = assign_parms_augmented_arg_list (&all);
3141 for (parm = fnargs; parm; parm = TREE_CHAIN (parm))
3143 struct assign_parm_data_one data;
3145 /* Extract the type of PARM; adjust it according to ABI. */
3146 assign_parm_find_data_types (&all, parm, &data);
3148 /* Early out for errors and void parameters. */
3149 if (data.passed_mode == VOIDmode || DECL_SIZE (parm) == NULL)
3150 continue;
3152 /* Update info on where next arg arrives in registers. */
3153 FUNCTION_ARG_ADVANCE (all.args_so_far, data.promoted_mode,
3154 data.passed_type, data.named_arg);
3156 /* ??? Once upon a time variable_size stuffed parameter list
3157 SAVE_EXPRs (amongst others) onto a pending sizes list. This
3158 turned out to be less than manageable in the gimple world.
3159 Now we have to hunt them down ourselves. */
3160 walk_tree_without_duplicates (&data.passed_type,
3161 gimplify_parm_type, &stmts);
3163 if (!TREE_CONSTANT (DECL_SIZE (parm)))
3165 gimplify_one_sizepos (&DECL_SIZE (parm), &stmts);
3166 gimplify_one_sizepos (&DECL_SIZE_UNIT (parm), &stmts);
3169 if (data.passed_pointer)
3171 tree type = TREE_TYPE (data.passed_type);
3172 if (reference_callee_copied (&all.args_so_far, TYPE_MODE (type),
3173 type, data.named_arg))
3175 tree local, t;
3177 /* For constant sized objects, this is trivial; for
3178 variable-sized objects, we have to play games. */
3179 if (TREE_CONSTANT (DECL_SIZE (parm)))
3181 local = create_tmp_var (type, get_name (parm));
3182 DECL_IGNORED_P (local) = 0;
3184 else
3186 tree ptr_type, addr;
3188 ptr_type = build_pointer_type (type);
3189 addr = create_tmp_var (ptr_type, get_name (parm));
3190 DECL_IGNORED_P (addr) = 0;
3191 local = build_fold_indirect_ref (addr);
3193 t = built_in_decls[BUILT_IN_ALLOCA];
3194 t = build_call_expr (t, 1, DECL_SIZE_UNIT (parm));
3195 t = fold_convert (ptr_type, t);
3196 t = build_gimple_modify_stmt (addr, t);
3197 gimplify_and_add (t, &stmts);
3200 t = build_gimple_modify_stmt (local, parm);
3201 gimplify_and_add (t, &stmts);
3203 SET_DECL_VALUE_EXPR (parm, local);
3204 DECL_HAS_VALUE_EXPR_P (parm) = 1;
3209 return stmts;
3212 /* Compute the size and offset from the start of the stacked arguments for a
3213 parm passed in mode PASSED_MODE and with type TYPE.
3215 INITIAL_OFFSET_PTR points to the current offset into the stacked
3216 arguments.
3218 The starting offset and size for this parm are returned in
3219 LOCATE->OFFSET and LOCATE->SIZE, respectively. When IN_REGS is
3220    nonzero, the offset is that of the stack slot, which is returned in
3221 LOCATE->SLOT_OFFSET. LOCATE->ALIGNMENT_PAD is the amount of
3222 padding required from the initial offset ptr to the stack slot.
3224 IN_REGS is nonzero if the argument will be passed in registers. It will
3225 never be set if REG_PARM_STACK_SPACE is not defined.
3227 FNDECL is the function in which the argument was defined.
3229 There are two types of rounding that are done. The first, controlled by
3230 FUNCTION_ARG_BOUNDARY, forces the offset from the start of the argument
3231 list to be aligned to the specific boundary (in bits). This rounding
3232 affects the initial and starting offsets, but not the argument size.
3234 The second, controlled by FUNCTION_ARG_PADDING and PARM_BOUNDARY,
3235 optionally rounds the size of the parm to PARM_BOUNDARY. The
3236 initial offset is not affected by this rounding, while the size always
3237 is and the starting offset may be. */
3239 /* LOCATE->OFFSET will be negative in the ARGS_GROW_DOWNWARD case;
3240 INITIAL_OFFSET_PTR is positive because locate_and_pad_parm's
3241 callers pass in the total size of args so far as
3242 INITIAL_OFFSET_PTR. LOCATE->SIZE is always positive. */
3244 void
3245 locate_and_pad_parm (enum machine_mode passed_mode, tree type, int in_regs,
3246 int partial, tree fndecl ATTRIBUTE_UNUSED,
3247 struct args_size *initial_offset_ptr,
3248 struct locate_and_pad_arg_data *locate)
3250 tree sizetree;
3251 enum direction where_pad;
3252 unsigned int boundary;
3253 int reg_parm_stack_space = 0;
3254 int part_size_in_regs;
3256 #ifdef REG_PARM_STACK_SPACE
3257 reg_parm_stack_space = REG_PARM_STACK_SPACE (fndecl);
3259 /* If we have found a stack parm before we reach the end of the
3260 area reserved for registers, skip that area. */
3261 if (! in_regs)
3263 if (reg_parm_stack_space > 0)
3265 if (initial_offset_ptr->var)
3267 initial_offset_ptr->var
3268 = size_binop (MAX_EXPR, ARGS_SIZE_TREE (*initial_offset_ptr),
3269 ssize_int (reg_parm_stack_space));
3270 initial_offset_ptr->constant = 0;
3272 else if (initial_offset_ptr->constant < reg_parm_stack_space)
3273 initial_offset_ptr->constant = reg_parm_stack_space;
3276 #endif /* REG_PARM_STACK_SPACE */
3278 part_size_in_regs = (reg_parm_stack_space == 0 ? partial : 0);
3280 sizetree
3281 = type ? size_in_bytes (type) : size_int (GET_MODE_SIZE (passed_mode));
3282 where_pad = FUNCTION_ARG_PADDING (passed_mode, type);
3283 boundary = FUNCTION_ARG_BOUNDARY (passed_mode, type);
3284 locate->where_pad = where_pad;
3285 locate->boundary = boundary;
3287 /* Remember if the outgoing parameter requires extra alignment on the
3288 calling function side. */
3289 if (boundary > PREFERRED_STACK_BOUNDARY)
3290 boundary = PREFERRED_STACK_BOUNDARY;
3291 if (crtl->stack_alignment_needed < boundary)
3292 crtl->stack_alignment_needed = boundary;
3294 #ifdef ARGS_GROW_DOWNWARD
3295 locate->slot_offset.constant = -initial_offset_ptr->constant;
3296 if (initial_offset_ptr->var)
3297 locate->slot_offset.var = size_binop (MINUS_EXPR, ssize_int (0),
3298 initial_offset_ptr->var);
3301 tree s2 = sizetree;
3302 if (where_pad != none
3303 && (!host_integerp (sizetree, 1)
3304 || (tree_low_cst (sizetree, 1) * BITS_PER_UNIT) % PARM_BOUNDARY))
3305 s2 = round_up (s2, PARM_BOUNDARY / BITS_PER_UNIT);
3306 SUB_PARM_SIZE (locate->slot_offset, s2);
3309 locate->slot_offset.constant += part_size_in_regs;
3311 if (!in_regs
3312 #ifdef REG_PARM_STACK_SPACE
3313 || REG_PARM_STACK_SPACE (fndecl) > 0
3314 #endif
3316 pad_to_arg_alignment (&locate->slot_offset, boundary,
3317 &locate->alignment_pad);
3319 locate->size.constant = (-initial_offset_ptr->constant
3320 - locate->slot_offset.constant);
3321 if (initial_offset_ptr->var)
3322 locate->size.var = size_binop (MINUS_EXPR,
3323 size_binop (MINUS_EXPR,
3324 ssize_int (0),
3325 initial_offset_ptr->var),
3326 locate->slot_offset.var);
3328 /* Pad_below needs the pre-rounded size to know how much to pad
3329 below. */
3330 locate->offset = locate->slot_offset;
3331 if (where_pad == downward)
3332 pad_below (&locate->offset, passed_mode, sizetree);
3334 #else /* !ARGS_GROW_DOWNWARD */
3335 if (!in_regs
3336 #ifdef REG_PARM_STACK_SPACE
3337 || REG_PARM_STACK_SPACE (fndecl) > 0
3338 #endif
3340 pad_to_arg_alignment (initial_offset_ptr, boundary,
3341 &locate->alignment_pad);
3342 locate->slot_offset = *initial_offset_ptr;
3344 #ifdef PUSH_ROUNDING
3345 if (passed_mode != BLKmode)
3346 sizetree = size_int (PUSH_ROUNDING (TREE_INT_CST_LOW (sizetree)));
3347 #endif
3349 /* Pad_below needs the pre-rounded size to know how much to pad below
3350 so this must be done before rounding up. */
3351 locate->offset = locate->slot_offset;
3352 if (where_pad == downward)
3353 pad_below (&locate->offset, passed_mode, sizetree);
3355 if (where_pad != none
3356 && (!host_integerp (sizetree, 1)
3357 || (tree_low_cst (sizetree, 1) * BITS_PER_UNIT) % PARM_BOUNDARY))
3358 sizetree = round_up (sizetree, PARM_BOUNDARY / BITS_PER_UNIT);
3360 ADD_PARM_SIZE (locate->size, sizetree);
3362 locate->size.constant -= part_size_in_regs;
3363 #endif /* ARGS_GROW_DOWNWARD */
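/* A worked example of the two roundings described before this function
   (hypothetical numbers; assume args grow upward and
   STACK_POINTER_OFFSET == 0): a 10-byte BLKmode argument with
   FUNCTION_ARG_BOUNDARY == 64 bits, PARM_BOUNDARY == 32 bits and a
   running offset of 4 bytes gives

       slot_offset   == CEIL_ROUND (4, 64 / BITS_PER_UNIT) == 8
       alignment_pad == 8 - 4 == 4
       size          == round_up (10, 32 / BITS_PER_UNIT)  == 12

   The first rounding moves the starting offset; the second pads only the
   size of the slot.  */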
3366 /* Round the stack offset in *OFFSET_PTR up to a multiple of BOUNDARY.
3367 BOUNDARY is measured in bits, but must be a multiple of a storage unit. */
3369 static void
3370 pad_to_arg_alignment (struct args_size *offset_ptr, int boundary,
3371 struct args_size *alignment_pad)
3373 tree save_var = NULL_TREE;
3374 HOST_WIDE_INT save_constant = 0;
3375 int boundary_in_bytes = boundary / BITS_PER_UNIT;
3376 HOST_WIDE_INT sp_offset = STACK_POINTER_OFFSET;
3378 #ifdef SPARC_STACK_BOUNDARY_HACK
3379 /* ??? The SPARC port may claim a STACK_BOUNDARY higher than
3380 the real alignment of %sp. However, when it does this, the
3381 alignment of %sp+STACK_POINTER_OFFSET is STACK_BOUNDARY. */
3382 if (SPARC_STACK_BOUNDARY_HACK)
3383 sp_offset = 0;
3384 #endif
3386 if (boundary > PARM_BOUNDARY)
3388 save_var = offset_ptr->var;
3389 save_constant = offset_ptr->constant;
3392 alignment_pad->var = NULL_TREE;
3393 alignment_pad->constant = 0;
3395 if (boundary > BITS_PER_UNIT)
3397 if (offset_ptr->var)
3399 tree sp_offset_tree = ssize_int (sp_offset);
3400 tree offset = size_binop (PLUS_EXPR,
3401 ARGS_SIZE_TREE (*offset_ptr),
3402 sp_offset_tree);
3403 #ifdef ARGS_GROW_DOWNWARD
3404 tree rounded = round_down (offset, boundary / BITS_PER_UNIT);
3405 #else
3406 tree rounded = round_up (offset, boundary / BITS_PER_UNIT);
3407 #endif
3409 offset_ptr->var = size_binop (MINUS_EXPR, rounded, sp_offset_tree);
3410 /* ARGS_SIZE_TREE includes constant term. */
3411 offset_ptr->constant = 0;
3412 if (boundary > PARM_BOUNDARY)
3413 alignment_pad->var = size_binop (MINUS_EXPR, offset_ptr->var,
3414 save_var);
3416 else
3418 offset_ptr->constant = -sp_offset +
3419 #ifdef ARGS_GROW_DOWNWARD
3420 FLOOR_ROUND (offset_ptr->constant + sp_offset, boundary_in_bytes);
3421 #else
3422 CEIL_ROUND (offset_ptr->constant + sp_offset, boundary_in_bytes);
3423 #endif
3424 if (boundary > PARM_BOUNDARY)
3425 alignment_pad->constant = offset_ptr->constant - save_constant;
3430 static void
3431 pad_below (struct args_size *offset_ptr, enum machine_mode passed_mode, tree sizetree)
3433 if (passed_mode != BLKmode)
3435 if (GET_MODE_BITSIZE (passed_mode) % PARM_BOUNDARY)
3436 offset_ptr->constant
3437 += (((GET_MODE_BITSIZE (passed_mode) + PARM_BOUNDARY - 1)
3438 / PARM_BOUNDARY * PARM_BOUNDARY / BITS_PER_UNIT)
3439 - GET_MODE_SIZE (passed_mode));
3441 else
3443 if (TREE_CODE (sizetree) != INTEGER_CST
3444 || (TREE_INT_CST_LOW (sizetree) * BITS_PER_UNIT) % PARM_BOUNDARY)
3446 /* Round the size up to multiple of PARM_BOUNDARY bits. */
3447 tree s2 = round_up (sizetree, PARM_BOUNDARY / BITS_PER_UNIT);
3448 /* Add it in. */
3449 ADD_PARM_SIZE (*offset_ptr, s2);
3450 SUB_PARM_SIZE (*offset_ptr, sizetree);
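/* For example (hypothetical values): a HImode argument padded downward
   with PARM_BOUNDARY == 32 rounds up to one PARM_BOUNDARY unit, so the
   offset is advanced by

       32 / BITS_PER_UNIT - GET_MODE_SIZE (HImode) == 4 - 2 == 2

   bytes, leaving the two-byte value at the end of its four-byte slot.  */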
3456 /* True if register REGNO was alive at a place where `setjmp' was
3457 called and was set more than once or is an argument. Such regs may
3458 be clobbered by `longjmp'. */
3460 static bool
3461 regno_clobbered_at_setjmp (bitmap setjmp_crosses, int regno)
3463 /* There appear to be cases where some local vars never reach the
3464 backend but have bogus regnos. */
3465 if (regno >= max_reg_num ())
3466 return false;
3468 return ((REG_N_SETS (regno) > 1
3469 || REGNO_REG_SET_P (df_get_live_out (ENTRY_BLOCK_PTR), regno))
3470 && REGNO_REG_SET_P (setjmp_crosses, regno));
3473 /* Walk the tree of blocks describing the binding levels within a
3474    function and warn about variables that might be killed by setjmp or
3475    vfork.  This is done after flow analysis and before register
3476    allocation, since register allocation will replace the pseudo-regs
3477    with hard regs.  */
3479 static void
3480 setjmp_vars_warning (bitmap setjmp_crosses, tree block)
3482 tree decl, sub;
3484 for (decl = BLOCK_VARS (block); decl; decl = TREE_CHAIN (decl))
3486 if (TREE_CODE (decl) == VAR_DECL
3487 && DECL_RTL_SET_P (decl)
3488 && REG_P (DECL_RTL (decl))
3489 && regno_clobbered_at_setjmp (setjmp_crosses, REGNO (DECL_RTL (decl))))
3490 warning (OPT_Wclobbered, "variable %q+D might be clobbered by"
3491 " %<longjmp%> or %<vfork%>", decl);
3494 for (sub = BLOCK_SUBBLOCKS (block); sub; sub = BLOCK_CHAIN (sub))
3495 setjmp_vars_warning (setjmp_crosses, sub);
3498 /* Do the appropriate part of setjmp_vars_warning
3499 but for arguments instead of local variables. */
3501 static void
3502 setjmp_args_warning (bitmap setjmp_crosses)
3504 tree decl;
3505 for (decl = DECL_ARGUMENTS (current_function_decl);
3506 decl; decl = TREE_CHAIN (decl))
3507 if (DECL_RTL (decl) != 0
3508 && REG_P (DECL_RTL (decl))
3509 && regno_clobbered_at_setjmp (setjmp_crosses, REGNO (DECL_RTL (decl))))
3510 warning (OPT_Wclobbered,
3511 "argument %q+D might be clobbered by %<longjmp%> or %<vfork%>",
3512 decl);
3515 /* Generate warning messages for variables live across setjmp. */
3517 void
3518 generate_setjmp_warnings (void)
3520 bitmap setjmp_crosses = regstat_get_setjmp_crosses ();
3522 if (n_basic_blocks == NUM_FIXED_BLOCKS
3523 || bitmap_empty_p (setjmp_crosses))
3524 return;
3526 setjmp_vars_warning (setjmp_crosses, DECL_INITIAL (current_function_decl));
3527 setjmp_args_warning (setjmp_crosses);
3531 /* Identify BLOCKs referenced by more than one NOTE_INSN_BLOCK_{BEG,END},
3532 and create duplicate blocks. */
3533 /* ??? Need an option to either create block fragments or to create
3534 abstract origin duplicates of a source block. It really depends
3535 on what optimization has been performed. */
3537 void
3538 reorder_blocks (void)
3540 tree block = DECL_INITIAL (current_function_decl);
3541 VEC(tree,heap) *block_stack;
3543 if (block == NULL_TREE)
3544 return;
3546 block_stack = VEC_alloc (tree, heap, 10);
3548 /* Reset the TREE_ASM_WRITTEN bit for all blocks. */
3549 clear_block_marks (block);
3551 /* Prune the old trees away, so that they don't get in the way. */
3552 BLOCK_SUBBLOCKS (block) = NULL_TREE;
3553 BLOCK_CHAIN (block) = NULL_TREE;
3555 /* Recreate the block tree from the note nesting. */
3556 reorder_blocks_1 (get_insns (), block, &block_stack);
3557 BLOCK_SUBBLOCKS (block) = blocks_nreverse (BLOCK_SUBBLOCKS (block));
3559 VEC_free (tree, heap, block_stack);
3562 /* Helper function for reorder_blocks. Reset TREE_ASM_WRITTEN. */
3564 void
3565 clear_block_marks (tree block)
3567 while (block)
3569 TREE_ASM_WRITTEN (block) = 0;
3570 clear_block_marks (BLOCK_SUBBLOCKS (block));
3571 block = BLOCK_CHAIN (block);
3575 static void
3576 reorder_blocks_1 (rtx insns, tree current_block, VEC(tree,heap) **p_block_stack)
3578 rtx insn;
3580 for (insn = insns; insn; insn = NEXT_INSN (insn))
3582 if (NOTE_P (insn))
3584 if (NOTE_KIND (insn) == NOTE_INSN_BLOCK_BEG)
3586 tree block = NOTE_BLOCK (insn);
3587 tree origin;
3589 origin = (BLOCK_FRAGMENT_ORIGIN (block)
3590 ? BLOCK_FRAGMENT_ORIGIN (block)
3591 : block);
3593 /* If we have seen this block before, that means it now
3594 spans multiple address regions. Create a new fragment. */
3595 if (TREE_ASM_WRITTEN (block))
3597 tree new_block = copy_node (block);
3599 BLOCK_FRAGMENT_ORIGIN (new_block) = origin;
3600 BLOCK_FRAGMENT_CHAIN (new_block)
3601 = BLOCK_FRAGMENT_CHAIN (origin);
3602 BLOCK_FRAGMENT_CHAIN (origin) = new_block;
3604 NOTE_BLOCK (insn) = new_block;
3605 block = new_block;
3608 BLOCK_SUBBLOCKS (block) = 0;
3609 TREE_ASM_WRITTEN (block) = 1;
3610 /* When there's only one block for the entire function,
3611             current_block == block and we mustn't do this; it
3612             would cause infinite recursion.  */
3613 if (block != current_block)
3615 if (block != origin)
3616 gcc_assert (BLOCK_SUPERCONTEXT (origin) == current_block);
3618 BLOCK_SUPERCONTEXT (block) = current_block;
3619 BLOCK_CHAIN (block) = BLOCK_SUBBLOCKS (current_block);
3620 BLOCK_SUBBLOCKS (current_block) = block;
3621 current_block = origin;
3623 VEC_safe_push (tree, heap, *p_block_stack, block);
3625 else if (NOTE_KIND (insn) == NOTE_INSN_BLOCK_END)
3627 NOTE_BLOCK (insn) = VEC_pop (tree, *p_block_stack);
3628 BLOCK_SUBBLOCKS (current_block)
3629 = blocks_nreverse (BLOCK_SUBBLOCKS (current_block));
3630 current_block = BLOCK_SUPERCONTEXT (current_block);
3636 /* Reverse the order of elements in the chain T of blocks,
3637 and return the new head of the chain (old last element). */
3639 tree
3640 blocks_nreverse (tree t)
3642 tree prev = 0, decl, next;
3643 for (decl = t; decl; decl = next)
3645 next = BLOCK_CHAIN (decl);
3646 BLOCK_CHAIN (decl) = prev;
3647 prev = decl;
3649 return prev;
3652 /* Count the subblocks of the list starting with BLOCK. If VECTOR is
3653 non-NULL, list them all into VECTOR, in a depth-first preorder
3654 traversal of the block tree. Also clear TREE_ASM_WRITTEN in all
3655 blocks. */
3657 static int
3658 all_blocks (tree block, tree *vector)
3660 int n_blocks = 0;
3662 while (block)
3664 TREE_ASM_WRITTEN (block) = 0;
3666 /* Record this block. */
3667 if (vector)
3668 vector[n_blocks] = block;
3670 ++n_blocks;
3672 /* Record the subblocks, and their subblocks... */
3673 n_blocks += all_blocks (BLOCK_SUBBLOCKS (block),
3674 vector ? vector + n_blocks : 0);
3675 block = BLOCK_CHAIN (block);
3678 return n_blocks;
3681 /* Return a vector containing all the blocks rooted at BLOCK. The
3682 number of elements in the vector is stored in N_BLOCKS_P. The
3683 vector is dynamically allocated; it is the caller's responsibility
3684 to call `free' on the pointer returned. */
3686 static tree *
3687 get_block_vector (tree block, int *n_blocks_p)
3689 tree *block_vector;
3691 *n_blocks_p = all_blocks (block, NULL);
3692 block_vector = XNEWVEC (tree, *n_blocks_p);
3693 all_blocks (block, block_vector);
3695 return block_vector;
3698 static GTY(()) int next_block_index = 2;
3700 /* Set BLOCK_NUMBER for all the blocks in FN. */
3702 void
3703 number_blocks (tree fn)
3705 int i;
3706 int n_blocks;
3707 tree *block_vector;
3709 /* For SDB and XCOFF debugging output, we start numbering the blocks
3710 from 1 within each function, rather than keeping a running
3711 count. */
3712 #if defined (SDB_DEBUGGING_INFO) || defined (XCOFF_DEBUGGING_INFO)
3713 if (write_symbols == SDB_DEBUG || write_symbols == XCOFF_DEBUG)
3714 next_block_index = 1;
3715 #endif
3717 block_vector = get_block_vector (DECL_INITIAL (fn), &n_blocks);
3719 /* The top-level BLOCK isn't numbered at all. */
3720 for (i = 1; i < n_blocks; ++i)
3721 /* We number the blocks from two. */
3722 BLOCK_NUMBER (block_vector[i]) = next_block_index++;
3724 free (block_vector);
3726 return;
3729 /* If VAR is present in a subblock of BLOCK, return the subblock. */
3731 tree
3732 debug_find_var_in_block_tree (tree var, tree block)
3734 tree t;
3736 for (t = BLOCK_VARS (block); t; t = TREE_CHAIN (t))
3737 if (t == var)
3738 return block;
3740 for (t = BLOCK_SUBBLOCKS (block); t; t = TREE_CHAIN (t))
3742 tree ret = debug_find_var_in_block_tree (var, t);
3743 if (ret)
3744 return ret;
3747 return NULL_TREE;
3750 /* Keep track of whether we're in a dummy function context. If we are,
3751 we don't want to invoke the set_current_function hook, because we'll
3752 get into trouble if the hook calls target_reinit () recursively or
3753 when the initial initialization is not yet complete. */
3755 static bool in_dummy_function;
3757 /* Invoke the target hook when setting cfun. */
3759 static void
3760 invoke_set_current_function_hook (tree fndecl)
3762 if (!in_dummy_function)
3763 targetm.set_current_function (fndecl);
3766 /* cfun should never be set directly; use this function. */
3768 void
3769 set_cfun (struct function *new_cfun)
3771 if (cfun != new_cfun)
3773 cfun = new_cfun;
3774 invoke_set_current_function_hook (new_cfun ? new_cfun->decl : NULL_TREE);
3778 /* Keep track of the cfun stack. */
3780 typedef struct function *function_p;
3782 DEF_VEC_P(function_p);
3783 DEF_VEC_ALLOC_P(function_p,heap);
3785 /* Initialized with NOGC, making this poisonous to the garbage collector. */
3787 static VEC(function_p,heap) *cfun_stack;
3789 /* We save the value of in_system_header here when pushing the first
3790 function on the cfun stack, and we restore it from here when
3791 popping the last function. */
3793 static bool saved_in_system_header;
3795 /* Push the current cfun onto the stack, and set cfun to new_cfun. */
3797 void
3798 push_cfun (struct function *new_cfun)
3800 if (cfun == NULL)
3801 saved_in_system_header = in_system_header;
3802 VEC_safe_push (function_p, heap, cfun_stack, cfun);
3803 if (new_cfun)
3804 in_system_header = DECL_IN_SYSTEM_HEADER (new_cfun->decl);
3805 set_cfun (new_cfun);
3808 /* Pop cfun from the stack. */
3810 void
3811 pop_cfun (void)
3813 struct function *new_cfun = VEC_pop (function_p, cfun_stack);
3814 in_system_header = ((new_cfun == NULL) ? saved_in_system_header
3815 : DECL_IN_SYSTEM_HEADER (new_cfun->decl));
3816 set_cfun (new_cfun);
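/* A minimal usage sketch (illustrative; other_fndecl is a hypothetical
   FUNCTION_DECL): code that temporarily needs to operate on another
   function brackets the work with push_cfun/pop_cfun, so that cfun,
   in_system_header and the target's per-function state are restored:

       push_cfun (DECL_STRUCT_FUNCTION (other_fndecl));
       ... inspect or emit state for other_fndecl through cfun ...
       pop_cfun ();
*/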
3819 /* Return the current value of funcdef_no and increment it. */
3820 int
3821 get_next_funcdef_no (void)
3823 return funcdef_no++;
3826 /* Allocate a function structure for FNDECL and set its contents
3827 to the defaults. Set cfun to the newly-allocated object.
3828 Some of the helper functions invoked during initialization assume
3829 that cfun has already been set. Therefore, assign the new object
3830 directly into cfun and invoke the back end hook explicitly at the
3831 very end, rather than initializing a temporary and calling set_cfun
3832 on it.
3834 ABSTRACT_P is true if this is a function that will never be seen by
3835 the middle-end. Such functions are front-end concepts (like C++
3836 function templates) that do not correspond directly to functions
3837 placed in object files. */
3839 void
3840 allocate_struct_function (tree fndecl, bool abstract_p)
3842 tree result;
3843 tree fntype = fndecl ? TREE_TYPE (fndecl) : NULL_TREE;
3845 cfun = ggc_alloc_cleared (sizeof (struct function));
3847 current_function_funcdef_no = get_next_funcdef_no ();
3849 cfun->function_frequency = FUNCTION_FREQUENCY_NORMAL;
3851 init_eh_for_function ();
3853 if (init_machine_status)
3854 cfun->machine = (*init_machine_status) ();
3856 if (fndecl != NULL_TREE)
3858 DECL_STRUCT_FUNCTION (fndecl) = cfun;
3859 cfun->decl = fndecl;
3861 result = DECL_RESULT (fndecl);
3862 if (!abstract_p && aggregate_value_p (result, fndecl))
3864 #ifdef PCC_STATIC_STRUCT_RETURN
3865 cfun->returns_pcc_struct = 1;
3866 #endif
3867 cfun->returns_struct = 1;
3870 cfun->stdarg
3871 = (fntype
3872 && TYPE_ARG_TYPES (fntype) != 0
3873 && (TREE_VALUE (tree_last (TYPE_ARG_TYPES (fntype)))
3874 != void_type_node));
3876 /* Assume all registers in stdarg functions need to be saved. */
3877 cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
3878 cfun->va_list_fpr_size = VA_LIST_MAX_FPR_SIZE;
3881 invoke_set_current_function_hook (fndecl);
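/* Illustrative examples of the stdarg test above, assuming C input
   (f, g and h are hypothetical):

       int f (int n, ...);   TYPE_ARG_TYPES does not end in void_type_node
                             -> cfun->stdarg = 1
       int g (int n);        prototype terminated by void_type_node
                             -> cfun->stdarg = 0
       int h ();             unprototyped, TYPE_ARG_TYPES is 0
                             -> cfun->stdarg = 0

   The va_list_gpr_size/va_list_fpr_size defaults above then assume the
   worst case, namely that every argument register may need saving.  */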
3884 /* This is like allocate_struct_function, but pushes a new cfun for FNDECL
3885 instead of just setting it. */
3887 void
3888 push_struct_function (tree fndecl)
3890 if (cfun == NULL)
3891 saved_in_system_header = in_system_header;
3892 VEC_safe_push (function_p, heap, cfun_stack, cfun);
3893 if (fndecl)
3894 in_system_header = DECL_IN_SYSTEM_HEADER (fndecl);
3895 allocate_struct_function (fndecl, false);
3898 /* Reset cfun, and other non-struct-function variables to defaults as
3899 appropriate for emitting rtl at the start of a function. */
3901 static void
3902 prepare_function_start (void)
3904 gcc_assert (!crtl->emit.x_last_insn);
3905 init_emit ();
3906 init_varasm_status ();
3907 init_expr ();
3909 cse_not_expected = ! optimize;
3911 /* Caller save not needed yet. */
3912 caller_save_needed = 0;
3914 /* We haven't done register allocation yet. */
3915 reg_renumber = 0;
3917 /* Indicate that we have not instantiated virtual registers yet. */
3918 virtuals_instantiated = 0;
3920 /* Indicate that we want CONCATs now. */
3921 generating_concat_p = 1;
3923 /* Indicate we have no need of a frame pointer yet. */
3924 frame_pointer_needed = 0;
3927 /* Initialize the rtl expansion mechanism so that we can do simple things
3928 like generate sequences. This is used to provide a context during global
3929 initialization of some passes. You must call expand_dummy_function_end
3930 to exit this context. */
3932 void
3933 init_dummy_function_start (void)
3935 gcc_assert (!in_dummy_function);
3936 in_dummy_function = true;
3937 push_struct_function (NULL_TREE);
3938 prepare_function_start ();
3941 /* Generate RTL for the start of the function SUBR (a FUNCTION_DECL tree node)
3942 and initialize static variables for generating RTL for the statements
3943 of the function. */
3945 void
3946 init_function_start (tree subr)
3948 if (subr && DECL_STRUCT_FUNCTION (subr))
3949 set_cfun (DECL_STRUCT_FUNCTION (subr));
3950 else
3951 allocate_struct_function (subr, false);
3952 prepare_function_start ();
3954 /* Warn if this value is an aggregate type,
3955 regardless of which calling convention we are using for it. */
3956 if (AGGREGATE_TYPE_P (TREE_TYPE (DECL_RESULT (subr))))
3957 warning (OPT_Waggregate_return, "function returns an aggregate");
3960 /* Make sure all values used by the optimization passes have sane
3961 defaults. */
3962 unsigned int
3963 init_function_for_compilation (void)
3965 reg_renumber = 0;
3967 /* No prologue/epilogue insns yet. Make sure that these vectors are
3968 empty. */
3969 gcc_assert (VEC_length (int, prologue) == 0);
3970 gcc_assert (VEC_length (int, epilogue) == 0);
3971 gcc_assert (VEC_length (int, sibcall_epilogue) == 0);
3972 return 0;
3975 struct rtl_opt_pass pass_init_function =
3978 RTL_PASS,
3979 NULL, /* name */
3980 NULL, /* gate */
3981 init_function_for_compilation, /* execute */
3982 NULL, /* sub */
3983 NULL, /* next */
3984 0, /* static_pass_number */
3985 0, /* tv_id */
3986 0, /* properties_required */
3987 0, /* properties_provided */
3988 0, /* properties_destroyed */
3989 0, /* todo_flags_start */
3990 0 /* todo_flags_finish */
3995 void
3996 expand_main_function (void)
3998 #if (defined(INVOKE__main) \
3999 || (!defined(HAS_INIT_SECTION) \
4000 && !defined(INIT_SECTION_ASM_OP) \
4001 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
4002 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
4003 #endif
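/* Illustrative effect of the call above: on targets that define
   INVOKE__main or lack init sections, main behaves roughly like

       int
       main (int argc, char **argv)
       {
         __main ();        <- runs global constructors via libgcc
         ... user code ...
       }
*/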
4006 /* Expand code to initialize the stack_protect_guard. This is invoked at
4007 the beginning of a function to be protected. */
4009 #ifndef HAVE_stack_protect_set
4010 # define HAVE_stack_protect_set 0
4011 # define gen_stack_protect_set(x,y) (gcc_unreachable (), NULL_RTX)
4012 #endif
4014 void
4015 stack_protect_prologue (void)
4017 tree guard_decl = targetm.stack_protect_guard ();
4018 rtx x, y;
4020 /* Avoid expand_expr here, because we don't want guard_decl pulled
4021 into registers unless absolutely necessary. And we know that
4022 crtl->stack_protect_guard is a local stack slot, so this skips
4023 all the fluff. */
4024 x = validize_mem (DECL_RTL (crtl->stack_protect_guard));
4025 y = validize_mem (DECL_RTL (guard_decl));
4027 /* Allow the target to copy from Y to X without leaking Y into a
4028 register. */
4029 if (HAVE_stack_protect_set)
4031 rtx insn = gen_stack_protect_set (x, y);
4032 if (insn)
4034 emit_insn (insn);
4035 return;
4039 /* Otherwise do a straight move. */
4040 emit_move_insn (x, y);
4043 /* Expand code to verify the stack_protect_guard. This is invoked at
4044 the end of a function to be protected. */
4046 #ifndef HAVE_stack_protect_test
4047 # define HAVE_stack_protect_test 0
4048 # define gen_stack_protect_test(x, y, z) (gcc_unreachable (), NULL_RTX)
4049 #endif
4051 void
4052 stack_protect_epilogue (void)
4054 tree guard_decl = targetm.stack_protect_guard ();
4055 rtx label = gen_label_rtx ();
4056 rtx x, y, tmp;
4058 /* Avoid expand_expr here, because we don't want guard_decl pulled
4059 into registers unless absolutely necessary. And we know that
4060 crtl->stack_protect_guard is a local stack slot, so this skips
4061 all the fluff. */
4062 x = validize_mem (DECL_RTL (crtl->stack_protect_guard));
4063 y = validize_mem (DECL_RTL (guard_decl));
4065 /* Allow the target to compare Y with X without leaking either into
4066 a register. */
4067 switch (HAVE_stack_protect_test != 0)
4069 case 1:
4070 tmp = gen_stack_protect_test (x, y, label);
4071 if (tmp)
4073 emit_insn (tmp);
4074 break;
4076 /* FALLTHRU */
4078 default:
4079 emit_cmp_and_jump_insns (x, y, EQ, NULL_RTX, ptr_mode, 1, label);
4080 break;
4083 /* The noreturn predictor has been moved to the tree level. The rtl-level
4084 predictors estimate this branch at about 20%, which isn't enough to get
4085 things moved out of line. Since this is the only extant case of adding
4086 a noreturn function at the rtl level, it doesn't seem worth doing anything
4087 except adding the prediction by hand. */
4088 tmp = get_last_insn ();
4089 if (JUMP_P (tmp))
4090 predict_insn_def (tmp, PRED_NORETURN, TAKEN);
4092 expand_expr_stmt (targetm.stack_protect_fail ());
4093 emit_label (label);
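/* A rough source-level sketch of what the two routines above emit; the
   real code works on DECL_RTL and target patterns, and local_guard,
   global_guard and guard_t below stand for crtl->stack_protect_guard,
   the target's guard decl and its type:

       void
       f (void)
       {
         guard_t local_guard = global_guard;   <- stack_protect_prologue
         ... function body ...
         if (local_guard != global_guard)      <- stack_protect_epilogue
           stack_protect_fail ();              <- targetm.stack_protect_fail,
                                                  typically __stack_chk_fail
       }
*/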
4096 /* Start the RTL for a new function, and set variables used for
4097 emitting RTL.
4098 SUBR is the FUNCTION_DECL node. */
4102 void
4103 expand_function_start (tree subr)
4105 /* Make sure volatile mem refs aren't considered
4106 valid operands of arithmetic insns. */
4107 init_recog_no_volatile ();
4109 crtl->profile
4110 = (profile_flag
4111 && ! DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (subr));
4113 crtl->limit_stack
4114 = (stack_limit_rtx != NULL_RTX && ! DECL_NO_LIMIT_STACK (subr));
4116 /* Make the label for return statements to jump to. Do not special
4117 case machines with special return instructions -- they will be
4118 handled later during jump, ifcvt, or epilogue creation. */
4119 return_label = gen_label_rtx ();
4121 /* Initialize rtx used to return the value. */
4122 /* Do this before assign_parms so that we copy the struct value address
4123 before any library calls that assign parms might generate. */
4125 /* Decide whether to return the value in memory or in a register. */
4126 if (aggregate_value_p (DECL_RESULT (subr), subr))
4128 /* Returning something that won't go in a register. */
4129 rtx value_address = 0;
4131 #ifdef PCC_STATIC_STRUCT_RETURN
4132 if (cfun->returns_pcc_struct)
4134 int size = int_size_in_bytes (TREE_TYPE (DECL_RESULT (subr)));
4135 value_address = assemble_static_space (size);
4137 else
4138 #endif
4140 rtx sv = targetm.calls.struct_value_rtx (TREE_TYPE (subr), 2);
4141 /* Expect to be passed the address of a place to store the value.
4142 If it is passed as an argument, assign_parms will take care of
4143 it. */
4144 if (sv)
4146 value_address = gen_reg_rtx (Pmode);
4147 emit_move_insn (value_address, sv);
4150 if (value_address)
4152 rtx x = value_address;
4153 if (!DECL_BY_REFERENCE (DECL_RESULT (subr)))
4155 x = gen_rtx_MEM (DECL_MODE (DECL_RESULT (subr)), x);
4156 set_mem_attributes (x, DECL_RESULT (subr), 1);
4158 SET_DECL_RTL (DECL_RESULT (subr), x);
4161 else if (DECL_MODE (DECL_RESULT (subr)) == VOIDmode)
4162 /* If return mode is void, this decl rtl should not be used. */
4163 SET_DECL_RTL (DECL_RESULT (subr), NULL_RTX);
4164 else
4166 /* Compute the return values into a pseudo reg, which we will copy
4167 into the true return register after the cleanups are done. */
4168 tree return_type = TREE_TYPE (DECL_RESULT (subr));
4169 if (TYPE_MODE (return_type) != BLKmode
4170 && targetm.calls.return_in_msb (return_type))
4171 /* expand_function_end will insert the appropriate padding in
4172 this case. Use the return value's natural (unpadded) mode
4173 within the function proper. */
4174 SET_DECL_RTL (DECL_RESULT (subr),
4175 gen_reg_rtx (TYPE_MODE (return_type)));
4176 else
4178 /* In order to figure out what mode to use for the pseudo, we
4179 figure out what the mode of the eventual return register will
4180 actually be, and use that. */
4181 rtx hard_reg = hard_function_value (return_type, subr, 0, 1);
4183 /* Structures that are returned in registers are not
4184 aggregate_value_p, so we may see a PARALLEL or a REG. */
4185 if (REG_P (hard_reg))
4186 SET_DECL_RTL (DECL_RESULT (subr),
4187 gen_reg_rtx (GET_MODE (hard_reg)));
4188 else
4190 gcc_assert (GET_CODE (hard_reg) == PARALLEL);
4191 SET_DECL_RTL (DECL_RESULT (subr), gen_group_rtx (hard_reg));
4195 /* Set DECL_REGISTER flag so that expand_function_end will copy the
4196 result to the real return register(s). */
4197 DECL_REGISTER (DECL_RESULT (subr)) = 1;
4200 /* Initialize rtx for parameters and local variables.
4201 In some cases this requires emitting insns. */
4202 assign_parms (subr);
4204 /* If function gets a static chain arg, store it. */
4205 if (cfun->static_chain_decl)
4207 tree parm = cfun->static_chain_decl;
4208 rtx local = gen_reg_rtx (Pmode);
4210 set_decl_incoming_rtl (parm, static_chain_incoming_rtx, false);
4211 SET_DECL_RTL (parm, local);
4212 mark_reg_pointer (local, TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm))));
4214 emit_move_insn (local, static_chain_incoming_rtx);
4217 /* If the function receives a non-local goto, then store the
4218 bits we need to restore the frame pointer. */
4219 if (cfun->nonlocal_goto_save_area)
4221 tree t_save;
4222 rtx r_save;
4224 /* ??? We need to do this save early. Unfortunately, this point is
4225 before the frame variable gets declared. Help out... */
4226 tree var = TREE_OPERAND (cfun->nonlocal_goto_save_area, 0);
4227 if (!DECL_RTL_SET_P (var))
4228 expand_decl (var);
4230 t_save = build4 (ARRAY_REF, ptr_type_node,
4231 cfun->nonlocal_goto_save_area,
4232 integer_zero_node, NULL_TREE, NULL_TREE);
4233 r_save = expand_expr (t_save, NULL_RTX, VOIDmode, EXPAND_WRITE);
4234 r_save = convert_memory_address (Pmode, r_save);
4236 emit_move_insn (r_save, targetm.builtin_setjmp_frame_value ());
4237 update_nonlocal_goto_save_area ();
4240 /* The following was moved from init_function_start.
4241 The move is supposed to make sdb output more accurate. */
4242 /* Indicate the beginning of the function body,
4243 as opposed to parm setup. */
4244 emit_note (NOTE_INSN_FUNCTION_BEG);
4246 gcc_assert (NOTE_P (get_last_insn ()));
4248 parm_birth_insn = get_last_insn ();
4250 if (crtl->profile)
4252 #ifdef PROFILE_HOOK
4253 PROFILE_HOOK (current_function_funcdef_no);
4254 #endif
4257 /* After the display initializations is where the stack checking
4258 probe should go. */
4259 if (flag_stack_check)
4260 stack_check_probe_note = emit_note (NOTE_INSN_DELETED);
4262 /* Make sure there is a line number after the function entry setup code. */
4263 force_next_line_note ();
4266 /* Undo the effects of init_dummy_function_start. */
4267 void
4268 expand_dummy_function_end (void)
4270 gcc_assert (in_dummy_function);
4272 /* End any sequences that failed to be closed due to syntax errors. */
4273 while (in_sequence_p ())
4274 end_sequence ();
4276 /* Outside function body, can't compute type's actual size
4277 until next function's body starts. */
4279 free_after_parsing (cfun);
4280 free_after_compilation (cfun);
4281 pop_cfun ();
4282 in_dummy_function = false;
4285 /* Call DOIT for each hard register used as a return value from
4286 the current function. */
4288 void
4289 diddle_return_value (void (*doit) (rtx, void *), void *arg)
4291 rtx outgoing = crtl->return_rtx;
4293 if (! outgoing)
4294 return;
4296 if (REG_P (outgoing))
4297 (*doit) (outgoing, arg);
4298 else if (GET_CODE (outgoing) == PARALLEL)
4300 int i;
4302 for (i = 0; i < XVECLEN (outgoing, 0); i++)
4304 rtx x = XEXP (XVECEXP (outgoing, 0, i), 0);
4306 if (REG_P (x) && REGNO (x) < FIRST_PSEUDO_REGISTER)
4307 (*doit) (x, arg);
4312 static void
4313 do_clobber_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
4315 emit_insn (gen_rtx_CLOBBER (VOIDmode, reg));
4318 void
4319 clobber_return_register (void)
4321 diddle_return_value (do_clobber_return_reg, NULL);
4323 /* In case we do use a pseudo to return the value, clobber it too. */
4324 if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
4326 tree decl_result = DECL_RESULT (current_function_decl);
4327 rtx decl_rtl = DECL_RTL (decl_result);
4328 if (REG_P (decl_rtl) && REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER)
4330 do_clobber_return_reg (decl_rtl, NULL);
4335 static void
4336 do_use_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
4338 emit_insn (gen_rtx_USE (VOIDmode, reg));
4341 static void
4342 use_return_register (void)
4344 diddle_return_value (do_use_return_reg, NULL);
4347 /* Possibly warn about unused parameters. */
4348 void
4349 do_warn_unused_parameter (tree fn)
4351 tree decl;
4353 for (decl = DECL_ARGUMENTS (fn);
4354 decl; decl = TREE_CHAIN (decl))
4355 if (!TREE_USED (decl) && TREE_CODE (decl) == PARM_DECL
4356 && DECL_NAME (decl) && !DECL_ARTIFICIAL (decl)
4357 && !TREE_NO_WARNING (decl))
4358 warning (OPT_Wunused_parameter, "unused parameter %q+D", decl);
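/* Illustrative examples of what the conditions above accept and reject
   (f, g and h are hypothetical):

       void f (int x) { }                           -> warns about 'x'
       void g (int x __attribute__ ((unused))) { }  -> no warning, TREE_USED is set
       void h (int x) { (void) x; }                 -> no warning, x is used
*/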
4361 static GTY(()) rtx initial_trampoline;
4363 /* Generate RTL for the end of the current function. */
4365 void
4366 expand_function_end (void)
4368 rtx clobber_after;
4370 /* If arg_pointer_save_area was referenced only from a nested
4371 function, we will not have initialized it yet. Do that now. */
4372 if (arg_pointer_save_area && ! crtl->arg_pointer_save_area_init)
4373 get_arg_pointer_save_area ();
4375 /* If we are doing stack checking and this function makes calls,
4376 do a stack probe at the start of the function to ensure we have enough
4377 space for another stack frame. */
4378 if (flag_stack_check && ! STACK_CHECK_BUILTIN)
4380 rtx insn, seq;
4382 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
4383 if (CALL_P (insn))
4385 start_sequence ();
4386 probe_stack_range (STACK_CHECK_PROTECT,
4387 GEN_INT (STACK_CHECK_MAX_FRAME_SIZE));
4388 seq = get_insns ();
4389 end_sequence ();
4390 emit_insn_before (seq, stack_check_probe_note);
4391 break;
4395 /* End any sequences that failed to be closed due to syntax errors. */
4396 while (in_sequence_p ())
4397 end_sequence ();
4399 clear_pending_stack_adjust ();
4400 do_pending_stack_adjust ();
4402 /* Output a line number for the end of the function.
4403 SDB depends on this. */
4404 force_next_line_note ();
4405 set_curr_insn_source_location (input_location);
4407 /* Before the return label (if any), clobber the return
4408 registers so that they are not propagated live to the rest of
4409 the function. This can only happen with functions that drop
4410 through; if there had been a return statement, there would
4411 have either been a return rtx, or a jump to the return label.
4413 We delay the actual code generation until after the current_function_value_rtx
4414 is computed. */
4415 clobber_after = get_last_insn ();
4417 /* Output the label for the actual return from the function. */
4418 emit_label (return_label);
4420 if (USING_SJLJ_EXCEPTIONS)
4422 /* Let except.c know where it should emit the call to unregister
4423 the function context for sjlj exceptions. */
4424 if (flag_exceptions)
4425 sjlj_emit_function_exit_after (get_last_insn ());
4427 else
4429 /* We want to ensure that instructions that may trap are not
4430 moved into the epilogue by scheduling, because we don't
4431 always emit unwind information for the epilogue. */
4432 if (flag_non_call_exceptions)
4433 emit_insn (gen_blockage ());
4436 /* If this is an implementation of throw, do what's necessary to
4437 communicate between __builtin_eh_return and the epilogue. */
4438 expand_eh_return ();
4440 /* If scalar return value was computed in a pseudo-reg, or was a named
4441 return value that got dumped to the stack, copy that to the hard
4442 return register. */
4443 if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
4445 tree decl_result = DECL_RESULT (current_function_decl);
4446 rtx decl_rtl = DECL_RTL (decl_result);
4448 if (REG_P (decl_rtl)
4449 ? REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER
4450 : DECL_REGISTER (decl_result))
4452 rtx real_decl_rtl = crtl->return_rtx;
4454 /* This should be set in assign_parms. */
4455 gcc_assert (REG_FUNCTION_VALUE_P (real_decl_rtl));
4457 /* If this is a BLKmode structure being returned in registers,
4458 then use the mode computed in expand_return. Note that if
4459 decl_rtl is memory, then its mode may have been changed,
4460 but that crtl->return_rtx has not. */
4461 if (GET_MODE (real_decl_rtl) == BLKmode)
4462 PUT_MODE (real_decl_rtl, GET_MODE (decl_rtl));
4464 /* If a non-BLKmode return value should be padded at the least
4465 significant end of the register, shift it left by the appropriate
4466 amount. BLKmode results are handled using the group load/store
4467 machinery. */
4468 if (TYPE_MODE (TREE_TYPE (decl_result)) != BLKmode
4469 && targetm.calls.return_in_msb (TREE_TYPE (decl_result)))
4471 emit_move_insn (gen_rtx_REG (GET_MODE (decl_rtl),
4472 REGNO (real_decl_rtl)),
4473 decl_rtl);
4474 shift_return_value (GET_MODE (decl_rtl), true, real_decl_rtl);
4476 /* If a named return value was dumped to memory, then
4477 we may need to re-do the PROMOTE_MODE signed/unsigned
4478 extension. */
4479 else if (GET_MODE (real_decl_rtl) != GET_MODE (decl_rtl))
4481 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (decl_result));
4483 if (targetm.calls.promote_function_return (TREE_TYPE (current_function_decl)))
4484 promote_mode (TREE_TYPE (decl_result), GET_MODE (decl_rtl),
4485 &unsignedp, 1);
4487 convert_move (real_decl_rtl, decl_rtl, unsignedp);
4489 else if (GET_CODE (real_decl_rtl) == PARALLEL)
4491 /* If expand_function_start has created a PARALLEL for decl_rtl,
4492 move the result to the real return registers. Otherwise, do
4493 a group load from decl_rtl for a named return. */
4494 if (GET_CODE (decl_rtl) == PARALLEL)
4495 emit_group_move (real_decl_rtl, decl_rtl);
4496 else
4497 emit_group_load (real_decl_rtl, decl_rtl,
4498 TREE_TYPE (decl_result),
4499 int_size_in_bytes (TREE_TYPE (decl_result)));
4501 /* In the case of complex integer modes smaller than a word, we'll
4502 need to generate some non-trivial bitfield insertions. Do that
4503 on a pseudo and not the hard register. */
4504 else if (GET_CODE (decl_rtl) == CONCAT
4505 && GET_MODE_CLASS (GET_MODE (decl_rtl)) == MODE_COMPLEX_INT
4506 && GET_MODE_BITSIZE (GET_MODE (decl_rtl)) <= BITS_PER_WORD)
4508 int old_generating_concat_p;
4509 rtx tmp;
4511 old_generating_concat_p = generating_concat_p;
4512 generating_concat_p = 0;
4513 tmp = gen_reg_rtx (GET_MODE (decl_rtl));
4514 generating_concat_p = old_generating_concat_p;
4516 emit_move_insn (tmp, decl_rtl);
4517 emit_move_insn (real_decl_rtl, tmp);
4519 else
4520 emit_move_insn (real_decl_rtl, decl_rtl);
4524 /* If returning a structure, arrange to return the address of the value
4525 in a place where debuggers expect to find it.
4527 If returning a structure PCC style,
4528 the caller also depends on this value.
4529 And cfun->returns_pcc_struct is not necessarily set. */
4530 if (cfun->returns_struct
4531 || cfun->returns_pcc_struct)
4533 rtx value_address = DECL_RTL (DECL_RESULT (current_function_decl));
4534 tree type = TREE_TYPE (DECL_RESULT (current_function_decl));
4535 rtx outgoing;
4537 if (DECL_BY_REFERENCE (DECL_RESULT (current_function_decl)))
4538 type = TREE_TYPE (type);
4539 else
4540 value_address = XEXP (value_address, 0);
4542 outgoing = targetm.calls.function_value (build_pointer_type (type),
4543 current_function_decl, true);
4545 /* Mark this as a function return value so integrate will delete the
4546 assignment and USE below when inlining this function. */
4547 REG_FUNCTION_VALUE_P (outgoing) = 1;
4549 /* The address may be ptr_mode and OUTGOING may be Pmode. */
4550 value_address = convert_memory_address (GET_MODE (outgoing),
4551 value_address);
4553 emit_move_insn (outgoing, value_address);
4555 /* Show return register used to hold result (in this case the address
4556 of the result). */
4557 crtl->return_rtx = outgoing;
4560 /* Emit the actual code to clobber return register. */
4562 rtx seq;
4564 start_sequence ();
4565 clobber_return_register ();
4566 expand_naked_return ();
4567 seq = get_insns ();
4568 end_sequence ();
4570 emit_insn_after (seq, clobber_after);
4573 /* Output the label for the naked return from the function. */
4574 emit_label (naked_return_label);
4576 /* @@@ This is a kludge. We want to ensure that instructions that
4577 may trap are not moved into the epilogue by scheduling, because
4578 we don't always emit unwind information for the epilogue. */
4579 if (! USING_SJLJ_EXCEPTIONS && flag_non_call_exceptions)
4580 emit_insn (gen_blockage ());
4582 /* If stack protection is enabled for this function, check the guard. */
4583 if (crtl->stack_protect_guard)
4584 stack_protect_epilogue ();
4586 /* If we had calls to alloca, and this machine needs
4587 an accurate stack pointer to exit the function,
4588 insert some code to save and restore the stack pointer. */
4589 if (! EXIT_IGNORE_STACK
4590 && cfun->calls_alloca)
4592 rtx tem = 0;
4594 emit_stack_save (SAVE_FUNCTION, &tem, parm_birth_insn);
4595 emit_stack_restore (SAVE_FUNCTION, tem, NULL_RTX);
4598 /* ??? This should no longer be necessary since stupid register allocation
4599 is no longer with us, but there are some parts of the compiler (e.g.
4600 reload_combine, and sh mach_dep_reorg) that still try to compute their own lifetime info
4601 instead of using the general framework. */
4602 use_return_register ();
4605 rtx
4606 get_arg_pointer_save_area (void)
4608 rtx ret = arg_pointer_save_area;
4610 if (! ret)
4612 ret = assign_stack_local (Pmode, GET_MODE_SIZE (Pmode), 0);
4613 arg_pointer_save_area = ret;
4616 if (! crtl->arg_pointer_save_area_init)
4618 rtx seq;
4620 /* Save the arg pointer at the beginning of the function. The
4621 generated stack slot may not be a valid memory address, so we
4622 have to check it and fix it if necessary. */
4623 start_sequence ();
4624 emit_move_insn (validize_mem (ret), virtual_incoming_args_rtx);
4625 seq = get_insns ();
4626 end_sequence ();
4628 push_topmost_sequence ();
4629 emit_insn_after (seq, entry_of_function ());
4630 pop_topmost_sequence ();
4633 return ret;
4636 /* Extend a vector that records the INSN_UIDs of INSNS
4637 (a list of one or more insns). */
4639 static void
4640 record_insns (rtx insns, VEC(int,heap) **vecp)
4642 rtx tmp;
4644 for (tmp = insns; tmp != NULL_RTX; tmp = NEXT_INSN (tmp))
4645 VEC_safe_push (int, heap, *vecp, INSN_UID (tmp));
4648 /* Set the locator of the insn chain starting at INSN to LOC. */
4649 static void
4650 set_insn_locators (rtx insn, int loc)
4652 while (insn != NULL_RTX)
4654 if (INSN_P (insn))
4655 INSN_LOCATOR (insn) = loc;
4656 insn = NEXT_INSN (insn);
4660 /* Determine how many INSN_UIDs in VEC are part of INSN. Because we can
4661 be running after reorg, SEQUENCE rtl is possible. */
4663 static int
4664 contains (const_rtx insn, VEC(int,heap) **vec)
4666 int i, j;
4668 if (NONJUMP_INSN_P (insn)
4669 && GET_CODE (PATTERN (insn)) == SEQUENCE)
4671 int count = 0;
4672 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
4673 for (j = VEC_length (int, *vec) - 1; j >= 0; --j)
4674 if (INSN_UID (XVECEXP (PATTERN (insn), 0, i))
4675 == VEC_index (int, *vec, j))
4676 count++;
4677 return count;
4679 else
4681 for (j = VEC_length (int, *vec) - 1; j >= 0; --j)
4682 if (INSN_UID (insn) == VEC_index (int, *vec, j))
4683 return 1;
4685 return 0;
4688 int
4689 prologue_epilogue_contains (const_rtx insn)
4691 if (contains (insn, &prologue))
4692 return 1;
4693 if (contains (insn, &epilogue))
4694 return 1;
4695 return 0;
4698 int
4699 sibcall_epilogue_contains (const_rtx insn)
4701 if (sibcall_epilogue)
4702 return contains (insn, &sibcall_epilogue);
4703 return 0;
4706 #ifdef HAVE_return
4707 /* Insert gen_return at the end of block BB. This also means updating
4708 block_for_insn appropriately. */
4710 static void
4711 emit_return_into_block (basic_block bb)
4713 emit_jump_insn_after (gen_return (), BB_END (bb));
4715 #endif /* HAVE_return */
4717 /* Generate the prologue and epilogue RTL if the machine supports it. Thread
4718 this into place with notes indicating where the prologue ends and where
4719 the epilogue begins. Update the basic block information when possible. */
4721 static void
4722 thread_prologue_and_epilogue_insns (void)
4724 int inserted = 0;
4725 edge e;
4726 #if defined (HAVE_sibcall_epilogue) || defined (HAVE_epilogue) || defined (HAVE_return) || defined (HAVE_prologue)
4727 rtx seq;
4728 #endif
4729 #if defined (HAVE_epilogue) || defined(HAVE_return)
4730 rtx epilogue_end = NULL_RTX;
4731 #endif
4732 edge_iterator ei;
4734 #ifdef HAVE_prologue
4735 if (HAVE_prologue)
4737 start_sequence ();
4738 seq = gen_prologue ();
4739 emit_insn (seq);
4741 /* Insert an explicit USE for the frame pointer
4742 if the profiling is on and the frame pointer is required. */
4743 if (crtl->profile && frame_pointer_needed)
4744 emit_insn (gen_rtx_USE (VOIDmode, hard_frame_pointer_rtx));
4746 /* Retain a map of the prologue insns. */
4747 record_insns (seq, &prologue);
4748 emit_note (NOTE_INSN_PROLOGUE_END);
4750 #ifndef PROFILE_BEFORE_PROLOGUE
4751 /* Ensure that instructions are not moved into the prologue when
4752 profiling is on. The call to the profiling routine can be
4753 emitted within the live range of a call-clobbered register. */
4754 if (crtl->profile)
4755 emit_insn (gen_blockage ());
4756 #endif
4758 seq = get_insns ();
4759 end_sequence ();
4760 set_insn_locators (seq, prologue_locator);
4762 /* Can't deal with multiple successors of the entry block
4763 at the moment. Function should always have at least one
4764 entry point. */
4765 gcc_assert (single_succ_p (ENTRY_BLOCK_PTR));
4767 insert_insn_on_edge (seq, single_succ_edge (ENTRY_BLOCK_PTR));
4768 inserted = 1;
4770 #endif
4772 /* If the exit block has no non-fake predecessors, we don't need
4773 an epilogue. */
4774 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
4775 if ((e->flags & EDGE_FAKE) == 0)
4776 break;
4777 if (e == NULL)
4778 goto epilogue_done;
4780 #ifdef HAVE_return
4781 if (optimize && HAVE_return)
4783 /* If we're allowed to generate a simple return instruction,
4784 then by definition we don't need a full epilogue. Examine
4785 the block that falls through to EXIT. If it does not
4786 contain any code, examine its predecessors and try to
4787 emit (conditional) return instructions. */
4789 basic_block last;
4790 rtx label;
4792 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
4793 if (e->flags & EDGE_FALLTHRU)
4794 break;
4795 if (e == NULL)
4796 goto epilogue_done;
4797 last = e->src;
4799 /* Verify that there are no active instructions in the last block. */
4800 label = BB_END (last);
4801 while (label && !LABEL_P (label))
4803 if (active_insn_p (label))
4804 break;
4805 label = PREV_INSN (label);
4808 if (BB_HEAD (last) == label && LABEL_P (label))
4810 edge_iterator ei2;
4812 for (ei2 = ei_start (last->preds); (e = ei_safe_edge (ei2)); )
4814 basic_block bb = e->src;
4815 rtx jump;
4817 if (bb == ENTRY_BLOCK_PTR)
4819 ei_next (&ei2);
4820 continue;
4823 jump = BB_END (bb);
4824 if (!JUMP_P (jump) || JUMP_LABEL (jump) != label)
4826 ei_next (&ei2);
4827 continue;
4830 /* If we have an unconditional jump, we can replace that
4831 with a simple return instruction. */
4832 if (simplejump_p (jump))
4834 emit_return_into_block (bb);
4835 delete_insn (jump);
4838 /* If we have a conditional jump, we can try to replace
4839 that with a conditional return instruction. */
4840 else if (condjump_p (jump))
4842 if (! redirect_jump (jump, 0, 0))
4844 ei_next (&ei2);
4845 continue;
4848 /* If this block has only one successor, it both jumps
4849 and falls through to the fallthru block, so we can't
4850 delete the edge. */
4851 if (single_succ_p (bb))
4853 ei_next (&ei2);
4854 continue;
4857 else
4859 ei_next (&ei2);
4860 continue;
4863 /* Fix up the CFG for the successful change we just made. */
4864 redirect_edge_succ (e, EXIT_BLOCK_PTR);
4867 /* Emit a return insn for the exit fallthru block. Whether
4868 this is still reachable will be determined later. */
4870 emit_barrier_after (BB_END (last));
4871 emit_return_into_block (last);
4872 epilogue_end = BB_END (last);
4873 single_succ_edge (last)->flags &= ~EDGE_FALLTHRU;
4874 goto epilogue_done;
4877 #endif
4878 /* Find the edge that falls through to EXIT. Other edges may exist
4879 due to RETURN instructions, but those don't need epilogues.
4880 There really shouldn't be a mixture -- either all should have
4881 been converted or none, however... */
4883 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
4884 if (e->flags & EDGE_FALLTHRU)
4885 break;
4886 if (e == NULL)
4887 goto epilogue_done;
4889 #ifdef HAVE_epilogue
4890 if (HAVE_epilogue)
4892 start_sequence ();
4893 epilogue_end = emit_note (NOTE_INSN_EPILOGUE_BEG);
4894 seq = gen_epilogue ();
4895 emit_jump_insn (seq);
4897 /* Retain a map of the epilogue insns. */
4898 record_insns (seq, &epilogue);
4899 set_insn_locators (seq, epilogue_locator);
4901 seq = get_insns ();
4902 end_sequence ();
4904 insert_insn_on_edge (seq, e);
4905 inserted = 1;
4907 else
4908 #endif
4910 basic_block cur_bb;
4912 if (! next_active_insn (BB_END (e->src)))
4913 goto epilogue_done;
4914 /* We have a fall-through edge to the exit block, the source is not
4915 at the end of the function, and there will be an assembler epilogue
4916 at the end of the function.
4917 We can't use force_nonfallthru here, because that would try to
4918 use return. Inserting a jump 'by hand' is extremely messy, so
4919 we take advantage of cfg_layout_finalize using
4920 fixup_fallthru_exit_predecessor. */
4921 cfg_layout_initialize (0);
4922 FOR_EACH_BB (cur_bb)
4923 if (cur_bb->index >= NUM_FIXED_BLOCKS
4924 && cur_bb->next_bb->index >= NUM_FIXED_BLOCKS)
4925 cur_bb->aux = cur_bb->next_bb;
4926 cfg_layout_finalize ();
4928 epilogue_done:
4930 if (inserted)
4932 commit_edge_insertions ();
4934 /* The epilogue insns we inserted may cause the exit edge to no longer
4935 be fallthru. */
4936 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
4938 if (((e->flags & EDGE_FALLTHRU) != 0)
4939 && returnjump_p (BB_END (e->src)))
4940 e->flags &= ~EDGE_FALLTHRU;
4944 #ifdef HAVE_sibcall_epilogue
4945 /* Emit sibling epilogues before any sibling call sites. */
4946 for (ei = ei_start (EXIT_BLOCK_PTR->preds); (e = ei_safe_edge (ei)); )
4948 basic_block bb = e->src;
4949 rtx insn = BB_END (bb);
4951 if (!CALL_P (insn)
4952 || ! SIBLING_CALL_P (insn))
4954 ei_next (&ei);
4955 continue;
4958 start_sequence ();
4959 emit_insn (gen_sibcall_epilogue ());
4960 seq = get_insns ();
4961 end_sequence ();
4963 /* Retain a map of the epilogue insns. Used in life analysis to
4964 avoid getting rid of sibcall epilogue insns. Do this before we
4965 actually emit the sequence. */
4966 record_insns (seq, &sibcall_epilogue);
4967 set_insn_locators (seq, epilogue_locator);
4969 emit_insn_before (seq, insn);
4970 ei_next (&ei);
4972 #endif
4974 #ifdef HAVE_epilogue
4975 if (epilogue_end)
4977 rtx insn, next;
4979 /* Similarly, move any line notes that appear after the epilogue.
4980 There is no need, however, to be quite so careful about the existence
4981 of such a note. Also possibly move
4982 NOTE_INSN_FUNCTION_BEG notes, as those can be relevant for debug
4983 info generation. */
4984 for (insn = epilogue_end; insn; insn = next)
4986 next = NEXT_INSN (insn);
4987 if (NOTE_P (insn)
4988 && (NOTE_KIND (insn) == NOTE_INSN_FUNCTION_BEG))
4989 reorder_insns (insn, insn, PREV_INSN (epilogue_end));
4992 #endif
4994 /* Threading the prologue and epilogue changes the artificial refs
4995 in the entry and exit blocks. */
4996 epilogue_completed = 1;
4997 df_update_entry_exit_and_calls ();
5000 /* Reposition the prologue-end and epilogue-begin notes after instruction
5001 scheduling and delayed branch scheduling. */
5003 void
5004 reposition_prologue_and_epilogue_notes (void)
5006 #if defined (HAVE_prologue) || defined (HAVE_epilogue)
5007 rtx insn, last, note;
5008 int len;
5010 if ((len = VEC_length (int, prologue)) > 0)
5012 last = 0, note = 0;
5014 /* Scan from the beginning until we reach the last prologue insn.
5015 We apparently can't depend on basic_block_{head,end} after
5016 reorg has run. */
5017 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5019 if (NOTE_P (insn))
5021 if (NOTE_KIND (insn) == NOTE_INSN_PROLOGUE_END)
5022 note = insn;
5024 else if (contains (insn, &prologue))
5026 last = insn;
5027 if (--len == 0)
5028 break;
5032 if (last)
5034 /* Find the prologue-end note if we haven't already, and
5035 move it to just after the last prologue insn. */
5036 if (note == 0)
5038 for (note = last; (note = NEXT_INSN (note));)
5039 if (NOTE_P (note)
5040 && NOTE_KIND (note) == NOTE_INSN_PROLOGUE_END)
5041 break;
5044 /* Avoid placing note between CODE_LABEL and BASIC_BLOCK note. */
5045 if (LABEL_P (last))
5046 last = NEXT_INSN (last);
5047 reorder_insns (note, note, last);
5051 if ((len = VEC_length (int, epilogue)) > 0)
5053 last = 0, note = 0;
5055 /* Scan from the end until we reach the first epilogue insn.
5056 We apparently can't depend on basic_block_{head,end} after
5057 reorg has run. */
5058 for (insn = get_last_insn (); insn; insn = PREV_INSN (insn))
5060 if (NOTE_P (insn))
5062 if (NOTE_KIND (insn) == NOTE_INSN_EPILOGUE_BEG)
5063 note = insn;
5065 else if (contains (insn, &epilogue))
5067 last = insn;
5068 if (--len == 0)
5069 break;
5073 if (last)
5075 /* Find the epilogue-begin note if we haven't already, and
5076 move it to just before the first epilogue insn. */
5077 if (note == 0)
5079 for (note = insn; (note = PREV_INSN (note));)
5080 if (NOTE_P (note)
5081 && NOTE_KIND (note) == NOTE_INSN_EPILOGUE_BEG)
5082 break;
5085 if (PREV_INSN (last) != note)
5086 reorder_insns (note, note, PREV_INSN (last));
5089 #endif /* HAVE_prologue or HAVE_epilogue */
5092 /* Returns the name of the current function. */
5093 const char *
5094 current_function_name (void)
5096 return lang_hooks.decl_printable_name (cfun->decl, 2);
5099 /* Returns the raw (mangled) name of the current function. */
5100 const char *
5101 current_function_assembler_name (void)
5103 return IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (cfun->decl));
5107 /* This recursive function finds and returns the CALL expression inside X,
5108 or NULL_RTX if there is none. */
5108 static rtx
5109 get_call (rtx x)
5111 int i;
5112 rtx call_rtx;
5113 const char *fmt;
5114 enum rtx_code code = GET_CODE (x);
5116 /* A CALL expression is what we are looking for. */
5117 if (code == CALL)
5118 return x;
5120 fmt = GET_RTX_FORMAT (code);
5121 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
5123 if (fmt [i] == 'e')
5125 if ((call_rtx = get_call (XEXP (x, i))) != NULL_RTX)
5126 return call_rtx;
5128 else if (fmt [i] == 'E')
5130 int j;
5132 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
5133 if ((call_rtx = get_call (XVECEXP (x, i, j))) != NULL_RTX)
5134 return call_rtx;
5137 return NULL_RTX;
5140 /* Set REGS to the hard registers that the function called by INSN
5141 may clobber (if CLOBBERED_P) or use. */
5142 void
5143 get_call_invalidated_used_regs (const_rtx insn, HARD_REG_SET *regs,
5144 bool clobbered_p)
5146 rtx x;
5147 struct cgraph_node *node;
5148 tree decl = NULL;
5150 gcc_assert (CALL_P (insn));
5152 x = get_call (PATTERN (insn));
5153 if (x != NULL_RTX)
5155 x = XEXP (x, 0);
5156 gcc_assert (GET_CODE (x) == MEM);
5157 x = XEXP (x, 0);
5158 if (GET_CODE (x) == SYMBOL_REF)
5159 decl = SYMBOL_REF_DECL (x);
5160 if (decl != NULL && TREE_CODE (decl) != FUNCTION_DECL)
5161 decl = NULL;
5163 node = decl == NULL ? NULL : cgraph_node (decl);
5164 if (! flag_ira || ! flag_ira_ipra || node == NULL
5165 /* This is a call of the function itself. We don't know used
5166 registers yet. So take the worst case. */
5167 || node->decl == cfun->decl)
5169 if (clobbered_p)
5170 COPY_HARD_REG_SET (*regs, regs_invalidated_by_call);
5171 else
5172 COPY_HARD_REG_SET (*regs, call_used_reg_set);
5174 else
5176 COPY_HARD_REG_SET (*regs, node->function_used_regs);
5177 if (clobbered_p)
5178 AND_HARD_REG_SET (*regs, regs_invalidated_by_call);
5184 static unsigned int
5185 rest_of_handle_check_leaf_regs (void)
5187 #ifdef LEAF_REGISTERS
5188 current_function_uses_only_leaf_regs
5189 = optimize > 0 && only_leaf_regs_used () && leaf_function_p ();
5190 #endif
5191 return 0;
5194 /* Insert a TYPE into the used types hash table of CFUN. */
5195 static void
5196 used_types_insert_helper (tree type, struct function *func)
5198 if (type != NULL && func != NULL)
5200 void **slot;
5202 if (func->used_types_hash == NULL)
5203 func->used_types_hash = htab_create_ggc (37, htab_hash_pointer,
5204 htab_eq_pointer, NULL);
5205 slot = htab_find_slot (func->used_types_hash, type, INSERT);
5206 if (*slot == NULL)
5207 *slot = type;
5211 /* Given a type, insert it into the used types hash table in cfun. */
5212 void
5213 used_types_insert (tree t)
5215 while (POINTER_TYPE_P (t) || TREE_CODE (t) == ARRAY_TYPE)
5216 t = TREE_TYPE (t);
5217 t = TYPE_MAIN_VARIANT (t);
5218 if (debug_info_level > DINFO_LEVEL_NONE)
5219 used_types_insert_helper (t, cfun);
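/* An illustrative example of the stripping above: for a declaration such as

       const char *names[16];

   the loop peels the array and pointer layers and TYPE_MAIN_VARIANT drops
   the qualifiers, so the type recorded in used_types_hash is plain 'char'
   (and only when debug info is enabled).  */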
5222 struct rtl_opt_pass pass_leaf_regs =
5225 RTL_PASS,
5226 NULL, /* name */
5227 NULL, /* gate */
5228 rest_of_handle_check_leaf_regs, /* execute */
5229 NULL, /* sub */
5230 NULL, /* next */
5231 0, /* static_pass_number */
5232 0, /* tv_id */
5233 0, /* properties_required */
5234 0, /* properties_provided */
5235 0, /* properties_destroyed */
5236 0, /* todo_flags_start */
5237 0 /* todo_flags_finish */
5241 static unsigned int
5242 rest_of_handle_thread_prologue_and_epilogue (void)
5244 if (optimize)
5245 cleanup_cfg (CLEANUP_EXPENSIVE);
5246 /* On some machines, the prologue and epilogue code, or parts thereof,
5247 can be represented as RTL. Doing so lets us schedule insns between
5248 it and the rest of the code and also allows delayed branch
5249 scheduling to operate in the epilogue. */
5251 thread_prologue_and_epilogue_insns ();
5252 return 0;
5255 struct rtl_opt_pass pass_thread_prologue_and_epilogue =
5258 RTL_PASS,
5259 "pro_and_epilogue", /* name */
5260 NULL, /* gate */
5261 rest_of_handle_thread_prologue_and_epilogue, /* execute */
5262 NULL, /* sub */
5263 NULL, /* next */
5264 0, /* static_pass_number */
5265 TV_THREAD_PROLOGUE_AND_EPILOGUE, /* tv_id */
5266 0, /* properties_required */
5267 0, /* properties_provided */
5268 0, /* properties_destroyed */
5269 TODO_verify_flow, /* todo_flags_start */
5270 TODO_dump_func |
5271 TODO_df_verify |
5272 TODO_df_finish | TODO_verify_rtl_sharing |
5273 TODO_ggc_collect /* todo_flags_finish */
5278 /* This mini-pass fixes fall-out from SSA in asm statements that have
5279 in-out constraints. Say you start with
5281 orig = inout;
5282 asm ("": "+mr" (inout));
5283 use (orig);
5285 which is transformed very early to use explicit output and match operands:
5287 orig = inout;
5288 asm ("": "=mr" (inout) : "0" (inout));
5289 use (orig);
5291 Or, after SSA and copyprop,
5293 asm ("": "=mr" (inout_2) : "0" (inout_1));
5294 use (inout_1);
5296 Clearly inout_2 and inout_1 can't be coalesced easily anymore, as
5297 they represent two separate values, so they will get different pseudo
5298 registers during expansion. Then, since the two operands need to match
5299 per the constraints, but use different pseudo registers, reload can
5300 only register a reload for these operands. But reloads can only be
5301 satisfied by hardregs, not by memory, so we need a register for this
5302 reload, just because we are presented with non-matching operands.
5303 So, even though we allow memory for this operand, no memory can be
5304 used for it, just because the two operands don't match. This can
5305 cause reload failures on register-starved targets.
5307 So it's a symptom of reload not being able to use memory for reloads
5308 or, alternatively it's also a symptom of both operands not coming into
5309 reload as matching (in which case the pseudo could go to memory just
5310 fine, as the alternative allows it, and no reload would be necessary).
5311 We fix the latter problem here, by transforming
5313 asm ("": "=mr" (inout_2) : "0" (inout_1));
5315 back to
5317 inout_2 = inout_1;
5318 asm ("": "=mr" (inout_2) : "0" (inout_2)); */
5320 static void
5321 match_asm_constraints_1 (rtx insn, rtx *p_sets, int noutputs)
5323 int i;
5324 bool changed = false;
5325 rtx op = SET_SRC (p_sets[0]);
5326 int ninputs = ASM_OPERANDS_INPUT_LENGTH (op);
5327 rtvec inputs = ASM_OPERANDS_INPUT_VEC (op);
5328 bool *output_matched = alloca (noutputs * sizeof (bool));
5330 memset (output_matched, 0, noutputs * sizeof (bool));
5331 for (i = 0; i < ninputs; i++)
5333 rtx input, output, insns;
5334 const char *constraint = ASM_OPERANDS_INPUT_CONSTRAINT (op, i);
5335 char *end;
5336 int match, j;
5338 match = strtoul (constraint, &end, 10);
5339 if (end == constraint)
5340 continue;
5342 gcc_assert (match < noutputs);
5343 output = SET_DEST (p_sets[match]);
5344 input = RTVEC_ELT (inputs, i);
5345 /* Only do the transformation for pseudos. */
5346 if (! REG_P (output)
5347 || rtx_equal_p (output, input)
5348 || (GET_MODE (input) != VOIDmode
5349 && GET_MODE (input) != GET_MODE (output)))
5350 continue;
5352 /* We can't do anything if the output is also used as input,
5353 as we're going to overwrite it. */
5354 for (j = 0; j < ninputs; j++)
5355 if (reg_overlap_mentioned_p (output, RTVEC_ELT (inputs, j)))
5356 break;
5357 if (j != ninputs)
5358 continue;
5360 /* Avoid changing the same input several times. For
5361 asm ("" : "=mr" (out1), "=mr" (out2) : "0" (in), "1" (in));
5362 only change in once (to out1), rather than changing it
5363 first to out1 and afterwards to out2. */
5364 if (i > 0)
5366 for (j = 0; j < noutputs; j++)
5367 if (output_matched[j] && input == SET_DEST (p_sets[j]))
5368 break;
5369 if (j != noutputs)
5370 continue;
5372 output_matched[match] = true;
5374 start_sequence ();
5375 emit_move_insn (output, input);
5376 insns = get_insns ();
5377 end_sequence ();
5378 emit_insn_before (insns, insn);
5380 /* Now replace all mentions of the input with output. We can't
5381 just replace the occurrence in inputs[i], as the register might
5382 also be used in some other input (or even in an address of an
5383 output), which would mean possibly increasing the number of
5384 inputs by one (namely 'output' in addition), which might pose
5385 too complicated a problem for reload to solve. E.g. this situation:
5387 asm ("" : "=r" (output), "=m" (input) : "0" (input))
5389 Here 'input' is used in two occurrences as input (once for the
5390 input operand, once for the address in the second output operand).
5391 If we replaced only the occurrence of the input operand (to
5392 make the matching) we would be left with this:
5394 output = input
5395 asm ("" : "=r" (output), "=m" (input) : "0" (output))
5397 Now we suddenly have two different input values (containing the same
5398 value, but different pseudos) where we formerly had only one.
5399 With more complicated asms this might lead to reload failures
5400 which wouldn't have happened without this pass. So, iterate over
5401 all operands and replace all occurrences of the register used. */
5402 for (j = 0; j < noutputs; j++)
5403 if (!rtx_equal_p (SET_DEST (p_sets[j]), input)
5404 && reg_overlap_mentioned_p (input, SET_DEST (p_sets[j])))
5405 SET_DEST (p_sets[j]) = replace_rtx (SET_DEST (p_sets[j]),
5406 input, output);
5407 for (j = 0; j < ninputs; j++)
5408 if (reg_overlap_mentioned_p (input, RTVEC_ELT (inputs, j)))
5409 RTVEC_ELT (inputs, j) = replace_rtx (RTVEC_ELT (inputs, j),
5410 input, output);
5412 changed = true;
5415 if (changed)
5416 df_insn_rescan (insn);
5419 static unsigned
5420 rest_of_match_asm_constraints (void)
5422 basic_block bb;
5423 rtx insn, pat, *p_sets;
5424 int noutputs;
5426 if (!crtl->has_asm_statement)
5427 return 0;
5429 df_set_flags (DF_DEFER_INSN_RESCAN);
5430 FOR_EACH_BB (bb)
5432 FOR_BB_INSNS (bb, insn)
5434 if (!INSN_P (insn))
5435 continue;
5437 pat = PATTERN (insn);
5438 if (GET_CODE (pat) == PARALLEL)
5439 p_sets = &XVECEXP (pat, 0, 0), noutputs = XVECLEN (pat, 0);
5440 else if (GET_CODE (pat) == SET)
5441 p_sets = &PATTERN (insn), noutputs = 1;
5442 else
5443 continue;
5445 if (GET_CODE (*p_sets) == SET
5446 && GET_CODE (SET_SRC (*p_sets)) == ASM_OPERANDS)
5447 match_asm_constraints_1 (insn, p_sets, noutputs);
5451 return TODO_df_finish;
5454 struct rtl_opt_pass pass_match_asm_constraints =
5457 RTL_PASS,
5458 "asmcons", /* name */
5459 NULL, /* gate */
5460 rest_of_match_asm_constraints, /* execute */
5461 NULL, /* sub */
5462 NULL, /* next */
5463 0, /* static_pass_number */
5464 0, /* tv_id */
5465 0, /* properties_required */
5466 0, /* properties_provided */
5467 0, /* properties_destroyed */
5468 0, /* todo_flags_start */
5469 TODO_dump_func /* todo_flags_finish */
5474 #include "gt-function.h"