function.c (expand_function_end): Move blockage to just after we emit the label for...
[official-gcc.git] / gcc / function.c
blobf6ebb85589868568524ef94057ae4cef727911c0
1 /* Expands front end tree to back end RTL for GCC.
2 Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997,
3 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007
4 Free Software Foundation, Inc.
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 2, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
21 02110-1301, USA. */
23 /* This file handles the generation of rtl code from tree structure
24 at the level of the function as a whole.
25 It creates the rtl expressions for parameters and auto variables
26 and has full responsibility for allocating stack slots.
28 `expand_function_start' is called at the beginning of a function,
29 before the function body is parsed, and `expand_function_end' is
30 called after parsing the body.
32 Call `assign_stack_local' to allocate a stack slot for a local variable.
33 This is usually done during the RTL generation for the function body,
34 but it can also be done in the reload pass when a pseudo-register does
35 not get a hard register. */
37 #include "config.h"
38 #include "system.h"
39 #include "coretypes.h"
40 #include "tm.h"
41 #include "rtl.h"
42 #include "tree.h"
43 #include "flags.h"
44 #include "except.h"
45 #include "function.h"
46 #include "expr.h"
47 #include "optabs.h"
48 #include "libfuncs.h"
49 #include "regs.h"
50 #include "hard-reg-set.h"
51 #include "insn-config.h"
52 #include "recog.h"
53 #include "output.h"
54 #include "basic-block.h"
55 #include "toplev.h"
56 #include "hashtab.h"
57 #include "ggc.h"
58 #include "tm_p.h"
59 #include "integrate.h"
60 #include "langhooks.h"
61 #include "target.h"
62 #include "cfglayout.h"
63 #include "tree-gimple.h"
64 #include "tree-pass.h"
65 #include "predict.h"
66 #include "vecprim.h"
/* Default: the target does not adjust the alignment of local objects.  */
#ifndef LOCAL_ALIGNMENT
#define LOCAL_ALIGNMENT(TYPE, ALIGNMENT) ALIGNMENT
#endif

/* Default: requests to align stack slots are always honored.  */
#ifndef STACK_ALIGNMENT_NEEDED
#define STACK_ALIGNMENT_NEEDED 1
#endif

/* The stack boundary expressed in units rather than bits.  */
#define STACK_BYTES (STACK_BOUNDARY / BITS_PER_UNIT)

/* Some systems use __main in a way incompatible with its use in gcc, in these
   cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
   give the same symbol without quotes for an alternative entry point.  You
   must define both, or neither.  */
#ifndef NAME__MAIN
#define NAME__MAIN "__main"
#endif

/* Round VALUE down to a multiple of ALIGN.  Division is avoided in case
   VALUE is negative.  ALIGN must be a power of two.  Both arguments are
   evaluated more than once across these two macros, so they must be free
   of side effects.  */
#define FLOOR_ROUND(VALUE,ALIGN) ((VALUE) & ~((ALIGN) - 1))

/* Similar, but round VALUE up to the next multiple of ALIGN (VALUE itself
   when it is already a multiple).  */
#define CEIL_ROUND(VALUE,ALIGN) (((VALUE) + (ALIGN) - 1) & ~((ALIGN)- 1))
95 /* Nonzero if function being compiled doesn't contain any calls
96 (ignoring the prologue and epilogue). This is set prior to
97 local register allocation and is valid for the remaining
98 compiler passes. */
99 int current_function_is_leaf;
101 /* Nonzero if function being compiled doesn't modify the stack pointer
102 (ignoring the prologue and epilogue). This is only valid after
103 life_analysis has run. */
104 int current_function_sp_is_unchanging;
106 /* Nonzero if the function being compiled is a leaf function which only
107 uses leaf registers. This is valid after reload (specifically after
108 sched2) and is useful only if the port defines LEAF_REGISTERS. */
109 int current_function_uses_only_leaf_regs;
111 /* Nonzero once virtual register instantiation has been done.
112 assign_stack_local uses frame_pointer_rtx when this is nonzero.
113 calls.c:emit_library_call_value_1 uses it to set up
114 post-instantiation libcalls. */
115 int virtuals_instantiated;
117 /* Assign unique numbers to labels generated for profiling, debugging, etc. */
118 static GTY(()) int funcdef_no;
120 /* These variables hold pointers to functions to create and destroy
121 target specific, per-function data structures. */
122 struct machine_function * (*init_machine_status) (void);
124 /* The currently compiled function. */
125 struct function *cfun = 0;
127 /* These arrays record the INSN_UIDs of the prologue and epilogue insns. */
128 static VEC(int,heap) *prologue;
129 static VEC(int,heap) *epilogue;
131 /* Array of INSN_UIDs to hold the INSN_UIDs for each sibcall epilogue
132 in this function. */
133 static VEC(int,heap) *sibcall_epilogue;
135 /* In order to evaluate some expressions, such as function calls returning
136 structures in memory, we need to temporarily allocate stack locations.
137 We record each allocated temporary in the following structure.
139 Associated with each temporary slot is a nesting level. When we pop up
140 one level, all temporaries associated with the previous level are freed.
141 Normally, all temporaries are freed after the execution of the statement
142 in which they were created. However, if we are inside a ({...}) grouping,
143 the result may be in a temporary and hence must be preserved. If the
144 result could be in a temporary, we preserve it if we can determine which
145 one it is in. If we cannot determine which temporary may contain the
146 result, all temporaries are preserved. A temporary is preserved by
147 pretending it was allocated at the previous nesting level.
149 Automatic variables are also assigned temporary slots, at the nesting
150 level where they are defined. They are marked a "kept" so that
151 free_temp_slots will not free them. */
153 struct temp_slot GTY(())
155 /* Points to next temporary slot. */
156 struct temp_slot *next;
157 /* Points to previous temporary slot. */
158 struct temp_slot *prev;
160 /* The rtx to used to reference the slot. */
161 rtx slot;
162 /* The rtx used to represent the address if not the address of the
163 slot above. May be an EXPR_LIST if multiple addresses exist. */
164 rtx address;
165 /* The alignment (in bits) of the slot. */
166 unsigned int align;
167 /* The size, in units, of the slot. */
168 HOST_WIDE_INT size;
169 /* The type of the object in the slot, or zero if it doesn't correspond
170 to a type. We use this to determine whether a slot can be reused.
171 It can be reused if objects of the type of the new slot will always
172 conflict with objects of the type of the old slot. */
173 tree type;
174 /* Nonzero if this temporary is currently in use. */
175 char in_use;
176 /* Nonzero if this temporary has its address taken. */
177 char addr_taken;
178 /* Nesting level at which this slot is being used. */
179 int level;
180 /* Nonzero if this should survive a call to free_temp_slots. */
181 int keep;
182 /* The offset of the slot from the frame_pointer, including extra space
183 for alignment. This info is for combine_temp_slots. */
184 HOST_WIDE_INT base_offset;
185 /* The size of the slot, including extra space for alignment. This
186 info is for combine_temp_slots. */
187 HOST_WIDE_INT full_size;
190 /* Forward declarations. */
192 static rtx assign_stack_local_1 (enum machine_mode, HOST_WIDE_INT, int,
193 struct function *);
194 static struct temp_slot *find_temp_slot_from_address (rtx);
195 static void pad_to_arg_alignment (struct args_size *, int, struct args_size *);
196 static void pad_below (struct args_size *, enum machine_mode, tree);
197 static void reorder_blocks_1 (rtx, tree, VEC(tree,heap) **);
198 static int all_blocks (tree, tree *);
199 static tree *get_block_vector (tree, int *);
200 extern tree debug_find_var_in_block_tree (tree, tree);
201 /* We always define `record_insns' even if it's not used so that we
202 can always export `prologue_epilogue_contains'. */
203 static void record_insns (rtx, VEC(int,heap) **) ATTRIBUTE_UNUSED;
204 static int contains (rtx, VEC(int,heap) **);
205 #ifdef HAVE_return
206 static void emit_return_into_block (basic_block);
207 #endif
208 #if defined(HAVE_epilogue) && defined(INCOMING_RETURN_ADDR_RTX)
209 static rtx keep_stack_depressed (rtx);
210 #endif
211 static void prepare_function_start (tree);
212 static void do_clobber_return_reg (rtx, void *);
213 static void do_use_return_reg (rtx, void *);
214 static void set_insn_locators (rtx, int) ATTRIBUTE_UNUSED;
216 /* Pointer to chain of `struct function' for containing functions. */
217 struct function *outer_function_chain;
219 /* Given a function decl for a containing function,
220 return the `struct function' for it. */
222 struct function *
223 find_function_data (tree decl)
225 struct function *p;
227 for (p = outer_function_chain; p; p = p->outer)
228 if (p->decl == decl)
229 return p;
231 gcc_unreachable ();
234 /* Save the current context for compilation of a nested function.
235 This is called from language-specific code. The caller should use
236 the enter_nested langhook to save any language-specific state,
237 since this function knows only about language-independent
238 variables. */
240 void
241 push_function_context_to (tree context ATTRIBUTE_UNUSED)
243 struct function *p;
245 if (cfun == 0)
246 init_dummy_function_start ();
247 p = cfun;
249 p->outer = outer_function_chain;
250 outer_function_chain = p;
252 lang_hooks.function.enter_nested (p);
254 cfun = 0;
257 void
258 push_function_context (void)
260 push_function_context_to (current_function_decl);
263 /* Restore the last saved context, at the end of a nested function.
264 This function is called from language-specific code. */
266 void
267 pop_function_context_from (tree context ATTRIBUTE_UNUSED)
269 struct function *p = outer_function_chain;
271 cfun = p;
272 outer_function_chain = p->outer;
274 current_function_decl = p->decl;
276 lang_hooks.function.leave_nested (p);
278 /* Reset variables that have known state during rtx generation. */
279 virtuals_instantiated = 0;
280 generating_concat_p = 1;
283 void
284 pop_function_context (void)
286 pop_function_context_from (current_function_decl);
289 /* Clear out all parts of the state in F that can safely be discarded
290 after the function has been parsed, but not compiled, to let
291 garbage collection reclaim the memory. */
293 void
294 free_after_parsing (struct function *f)
296 /* f->expr->forced_labels is used by code generation. */
297 /* f->emit->regno_reg_rtx is used by code generation. */
298 /* f->varasm is used by code generation. */
299 /* f->eh->eh_return_stub_label is used by code generation. */
301 lang_hooks.function.final (f);
304 /* Clear out all parts of the state in F that can safely be discarded
305 after the function has been compiled, to let garbage collection
306 reclaim the memory. */
308 void
309 free_after_compilation (struct function *f)
311 VEC_free (int, heap, prologue);
312 VEC_free (int, heap, epilogue);
313 VEC_free (int, heap, sibcall_epilogue);
315 f->eh = NULL;
316 f->expr = NULL;
317 f->emit = NULL;
318 f->varasm = NULL;
319 f->machine = NULL;
320 f->cfg = NULL;
322 f->x_avail_temp_slots = NULL;
323 f->x_used_temp_slots = NULL;
324 f->arg_offset_rtx = NULL;
325 f->return_rtx = NULL;
326 f->internal_arg_pointer = NULL;
327 f->x_nonlocal_goto_handler_labels = NULL;
328 f->x_return_label = NULL;
329 f->x_naked_return_label = NULL;
330 f->x_stack_slot_list = NULL;
331 f->x_stack_check_probe_note = NULL;
332 f->x_arg_pointer_save_area = NULL;
333 f->x_parm_birth_insn = NULL;
334 f->epilogue_delay_list = NULL;
337 /* Allocate fixed slots in the stack frame of the current function. */
339 /* Return size needed for stack frame based on slots so far allocated in
340 function F.
341 This size counts from zero. It is not rounded to PREFERRED_STACK_BOUNDARY;
342 the caller may have to do that. */
344 static HOST_WIDE_INT
345 get_func_frame_size (struct function *f)
347 if (FRAME_GROWS_DOWNWARD)
348 return -f->x_frame_offset;
349 else
350 return f->x_frame_offset;
353 /* Return size needed for stack frame based on slots so far allocated.
354 This size counts from zero. It is not rounded to PREFERRED_STACK_BOUNDARY;
355 the caller may have to do that. */
357 HOST_WIDE_INT
358 get_frame_size (void)
360 return get_func_frame_size (cfun);
363 /* Issue an error message and return TRUE if frame OFFSET overflows in
364 the signed target pointer arithmetics for function FUNC. Otherwise
365 return FALSE. */
367 bool
368 frame_offset_overflow (HOST_WIDE_INT offset, tree func)
370 unsigned HOST_WIDE_INT size = FRAME_GROWS_DOWNWARD ? -offset : offset;
372 if (size > ((unsigned HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (Pmode) - 1))
373 /* Leave room for the fixed part of the frame. */
374 - 64 * UNITS_PER_WORD)
376 error ("%Jtotal size of local objects too large", func);
377 return TRUE;
380 return FALSE;
383 /* Allocate a stack slot of SIZE bytes and return a MEM rtx for it
384 with machine mode MODE.
386 ALIGN controls the amount of alignment for the address of the slot:
387 0 means according to MODE,
388 -1 means use BIGGEST_ALIGNMENT and round size to multiple of that,
389 -2 means use BITS_PER_UNIT,
390 positive specifies alignment boundary in bits.
392 We do not round to stack_boundary here.
394 FUNCTION specifies the function to allocate in. */
396 static rtx
397 assign_stack_local_1 (enum machine_mode mode, HOST_WIDE_INT size, int align,
398 struct function *function)
400 rtx x, addr;
401 int bigend_correction = 0;
402 unsigned int alignment;
403 int frame_off, frame_alignment, frame_phase;
405 if (align == 0)
407 tree type;
409 if (mode == BLKmode)
410 alignment = BIGGEST_ALIGNMENT;
411 else
412 alignment = GET_MODE_ALIGNMENT (mode);
414 /* Allow the target to (possibly) increase the alignment of this
415 stack slot. */
416 type = lang_hooks.types.type_for_mode (mode, 0);
417 if (type)
418 alignment = LOCAL_ALIGNMENT (type, alignment);
420 alignment /= BITS_PER_UNIT;
422 else if (align == -1)
424 alignment = BIGGEST_ALIGNMENT / BITS_PER_UNIT;
425 size = CEIL_ROUND (size, alignment);
427 else if (align == -2)
428 alignment = 1; /* BITS_PER_UNIT / BITS_PER_UNIT */
429 else
430 alignment = align / BITS_PER_UNIT;
432 if (FRAME_GROWS_DOWNWARD)
433 function->x_frame_offset -= size;
435 /* Ignore alignment we can't do with expected alignment of the boundary. */
436 if (alignment * BITS_PER_UNIT > PREFERRED_STACK_BOUNDARY)
437 alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
439 if (function->stack_alignment_needed < alignment * BITS_PER_UNIT)
440 function->stack_alignment_needed = alignment * BITS_PER_UNIT;
442 /* Calculate how many bytes the start of local variables is off from
443 stack alignment. */
444 frame_alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
445 frame_off = STARTING_FRAME_OFFSET % frame_alignment;
446 frame_phase = frame_off ? frame_alignment - frame_off : 0;
448 /* Round the frame offset to the specified alignment. The default is
449 to always honor requests to align the stack but a port may choose to
450 do its own stack alignment by defining STACK_ALIGNMENT_NEEDED. */
451 if (STACK_ALIGNMENT_NEEDED
452 || mode != BLKmode
453 || size != 0)
455 /* We must be careful here, since FRAME_OFFSET might be negative and
456 division with a negative dividend isn't as well defined as we might
457 like. So we instead assume that ALIGNMENT is a power of two and
458 use logical operations which are unambiguous. */
459 if (FRAME_GROWS_DOWNWARD)
460 function->x_frame_offset
461 = (FLOOR_ROUND (function->x_frame_offset - frame_phase,
462 (unsigned HOST_WIDE_INT) alignment)
463 + frame_phase);
464 else
465 function->x_frame_offset
466 = (CEIL_ROUND (function->x_frame_offset - frame_phase,
467 (unsigned HOST_WIDE_INT) alignment)
468 + frame_phase);
471 /* On a big-endian machine, if we are allocating more space than we will use,
472 use the least significant bytes of those that are allocated. */
473 if (BYTES_BIG_ENDIAN && mode != BLKmode && GET_MODE_SIZE (mode) < size)
474 bigend_correction = size - GET_MODE_SIZE (mode);
476 /* If we have already instantiated virtual registers, return the actual
477 address relative to the frame pointer. */
478 if (function == cfun && virtuals_instantiated)
479 addr = plus_constant (frame_pointer_rtx,
480 trunc_int_for_mode
481 (frame_offset + bigend_correction
482 + STARTING_FRAME_OFFSET, Pmode));
483 else
484 addr = plus_constant (virtual_stack_vars_rtx,
485 trunc_int_for_mode
486 (function->x_frame_offset + bigend_correction,
487 Pmode));
489 if (!FRAME_GROWS_DOWNWARD)
490 function->x_frame_offset += size;
492 x = gen_rtx_MEM (mode, addr);
493 MEM_NOTRAP_P (x) = 1;
495 function->x_stack_slot_list
496 = gen_rtx_EXPR_LIST (VOIDmode, x, function->x_stack_slot_list);
498 if (frame_offset_overflow (function->x_frame_offset, function->decl))
499 function->x_frame_offset = 0;
501 return x;
504 /* Wrapper around assign_stack_local_1; assign a local stack slot for the
505 current function. */
508 assign_stack_local (enum machine_mode mode, HOST_WIDE_INT size, int align)
510 return assign_stack_local_1 (mode, size, align, cfun);
514 /* Removes temporary slot TEMP from LIST. */
516 static void
517 cut_slot_from_list (struct temp_slot *temp, struct temp_slot **list)
519 if (temp->next)
520 temp->next->prev = temp->prev;
521 if (temp->prev)
522 temp->prev->next = temp->next;
523 else
524 *list = temp->next;
526 temp->prev = temp->next = NULL;
529 /* Inserts temporary slot TEMP to LIST. */
531 static void
532 insert_slot_to_list (struct temp_slot *temp, struct temp_slot **list)
534 temp->next = *list;
535 if (*list)
536 (*list)->prev = temp;
537 temp->prev = NULL;
538 *list = temp;
541 /* Returns the list of used temp slots at LEVEL. */
543 static struct temp_slot **
544 temp_slots_at_level (int level)
546 if (level >= (int) VEC_length (temp_slot_p, used_temp_slots))
547 VEC_safe_grow_cleared (temp_slot_p, gc, used_temp_slots, level + 1);
549 return &(VEC_address (temp_slot_p, used_temp_slots)[level]);
552 /* Returns the maximal temporary slot level. */
554 static int
555 max_slot_level (void)
557 if (!used_temp_slots)
558 return -1;
560 return VEC_length (temp_slot_p, used_temp_slots) - 1;
563 /* Moves temporary slot TEMP to LEVEL. */
565 static void
566 move_slot_to_level (struct temp_slot *temp, int level)
568 cut_slot_from_list (temp, temp_slots_at_level (temp->level));
569 insert_slot_to_list (temp, temp_slots_at_level (level));
570 temp->level = level;
573 /* Make temporary slot TEMP available. */
575 static void
576 make_slot_available (struct temp_slot *temp)
578 cut_slot_from_list (temp, temp_slots_at_level (temp->level));
579 insert_slot_to_list (temp, &avail_temp_slots);
580 temp->in_use = 0;
581 temp->level = -1;
584 /* Allocate a temporary stack slot and record it for possible later
585 reuse.
587 MODE is the machine mode to be given to the returned rtx.
589 SIZE is the size in units of the space required. We do no rounding here
590 since assign_stack_local will do any required rounding.
592 KEEP is 1 if this slot is to be retained after a call to
593 free_temp_slots. Automatic variables for a block are allocated
594 with this flag. KEEP values of 2 or 3 were needed respectively
595 for variables whose lifetime is controlled by CLEANUP_POINT_EXPRs
596 or for SAVE_EXPRs, but they are now unused.
598 TYPE is the type that will be used for the stack slot. */
601 assign_stack_temp_for_type (enum machine_mode mode, HOST_WIDE_INT size,
602 int keep, tree type)
604 unsigned int align;
605 struct temp_slot *p, *best_p = 0, *selected = NULL, **pp;
606 rtx slot;
608 /* If SIZE is -1 it means that somebody tried to allocate a temporary
609 of a variable size. */
610 gcc_assert (size != -1);
612 /* These are now unused. */
613 gcc_assert (keep <= 1);
615 if (mode == BLKmode)
616 align = BIGGEST_ALIGNMENT;
617 else
618 align = GET_MODE_ALIGNMENT (mode);
620 if (! type)
621 type = lang_hooks.types.type_for_mode (mode, 0);
623 if (type)
624 align = LOCAL_ALIGNMENT (type, align);
626 /* Try to find an available, already-allocated temporary of the proper
627 mode which meets the size and alignment requirements. Choose the
628 smallest one with the closest alignment.
630 If assign_stack_temp is called outside of the tree->rtl expansion,
631 we cannot reuse the stack slots (that may still refer to
632 VIRTUAL_STACK_VARS_REGNUM). */
633 if (!virtuals_instantiated)
635 for (p = avail_temp_slots; p; p = p->next)
637 if (p->align >= align && p->size >= size
638 && GET_MODE (p->slot) == mode
639 && objects_must_conflict_p (p->type, type)
640 && (best_p == 0 || best_p->size > p->size
641 || (best_p->size == p->size && best_p->align > p->align)))
643 if (p->align == align && p->size == size)
645 selected = p;
646 cut_slot_from_list (selected, &avail_temp_slots);
647 best_p = 0;
648 break;
650 best_p = p;
655 /* Make our best, if any, the one to use. */
656 if (best_p)
658 selected = best_p;
659 cut_slot_from_list (selected, &avail_temp_slots);
661 /* If there are enough aligned bytes left over, make them into a new
662 temp_slot so that the extra bytes don't get wasted. Do this only
663 for BLKmode slots, so that we can be sure of the alignment. */
664 if (GET_MODE (best_p->slot) == BLKmode)
666 int alignment = best_p->align / BITS_PER_UNIT;
667 HOST_WIDE_INT rounded_size = CEIL_ROUND (size, alignment);
669 if (best_p->size - rounded_size >= alignment)
671 p = ggc_alloc (sizeof (struct temp_slot));
672 p->in_use = p->addr_taken = 0;
673 p->size = best_p->size - rounded_size;
674 p->base_offset = best_p->base_offset + rounded_size;
675 p->full_size = best_p->full_size - rounded_size;
676 p->slot = adjust_address_nv (best_p->slot, BLKmode, rounded_size);
677 p->align = best_p->align;
678 p->address = 0;
679 p->type = best_p->type;
680 insert_slot_to_list (p, &avail_temp_slots);
682 stack_slot_list = gen_rtx_EXPR_LIST (VOIDmode, p->slot,
683 stack_slot_list);
685 best_p->size = rounded_size;
686 best_p->full_size = rounded_size;
691 /* If we still didn't find one, make a new temporary. */
692 if (selected == 0)
694 HOST_WIDE_INT frame_offset_old = frame_offset;
696 p = ggc_alloc (sizeof (struct temp_slot));
698 /* We are passing an explicit alignment request to assign_stack_local.
699 One side effect of that is assign_stack_local will not round SIZE
700 to ensure the frame offset remains suitably aligned.
702 So for requests which depended on the rounding of SIZE, we go ahead
703 and round it now. We also make sure ALIGNMENT is at least
704 BIGGEST_ALIGNMENT. */
705 gcc_assert (mode != BLKmode || align == BIGGEST_ALIGNMENT);
706 p->slot = assign_stack_local (mode,
707 (mode == BLKmode
708 ? CEIL_ROUND (size, (int) align / BITS_PER_UNIT)
709 : size),
710 align);
712 p->align = align;
714 /* The following slot size computation is necessary because we don't
715 know the actual size of the temporary slot until assign_stack_local
716 has performed all the frame alignment and size rounding for the
717 requested temporary. Note that extra space added for alignment
718 can be either above or below this stack slot depending on which
719 way the frame grows. We include the extra space if and only if it
720 is above this slot. */
721 if (FRAME_GROWS_DOWNWARD)
722 p->size = frame_offset_old - frame_offset;
723 else
724 p->size = size;
726 /* Now define the fields used by combine_temp_slots. */
727 if (FRAME_GROWS_DOWNWARD)
729 p->base_offset = frame_offset;
730 p->full_size = frame_offset_old - frame_offset;
732 else
734 p->base_offset = frame_offset_old;
735 p->full_size = frame_offset - frame_offset_old;
737 p->address = 0;
739 selected = p;
742 p = selected;
743 p->in_use = 1;
744 p->addr_taken = 0;
745 p->type = type;
746 p->level = temp_slot_level;
747 p->keep = keep;
749 pp = temp_slots_at_level (p->level);
750 insert_slot_to_list (p, pp);
752 /* Create a new MEM rtx to avoid clobbering MEM flags of old slots. */
753 slot = gen_rtx_MEM (mode, XEXP (p->slot, 0));
754 stack_slot_list = gen_rtx_EXPR_LIST (VOIDmode, slot, stack_slot_list);
756 /* If we know the alias set for the memory that will be used, use
757 it. If there's no TYPE, then we don't know anything about the
758 alias set for the memory. */
759 set_mem_alias_set (slot, type ? get_alias_set (type) : 0);
760 set_mem_align (slot, align);
762 /* If a type is specified, set the relevant flags. */
763 if (type != 0)
765 MEM_VOLATILE_P (slot) = TYPE_VOLATILE (type);
766 MEM_SET_IN_STRUCT_P (slot, (AGGREGATE_TYPE_P (type)
767 || TREE_CODE (type) == COMPLEX_TYPE));
769 MEM_NOTRAP_P (slot) = 1;
771 return slot;
774 /* Allocate a temporary stack slot and record it for possible later
775 reuse. First three arguments are same as in preceding function. */
778 assign_stack_temp (enum machine_mode mode, HOST_WIDE_INT size, int keep)
780 return assign_stack_temp_for_type (mode, size, keep, NULL_TREE);
783 /* Assign a temporary.
784 If TYPE_OR_DECL is a decl, then we are doing it on behalf of the decl
785 and so that should be used in error messages. In either case, we
786 allocate of the given type.
787 KEEP is as for assign_stack_temp.
788 MEMORY_REQUIRED is 1 if the result must be addressable stack memory;
789 it is 0 if a register is OK.
790 DONT_PROMOTE is 1 if we should not promote values in register
791 to wider modes. */
794 assign_temp (tree type_or_decl, int keep, int memory_required,
795 int dont_promote ATTRIBUTE_UNUSED)
797 tree type, decl;
798 enum machine_mode mode;
799 #ifdef PROMOTE_MODE
800 int unsignedp;
801 #endif
803 if (DECL_P (type_or_decl))
804 decl = type_or_decl, type = TREE_TYPE (decl);
805 else
806 decl = NULL, type = type_or_decl;
808 mode = TYPE_MODE (type);
809 #ifdef PROMOTE_MODE
810 unsignedp = TYPE_UNSIGNED (type);
811 #endif
813 if (mode == BLKmode || memory_required)
815 HOST_WIDE_INT size = int_size_in_bytes (type);
816 rtx tmp;
818 /* Zero sized arrays are GNU C extension. Set size to 1 to avoid
819 problems with allocating the stack space. */
820 if (size == 0)
821 size = 1;
823 /* Unfortunately, we don't yet know how to allocate variable-sized
824 temporaries. However, sometimes we can find a fixed upper limit on
825 the size, so try that instead. */
826 else if (size == -1)
827 size = max_int_size_in_bytes (type);
829 /* The size of the temporary may be too large to fit into an integer. */
830 /* ??? Not sure this should happen except for user silliness, so limit
831 this to things that aren't compiler-generated temporaries. The
832 rest of the time we'll die in assign_stack_temp_for_type. */
833 if (decl && size == -1
834 && TREE_CODE (TYPE_SIZE_UNIT (type)) == INTEGER_CST)
836 error ("size of variable %q+D is too large", decl);
837 size = 1;
840 tmp = assign_stack_temp_for_type (mode, size, keep, type);
841 return tmp;
844 #ifdef PROMOTE_MODE
845 if (! dont_promote)
846 mode = promote_mode (type, mode, &unsignedp, 0);
847 #endif
849 return gen_reg_rtx (mode);
852 /* Combine temporary stack slots which are adjacent on the stack.
854 This allows for better use of already allocated stack space. This is only
855 done for BLKmode slots because we can be sure that we won't have alignment
856 problems in this case. */
858 static void
859 combine_temp_slots (void)
861 struct temp_slot *p, *q, *next, *next_q;
862 int num_slots;
864 /* We can't combine slots, because the information about which slot
865 is in which alias set will be lost. */
866 if (flag_strict_aliasing)
867 return;
869 /* If there are a lot of temp slots, don't do anything unless
870 high levels of optimization. */
871 if (! flag_expensive_optimizations)
872 for (p = avail_temp_slots, num_slots = 0; p; p = p->next, num_slots++)
873 if (num_slots > 100 || (num_slots > 10 && optimize == 0))
874 return;
876 for (p = avail_temp_slots; p; p = next)
878 int delete_p = 0;
880 next = p->next;
882 if (GET_MODE (p->slot) != BLKmode)
883 continue;
885 for (q = p->next; q; q = next_q)
887 int delete_q = 0;
889 next_q = q->next;
891 if (GET_MODE (q->slot) != BLKmode)
892 continue;
894 if (p->base_offset + p->full_size == q->base_offset)
896 /* Q comes after P; combine Q into P. */
897 p->size += q->size;
898 p->full_size += q->full_size;
899 delete_q = 1;
901 else if (q->base_offset + q->full_size == p->base_offset)
903 /* P comes after Q; combine P into Q. */
904 q->size += p->size;
905 q->full_size += p->full_size;
906 delete_p = 1;
907 break;
909 if (delete_q)
910 cut_slot_from_list (q, &avail_temp_slots);
913 /* Either delete P or advance past it. */
914 if (delete_p)
915 cut_slot_from_list (p, &avail_temp_slots);
919 /* Find the temp slot corresponding to the object at address X. */
921 static struct temp_slot *
922 find_temp_slot_from_address (rtx x)
924 struct temp_slot *p;
925 rtx next;
926 int i;
928 for (i = max_slot_level (); i >= 0; i--)
929 for (p = *temp_slots_at_level (i); p; p = p->next)
931 if (XEXP (p->slot, 0) == x
932 || p->address == x
933 || (GET_CODE (x) == PLUS
934 && XEXP (x, 0) == virtual_stack_vars_rtx
935 && GET_CODE (XEXP (x, 1)) == CONST_INT
936 && INTVAL (XEXP (x, 1)) >= p->base_offset
937 && INTVAL (XEXP (x, 1)) < p->base_offset + p->full_size))
938 return p;
940 else if (p->address != 0 && GET_CODE (p->address) == EXPR_LIST)
941 for (next = p->address; next; next = XEXP (next, 1))
942 if (XEXP (next, 0) == x)
943 return p;
946 /* If we have a sum involving a register, see if it points to a temp
947 slot. */
948 if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 0))
949 && (p = find_temp_slot_from_address (XEXP (x, 0))) != 0)
950 return p;
951 else if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 1))
952 && (p = find_temp_slot_from_address (XEXP (x, 1))) != 0)
953 return p;
955 return 0;
958 /* Indicate that NEW is an alternate way of referring to the temp slot
959 that previously was known by OLD. */
961 void
962 update_temp_slot_address (rtx old, rtx new)
964 struct temp_slot *p;
966 if (rtx_equal_p (old, new))
967 return;
969 p = find_temp_slot_from_address (old);
971 /* If we didn't find one, see if both OLD is a PLUS. If so, and NEW
972 is a register, see if one operand of the PLUS is a temporary
973 location. If so, NEW points into it. Otherwise, if both OLD and
974 NEW are a PLUS and if there is a register in common between them.
975 If so, try a recursive call on those values. */
976 if (p == 0)
978 if (GET_CODE (old) != PLUS)
979 return;
981 if (REG_P (new))
983 update_temp_slot_address (XEXP (old, 0), new);
984 update_temp_slot_address (XEXP (old, 1), new);
985 return;
987 else if (GET_CODE (new) != PLUS)
988 return;
990 if (rtx_equal_p (XEXP (old, 0), XEXP (new, 0)))
991 update_temp_slot_address (XEXP (old, 1), XEXP (new, 1));
992 else if (rtx_equal_p (XEXP (old, 1), XEXP (new, 0)))
993 update_temp_slot_address (XEXP (old, 0), XEXP (new, 1));
994 else if (rtx_equal_p (XEXP (old, 0), XEXP (new, 1)))
995 update_temp_slot_address (XEXP (old, 1), XEXP (new, 0));
996 else if (rtx_equal_p (XEXP (old, 1), XEXP (new, 1)))
997 update_temp_slot_address (XEXP (old, 0), XEXP (new, 0));
999 return;
1002 /* Otherwise add an alias for the temp's address. */
1003 else if (p->address == 0)
1004 p->address = new;
1005 else
1007 if (GET_CODE (p->address) != EXPR_LIST)
1008 p->address = gen_rtx_EXPR_LIST (VOIDmode, p->address, NULL_RTX);
1010 p->address = gen_rtx_EXPR_LIST (VOIDmode, new, p->address);
1014 /* If X could be a reference to a temporary slot, mark the fact that its
1015 address was taken. */
1017 void
1018 mark_temp_addr_taken (rtx x)
1020 struct temp_slot *p;
1022 if (x == 0)
1023 return;
1025 /* If X is not in memory or is at a constant address, it cannot be in
1026 a temporary slot. */
1027 if (!MEM_P (x) || CONSTANT_P (XEXP (x, 0)))
1028 return;
1030 p = find_temp_slot_from_address (XEXP (x, 0));
1031 if (p != 0)
1032 p->addr_taken = 1;
1035 /* If X could be a reference to a temporary slot, mark that slot as
1036 belonging to the to one level higher than the current level. If X
1037 matched one of our slots, just mark that one. Otherwise, we can't
1038 easily predict which it is, so upgrade all of them. Kept slots
1039 need not be touched.
1041 This is called when an ({...}) construct occurs and a statement
1042 returns a value in memory. */
1044 void
1045 preserve_temp_slots (rtx x)
1047 struct temp_slot *p = 0, *next;
1049 /* If there is no result, we still might have some objects whose address
1050 were taken, so we need to make sure they stay around. */
1051 if (x == 0)
1053 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1055 next = p->next;
1057 if (p->addr_taken)
1058 move_slot_to_level (p, temp_slot_level - 1);
1061 return;
1064 /* If X is a register that is being used as a pointer, see if we have
1065 a temporary slot we know it points to. To be consistent with
1066 the code below, we really should preserve all non-kept slots
1067 if we can't find a match, but that seems to be much too costly. */
1068 if (REG_P (x) && REG_POINTER (x))
1069 p = find_temp_slot_from_address (x);
1071 /* If X is not in memory or is at a constant address, it cannot be in
1072 a temporary slot, but it can contain something whose address was
1073 taken. */
1074 if (p == 0 && (!MEM_P (x) || CONSTANT_P (XEXP (x, 0))))
1076 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1078 next = p->next;
1080 if (p->addr_taken)
1081 move_slot_to_level (p, temp_slot_level - 1);
1084 return;
1087 /* First see if we can find a match. */
1088 if (p == 0)
1089 p = find_temp_slot_from_address (XEXP (x, 0));
1091 if (p != 0)
1093 /* Move everything at our level whose address was taken to our new
1094 level in case we used its address. */
1095 struct temp_slot *q;
1097 if (p->level == temp_slot_level)
1099 for (q = *temp_slots_at_level (temp_slot_level); q; q = next)
1101 next = q->next;
1103 if (p != q && q->addr_taken)
1104 move_slot_to_level (q, temp_slot_level - 1);
1107 move_slot_to_level (p, temp_slot_level - 1);
1108 p->addr_taken = 0;
1110 return;
1113 /* Otherwise, preserve all non-kept slots at this level. */
1114 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1116 next = p->next;
1118 if (!p->keep)
1119 move_slot_to_level (p, temp_slot_level - 1);
1123 /* Free all temporaries used so far. This is normally called at the
1124 end of generating code for a statement. */
1126 void
1127 free_temp_slots (void)
1129 struct temp_slot *p, *next;
1131 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1133 next = p->next;
1135 if (!p->keep)
1136 make_slot_available (p);
1139 combine_temp_slots ();
1142 /* Push deeper into the nesting level for stack temporaries. */
1144 void
1145 push_temp_slots (void)
1147 temp_slot_level++;
1150 /* Pop a temporary nesting level. All slots in use in the current level
1151 are freed. */
1153 void
1154 pop_temp_slots (void)
1156 struct temp_slot *p, *next;
1158 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1160 next = p->next;
1161 make_slot_available (p);
1164 combine_temp_slots ();
1166 temp_slot_level--;
1169 /* Initialize temporary slots. */
1171 void
1172 init_temp_slots (void)
1174 /* We have not allocated any temporaries yet. */
1175 avail_temp_slots = 0;
1176 used_temp_slots = 0;
1177 temp_slot_level = 0;
/* These routines are responsible for converting virtual register references
   to the actual hard register references once RTL generation is complete.

   The following five variables are used for communication between the
   routines.  They contain the offsets of the virtual registers from their
   respective hard registers.  */

/* Offset applied when virtual_incoming_args_rtx becomes arg_pointer_rtx.  */
static int in_arg_offset;
/* Offset applied when virtual_stack_vars_rtx becomes frame_pointer_rtx.  */
static int var_offset;
/* Offset applied when virtual_stack_dynamic_rtx becomes stack_pointer_rtx.  */
static int dynamic_offset;
/* Offset applied when virtual_outgoing_args_rtx becomes stack_pointer_rtx.  */
static int out_arg_offset;
/* Offset applied when virtual_cfa_rtx becomes frame_pointer_rtx (if
   FRAME_POINTER_CFA_OFFSET is defined) or arg_pointer_rtx (otherwise).  */
static int cfa_offset;
/* In most machines, the stack pointer register is equivalent to the bottom
   of the stack.  */

#ifndef STACK_POINTER_OFFSET
#define STACK_POINTER_OFFSET 0
#endif

/* If not defined, pick an appropriate default for the offset of dynamically
   allocated memory depending on the value of ACCUMULATE_OUTGOING_ARGS,
   REG_PARM_STACK_SPACE, and OUTGOING_REG_PARM_STACK_SPACE.  */

#ifndef STACK_DYNAMIC_OFFSET

/* The bottom of the stack points to the actual arguments.  If
   REG_PARM_STACK_SPACE is defined, this includes the space for the register
   parameters.  However, if OUTGOING_REG_PARM_STACK_SPACE is not defined,
   stack space for register parameters is not pushed by the caller, but
   rather part of the fixed stack areas and hence not included in
   `current_function_outgoing_args_size'.  Nevertheless, we must allow
   for it when allocating stack dynamic objects.  */

/* Note: the last line of each definition must NOT end in a backslash,
   otherwise whatever line follows is spliced into the macro body.  */
#if defined(REG_PARM_STACK_SPACE) && ! defined(OUTGOING_REG_PARM_STACK_SPACE)
#define STACK_DYNAMIC_OFFSET(FNDECL) \
((ACCUMULATE_OUTGOING_ARGS \
  ? (current_function_outgoing_args_size + REG_PARM_STACK_SPACE (FNDECL)) : 0)\
 + (STACK_POINTER_OFFSET))
#else
#define STACK_DYNAMIC_OFFSET(FNDECL) \
((ACCUMULATE_OUTGOING_ARGS ? current_function_outgoing_args_size : 0) \
 + (STACK_POINTER_OFFSET))
#endif
#endif
1228 /* Given a piece of RTX and a pointer to a HOST_WIDE_INT, if the RTX
1229 is a virtual register, return the equivalent hard register and set the
1230 offset indirectly through the pointer. Otherwise, return 0. */
1232 static rtx
1233 instantiate_new_reg (rtx x, HOST_WIDE_INT *poffset)
1235 rtx new;
1236 HOST_WIDE_INT offset;
1238 if (x == virtual_incoming_args_rtx)
1239 new = arg_pointer_rtx, offset = in_arg_offset;
1240 else if (x == virtual_stack_vars_rtx)
1241 new = frame_pointer_rtx, offset = var_offset;
1242 else if (x == virtual_stack_dynamic_rtx)
1243 new = stack_pointer_rtx, offset = dynamic_offset;
1244 else if (x == virtual_outgoing_args_rtx)
1245 new = stack_pointer_rtx, offset = out_arg_offset;
1246 else if (x == virtual_cfa_rtx)
1248 #ifdef FRAME_POINTER_CFA_OFFSET
1249 new = frame_pointer_rtx;
1250 #else
1251 new = arg_pointer_rtx;
1252 #endif
1253 offset = cfa_offset;
1255 else
1256 return NULL_RTX;
1258 *poffset = offset;
1259 return new;
1262 /* A subroutine of instantiate_virtual_regs, called via for_each_rtx.
1263 Instantiate any virtual registers present inside of *LOC. The expression
1264 is simplified, as much as possible, but is not to be considered "valid"
1265 in any sense implied by the target. If any change is made, set CHANGED
1266 to true. */
1268 static int
1269 instantiate_virtual_regs_in_rtx (rtx *loc, void *data)
1271 HOST_WIDE_INT offset;
1272 bool *changed = (bool *) data;
1273 rtx x, new;
1275 x = *loc;
1276 if (x == 0)
1277 return 0;
1279 switch (GET_CODE (x))
1281 case REG:
1282 new = instantiate_new_reg (x, &offset);
1283 if (new)
1285 *loc = plus_constant (new, offset);
1286 if (changed)
1287 *changed = true;
1289 return -1;
1291 case PLUS:
1292 new = instantiate_new_reg (XEXP (x, 0), &offset);
1293 if (new)
1295 new = plus_constant (new, offset);
1296 *loc = simplify_gen_binary (PLUS, GET_MODE (x), new, XEXP (x, 1));
1297 if (changed)
1298 *changed = true;
1299 return -1;
1302 /* FIXME -- from old code */
1303 /* If we have (plus (subreg (virtual-reg)) (const_int)), we know
1304 we can commute the PLUS and SUBREG because pointers into the
1305 frame are well-behaved. */
1306 break;
1308 default:
1309 break;
1312 return 0;
1315 /* A subroutine of instantiate_virtual_regs_in_insn. Return true if X
1316 matches the predicate for insn CODE operand OPERAND. */
1318 static int
1319 safe_insn_predicate (int code, int operand, rtx x)
1321 const struct insn_operand_data *op_data;
1323 if (code < 0)
1324 return true;
1326 op_data = &insn_data[code].operand[operand];
1327 if (op_data->predicate == NULL)
1328 return true;
1330 return op_data->predicate (x, op_data->mode);
1333 /* A subroutine of instantiate_virtual_regs. Instantiate any virtual
1334 registers present inside of insn. The result will be a valid insn. */
1336 static void
1337 instantiate_virtual_regs_in_insn (rtx insn)
1339 HOST_WIDE_INT offset;
1340 int insn_code, i;
1341 bool any_change = false;
1342 rtx set, new, x, seq;
1344 /* There are some special cases to be handled first. */
1345 set = single_set (insn);
1346 if (set)
1348 /* We're allowed to assign to a virtual register. This is interpreted
1349 to mean that the underlying register gets assigned the inverse
1350 transformation. This is used, for example, in the handling of
1351 non-local gotos. */
1352 new = instantiate_new_reg (SET_DEST (set), &offset);
1353 if (new)
1355 start_sequence ();
1357 for_each_rtx (&SET_SRC (set), instantiate_virtual_regs_in_rtx, NULL);
1358 x = simplify_gen_binary (PLUS, GET_MODE (new), SET_SRC (set),
1359 GEN_INT (-offset));
1360 x = force_operand (x, new);
1361 if (x != new)
1362 emit_move_insn (new, x);
1364 seq = get_insns ();
1365 end_sequence ();
1367 emit_insn_before (seq, insn);
1368 delete_insn (insn);
1369 return;
1372 /* Handle a straight copy from a virtual register by generating a
1373 new add insn. The difference between this and falling through
1374 to the generic case is avoiding a new pseudo and eliminating a
1375 move insn in the initial rtl stream. */
1376 new = instantiate_new_reg (SET_SRC (set), &offset);
1377 if (new && offset != 0
1378 && REG_P (SET_DEST (set))
1379 && REGNO (SET_DEST (set)) > LAST_VIRTUAL_REGISTER)
1381 start_sequence ();
1383 x = expand_simple_binop (GET_MODE (SET_DEST (set)), PLUS,
1384 new, GEN_INT (offset), SET_DEST (set),
1385 1, OPTAB_LIB_WIDEN);
1386 if (x != SET_DEST (set))
1387 emit_move_insn (SET_DEST (set), x);
1389 seq = get_insns ();
1390 end_sequence ();
1392 emit_insn_before (seq, insn);
1393 delete_insn (insn);
1394 return;
1397 extract_insn (insn);
1398 insn_code = INSN_CODE (insn);
1400 /* Handle a plus involving a virtual register by determining if the
1401 operands remain valid if they're modified in place. */
1402 if (GET_CODE (SET_SRC (set)) == PLUS
1403 && recog_data.n_operands >= 3
1404 && recog_data.operand_loc[1] == &XEXP (SET_SRC (set), 0)
1405 && recog_data.operand_loc[2] == &XEXP (SET_SRC (set), 1)
1406 && GET_CODE (recog_data.operand[2]) == CONST_INT
1407 && (new = instantiate_new_reg (recog_data.operand[1], &offset)))
1409 offset += INTVAL (recog_data.operand[2]);
1411 /* If the sum is zero, then replace with a plain move. */
1412 if (offset == 0
1413 && REG_P (SET_DEST (set))
1414 && REGNO (SET_DEST (set)) > LAST_VIRTUAL_REGISTER)
1416 start_sequence ();
1417 emit_move_insn (SET_DEST (set), new);
1418 seq = get_insns ();
1419 end_sequence ();
1421 emit_insn_before (seq, insn);
1422 delete_insn (insn);
1423 return;
1426 x = gen_int_mode (offset, recog_data.operand_mode[2]);
1428 /* Using validate_change and apply_change_group here leaves
1429 recog_data in an invalid state. Since we know exactly what
1430 we want to check, do those two by hand. */
1431 if (safe_insn_predicate (insn_code, 1, new)
1432 && safe_insn_predicate (insn_code, 2, x))
1434 *recog_data.operand_loc[1] = recog_data.operand[1] = new;
1435 *recog_data.operand_loc[2] = recog_data.operand[2] = x;
1436 any_change = true;
1438 /* Fall through into the regular operand fixup loop in
1439 order to take care of operands other than 1 and 2. */
1443 else
1445 extract_insn (insn);
1446 insn_code = INSN_CODE (insn);
1449 /* In the general case, we expect virtual registers to appear only in
1450 operands, and then only as either bare registers or inside memories. */
1451 for (i = 0; i < recog_data.n_operands; ++i)
1453 x = recog_data.operand[i];
1454 switch (GET_CODE (x))
1456 case MEM:
1458 rtx addr = XEXP (x, 0);
1459 bool changed = false;
1461 for_each_rtx (&addr, instantiate_virtual_regs_in_rtx, &changed);
1462 if (!changed)
1463 continue;
1465 start_sequence ();
1466 x = replace_equiv_address (x, addr);
1467 seq = get_insns ();
1468 end_sequence ();
1469 if (seq)
1470 emit_insn_before (seq, insn);
1472 break;
1474 case REG:
1475 new = instantiate_new_reg (x, &offset);
1476 if (new == NULL)
1477 continue;
1478 if (offset == 0)
1479 x = new;
1480 else
1482 start_sequence ();
1484 /* Careful, special mode predicates may have stuff in
1485 insn_data[insn_code].operand[i].mode that isn't useful
1486 to us for computing a new value. */
1487 /* ??? Recognize address_operand and/or "p" constraints
1488 to see if (plus new offset) is a valid before we put
1489 this through expand_simple_binop. */
1490 x = expand_simple_binop (GET_MODE (x), PLUS, new,
1491 GEN_INT (offset), NULL_RTX,
1492 1, OPTAB_LIB_WIDEN);
1493 seq = get_insns ();
1494 end_sequence ();
1495 emit_insn_before (seq, insn);
1497 break;
1499 case SUBREG:
1500 new = instantiate_new_reg (SUBREG_REG (x), &offset);
1501 if (new == NULL)
1502 continue;
1503 if (offset != 0)
1505 start_sequence ();
1506 new = expand_simple_binop (GET_MODE (new), PLUS, new,
1507 GEN_INT (offset), NULL_RTX,
1508 1, OPTAB_LIB_WIDEN);
1509 seq = get_insns ();
1510 end_sequence ();
1511 emit_insn_before (seq, insn);
1513 x = simplify_gen_subreg (recog_data.operand_mode[i], new,
1514 GET_MODE (new), SUBREG_BYTE (x));
1515 break;
1517 default:
1518 continue;
1521 /* At this point, X contains the new value for the operand.
1522 Validate the new value vs the insn predicate. Note that
1523 asm insns will have insn_code -1 here. */
1524 if (!safe_insn_predicate (insn_code, i, x))
1526 start_sequence ();
1527 x = force_reg (insn_data[insn_code].operand[i].mode, x);
1528 seq = get_insns ();
1529 end_sequence ();
1530 if (seq)
1531 emit_insn_before (seq, insn);
1534 *recog_data.operand_loc[i] = recog_data.operand[i] = x;
1535 any_change = true;
1538 if (any_change)
1540 /* Propagate operand changes into the duplicates. */
1541 for (i = 0; i < recog_data.n_dups; ++i)
1542 *recog_data.dup_loc[i]
1543 = copy_rtx (recog_data.operand[(unsigned)recog_data.dup_num[i]]);
1545 /* Force re-recognition of the instruction for validation. */
1546 INSN_CODE (insn) = -1;
1549 if (asm_noperands (PATTERN (insn)) >= 0)
1551 if (!check_asm_operands (PATTERN (insn)))
1553 error_for_asm (insn, "impossible constraint in %<asm%>");
1554 delete_insn (insn);
1557 else
1559 if (recog_memoized (insn) < 0)
1560 fatal_insn_not_found (insn);
1564 /* Subroutine of instantiate_decls. Given RTL representing a decl,
1565 do any instantiation required. */
1567 static void
1568 instantiate_decl (rtx x)
1570 rtx addr;
1572 if (x == 0)
1573 return;
1575 /* If this is a CONCAT, recurse for the pieces. */
1576 if (GET_CODE (x) == CONCAT)
1578 instantiate_decl (XEXP (x, 0));
1579 instantiate_decl (XEXP (x, 1));
1580 return;
1583 /* If this is not a MEM, no need to do anything. Similarly if the
1584 address is a constant or a register that is not a virtual register. */
1585 if (!MEM_P (x))
1586 return;
1588 addr = XEXP (x, 0);
1589 if (CONSTANT_P (addr)
1590 || (REG_P (addr)
1591 && (REGNO (addr) < FIRST_VIRTUAL_REGISTER
1592 || REGNO (addr) > LAST_VIRTUAL_REGISTER)))
1593 return;
1595 for_each_rtx (&XEXP (x, 0), instantiate_virtual_regs_in_rtx, NULL);
1598 /* Helper for instantiate_decls called via walk_tree: Process all decls
1599 in the given DECL_VALUE_EXPR. */
1601 static tree
1602 instantiate_expr (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
1604 tree t = *tp;
1605 if (! EXPR_P (t) && ! GIMPLE_STMT_P (t))
1607 *walk_subtrees = 0;
1608 if (DECL_P (t) && DECL_RTL_SET_P (t))
1609 instantiate_decl (DECL_RTL (t));
1611 return NULL;
1614 /* Subroutine of instantiate_decls: Process all decls in the given
1615 BLOCK node and all its subblocks. */
1617 static void
1618 instantiate_decls_1 (tree let)
1620 tree t;
1622 for (t = BLOCK_VARS (let); t; t = TREE_CHAIN (t))
1624 if (DECL_RTL_SET_P (t))
1625 instantiate_decl (DECL_RTL (t));
1626 if (TREE_CODE (t) == VAR_DECL && DECL_HAS_VALUE_EXPR_P (t))
1628 tree v = DECL_VALUE_EXPR (t);
1629 walk_tree (&v, instantiate_expr, NULL, NULL);
1633 /* Process all subblocks. */
1634 for (t = BLOCK_SUBBLOCKS (let); t; t = TREE_CHAIN (t))
1635 instantiate_decls_1 (t);
1638 /* Scan all decls in FNDECL (both variables and parameters) and instantiate
1639 all virtual registers in their DECL_RTL's. */
1641 static void
1642 instantiate_decls (tree fndecl)
1644 tree decl;
1646 /* Process all parameters of the function. */
1647 for (decl = DECL_ARGUMENTS (fndecl); decl; decl = TREE_CHAIN (decl))
1649 instantiate_decl (DECL_RTL (decl));
1650 instantiate_decl (DECL_INCOMING_RTL (decl));
1651 if (DECL_HAS_VALUE_EXPR_P (decl))
1653 tree v = DECL_VALUE_EXPR (decl);
1654 walk_tree (&v, instantiate_expr, NULL, NULL);
1658 /* Now process all variables defined in the function or its subblocks. */
1659 instantiate_decls_1 (DECL_INITIAL (fndecl));
1662 /* Pass through the INSNS of function FNDECL and convert virtual register
1663 references to hard register references. */
1665 static unsigned int
1666 instantiate_virtual_regs (void)
1668 rtx insn;
1670 /* Compute the offsets to use for this function. */
1671 in_arg_offset = FIRST_PARM_OFFSET (current_function_decl);
1672 var_offset = STARTING_FRAME_OFFSET;
1673 dynamic_offset = STACK_DYNAMIC_OFFSET (current_function_decl);
1674 out_arg_offset = STACK_POINTER_OFFSET;
1675 #ifdef FRAME_POINTER_CFA_OFFSET
1676 cfa_offset = FRAME_POINTER_CFA_OFFSET (current_function_decl);
1677 #else
1678 cfa_offset = ARG_POINTER_CFA_OFFSET (current_function_decl);
1679 #endif
1681 /* Initialize recognition, indicating that volatile is OK. */
1682 init_recog ();
1684 /* Scan through all the insns, instantiating every virtual register still
1685 present. */
1686 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
1687 if (INSN_P (insn))
1689 /* These patterns in the instruction stream can never be recognized.
1690 Fortunately, they shouldn't contain virtual registers either. */
1691 if (GET_CODE (PATTERN (insn)) == USE
1692 || GET_CODE (PATTERN (insn)) == CLOBBER
1693 || GET_CODE (PATTERN (insn)) == ADDR_VEC
1694 || GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC
1695 || GET_CODE (PATTERN (insn)) == ASM_INPUT)
1696 continue;
1698 instantiate_virtual_regs_in_insn (insn);
1700 if (INSN_DELETED_P (insn))
1701 continue;
1703 for_each_rtx (&REG_NOTES (insn), instantiate_virtual_regs_in_rtx, NULL);
1705 /* Instantiate any virtual registers in CALL_INSN_FUNCTION_USAGE. */
1706 if (GET_CODE (insn) == CALL_INSN)
1707 for_each_rtx (&CALL_INSN_FUNCTION_USAGE (insn),
1708 instantiate_virtual_regs_in_rtx, NULL);
1711 /* Instantiate the virtual registers in the DECLs for debugging purposes. */
1712 instantiate_decls (current_function_decl);
1714 /* Indicate that, from now on, assign_stack_local should use
1715 frame_pointer_rtx. */
1716 virtuals_instantiated = 1;
1717 return 0;
1720 struct tree_opt_pass pass_instantiate_virtual_regs =
1722 "vregs", /* name */
1723 NULL, /* gate */
1724 instantiate_virtual_regs, /* execute */
1725 NULL, /* sub */
1726 NULL, /* next */
1727 0, /* static_pass_number */
1728 0, /* tv_id */
1729 0, /* properties_required */
1730 0, /* properties_provided */
1731 0, /* properties_destroyed */
1732 0, /* todo_flags_start */
1733 TODO_dump_func, /* todo_flags_finish */
1734 0 /* letter */
1738 /* Return 1 if EXP is an aggregate type (or a value with aggregate type).
1739 This means a type for which function calls must pass an address to the
1740 function or get an address back from the function.
1741 EXP may be a type node or an expression (whose type is tested). */
1744 aggregate_value_p (tree exp, tree fntype)
1746 int i, regno, nregs;
1747 rtx reg;
1749 tree type = (TYPE_P (exp)) ? exp : TREE_TYPE (exp);
1751 /* DECL node associated with FNTYPE when relevant, which we might need to
1752 check for by-invisible-reference returns, typically for CALL_EXPR input
1753 EXPressions. */
1754 tree fndecl = NULL_TREE;
1756 if (fntype)
1757 switch (TREE_CODE (fntype))
1759 case CALL_EXPR:
1760 fndecl = get_callee_fndecl (fntype);
1761 fntype = fndecl ? TREE_TYPE (fndecl) : 0;
1762 break;
1763 case FUNCTION_DECL:
1764 fndecl = fntype;
1765 fntype = TREE_TYPE (fndecl);
1766 break;
1767 case FUNCTION_TYPE:
1768 case METHOD_TYPE:
1769 break;
1770 case IDENTIFIER_NODE:
1771 fntype = 0;
1772 break;
1773 default:
1774 /* We don't expect other rtl types here. */
1775 gcc_unreachable ();
1778 if (TREE_CODE (type) == VOID_TYPE)
1779 return 0;
1781 /* If the front end has decided that this needs to be passed by
1782 reference, do so. */
1783 if ((TREE_CODE (exp) == PARM_DECL || TREE_CODE (exp) == RESULT_DECL)
1784 && DECL_BY_REFERENCE (exp))
1785 return 1;
1787 /* If the EXPression is a CALL_EXPR, honor DECL_BY_REFERENCE set on the
1788 called function RESULT_DECL, meaning the function returns in memory by
1789 invisible reference. This check lets front-ends not set TREE_ADDRESSABLE
1790 on the function type, which used to be the way to request such a return
1791 mechanism but might now be causing troubles at gimplification time if
1792 temporaries with the function type need to be created. */
1793 if (TREE_CODE (exp) == CALL_EXPR && fndecl && DECL_RESULT (fndecl)
1794 && DECL_BY_REFERENCE (DECL_RESULT (fndecl)))
1795 return 1;
1797 if (targetm.calls.return_in_memory (type, fntype))
1798 return 1;
1799 /* Types that are TREE_ADDRESSABLE must be constructed in memory,
1800 and thus can't be returned in registers. */
1801 if (TREE_ADDRESSABLE (type))
1802 return 1;
1803 if (flag_pcc_struct_return && AGGREGATE_TYPE_P (type))
1804 return 1;
1805 /* Make sure we have suitable call-clobbered regs to return
1806 the value in; if not, we must return it in memory. */
1807 reg = hard_function_value (type, 0, fntype, 0);
1809 /* If we have something other than a REG (e.g. a PARALLEL), then assume
1810 it is OK. */
1811 if (!REG_P (reg))
1812 return 0;
1814 regno = REGNO (reg);
1815 nregs = hard_regno_nregs[regno][TYPE_MODE (type)];
1816 for (i = 0; i < nregs; i++)
1817 if (! call_used_regs[regno + i])
1818 return 1;
1819 return 0;
1822 /* Return true if we should assign DECL a pseudo register; false if it
1823 should live on the local stack. */
1825 bool
1826 use_register_for_decl (tree decl)
1828 /* Honor volatile. */
1829 if (TREE_SIDE_EFFECTS (decl))
1830 return false;
1832 /* Honor addressability. */
1833 if (TREE_ADDRESSABLE (decl))
1834 return false;
1836 /* Only register-like things go in registers. */
1837 if (DECL_MODE (decl) == BLKmode)
1838 return false;
1840 /* If -ffloat-store specified, don't put explicit float variables
1841 into registers. */
1842 /* ??? This should be checked after DECL_ARTIFICIAL, but tree-ssa
1843 propagates values across these stores, and it probably shouldn't. */
1844 if (flag_float_store && FLOAT_TYPE_P (TREE_TYPE (decl)))
1845 return false;
1847 /* If we're not interested in tracking debugging information for
1848 this decl, then we can certainly put it in a register. */
1849 if (DECL_IGNORED_P (decl))
1850 return true;
1852 return (optimize || DECL_REGISTER (decl));
1855 /* Return true if TYPE should be passed by invisible reference. */
1857 bool
1858 pass_by_reference (CUMULATIVE_ARGS *ca, enum machine_mode mode,
1859 tree type, bool named_arg)
1861 if (type)
1863 /* If this type contains non-trivial constructors, then it is
1864 forbidden for the middle-end to create any new copies. */
1865 if (TREE_ADDRESSABLE (type))
1866 return true;
1868 /* GCC post 3.4 passes *all* variable sized types by reference. */
1869 if (!TYPE_SIZE (type) || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
1870 return true;
1873 return targetm.calls.pass_by_reference (ca, mode, type, named_arg);
1876 /* Return true if TYPE, which is passed by reference, should be callee
1877 copied instead of caller copied. */
1879 bool
1880 reference_callee_copied (CUMULATIVE_ARGS *ca, enum machine_mode mode,
1881 tree type, bool named_arg)
1883 if (type && TREE_ADDRESSABLE (type))
1884 return false;
1885 return targetm.calls.callee_copies (ca, mode, type, named_arg);
1888 /* Structures to communicate between the subroutines of assign_parms.
1889 The first holds data persistent across all parameters, the second
1890 is cleared out for each parameter. */
1892 struct assign_parm_data_all
1894 CUMULATIVE_ARGS args_so_far;
1895 struct args_size stack_args_size;
1896 tree function_result_decl;
1897 tree orig_fnargs;
1898 rtx conversion_insns;
1899 HOST_WIDE_INT pretend_args_size;
1900 HOST_WIDE_INT extra_pretend_bytes;
1901 int reg_parm_stack_space;
1904 struct assign_parm_data_one
1906 tree nominal_type;
1907 tree passed_type;
1908 rtx entry_parm;
1909 rtx stack_parm;
1910 enum machine_mode nominal_mode;
1911 enum machine_mode passed_mode;
1912 enum machine_mode promoted_mode;
1913 struct locate_and_pad_arg_data locate;
1914 int partial;
1915 BOOL_BITFIELD named_arg : 1;
1916 BOOL_BITFIELD passed_pointer : 1;
1917 BOOL_BITFIELD on_stack : 1;
1918 BOOL_BITFIELD loaded_in_reg : 1;
1921 /* A subroutine of assign_parms. Initialize ALL. */
1923 static void
1924 assign_parms_initialize_all (struct assign_parm_data_all *all)
1926 tree fntype;
1928 memset (all, 0, sizeof (*all));
1930 fntype = TREE_TYPE (current_function_decl);
1932 #ifdef INIT_CUMULATIVE_INCOMING_ARGS
1933 INIT_CUMULATIVE_INCOMING_ARGS (all->args_so_far, fntype, NULL_RTX);
1934 #else
1935 INIT_CUMULATIVE_ARGS (all->args_so_far, fntype, NULL_RTX,
1936 current_function_decl, -1);
1937 #endif
1939 #ifdef REG_PARM_STACK_SPACE
1940 all->reg_parm_stack_space = REG_PARM_STACK_SPACE (current_function_decl);
1941 #endif
1944 /* If ARGS contains entries with complex types, split the entry into two
1945 entries of the component type. Return a new list of substitutions are
1946 needed, else the old list. */
1948 static tree
1949 split_complex_args (tree args)
1951 tree p;
1953 /* Before allocating memory, check for the common case of no complex. */
1954 for (p = args; p; p = TREE_CHAIN (p))
1956 tree type = TREE_TYPE (p);
1957 if (TREE_CODE (type) == COMPLEX_TYPE
1958 && targetm.calls.split_complex_arg (type))
1959 goto found;
1961 return args;
1963 found:
1964 args = copy_list (args);
1966 for (p = args; p; p = TREE_CHAIN (p))
1968 tree type = TREE_TYPE (p);
1969 if (TREE_CODE (type) == COMPLEX_TYPE
1970 && targetm.calls.split_complex_arg (type))
1972 tree decl;
1973 tree subtype = TREE_TYPE (type);
1974 bool addressable = TREE_ADDRESSABLE (p);
1976 /* Rewrite the PARM_DECL's type with its component. */
1977 TREE_TYPE (p) = subtype;
1978 DECL_ARG_TYPE (p) = TREE_TYPE (DECL_ARG_TYPE (p));
1979 DECL_MODE (p) = VOIDmode;
1980 DECL_SIZE (p) = NULL;
1981 DECL_SIZE_UNIT (p) = NULL;
1982 /* If this arg must go in memory, put it in a pseudo here.
1983 We can't allow it to go in memory as per normal parms,
1984 because the usual place might not have the imag part
1985 adjacent to the real part. */
1986 DECL_ARTIFICIAL (p) = addressable;
1987 DECL_IGNORED_P (p) = addressable;
1988 TREE_ADDRESSABLE (p) = 0;
1989 layout_decl (p, 0);
1991 /* Build a second synthetic decl. */
1992 decl = build_decl (PARM_DECL, NULL_TREE, subtype);
1993 DECL_ARG_TYPE (decl) = DECL_ARG_TYPE (p);
1994 DECL_ARTIFICIAL (decl) = addressable;
1995 DECL_IGNORED_P (decl) = addressable;
1996 layout_decl (decl, 0);
1998 /* Splice it in; skip the new decl. */
1999 TREE_CHAIN (decl) = TREE_CHAIN (p);
2000 TREE_CHAIN (p) = decl;
2001 p = decl;
2005 return args;
2008 /* A subroutine of assign_parms. Adjust the parameter list to incorporate
2009 the hidden struct return argument, and (abi willing) complex args.
2010 Return the new parameter list. */
2012 static tree
2013 assign_parms_augmented_arg_list (struct assign_parm_data_all *all)
2015 tree fndecl = current_function_decl;
2016 tree fntype = TREE_TYPE (fndecl);
2017 tree fnargs = DECL_ARGUMENTS (fndecl);
2019 /* If struct value address is treated as the first argument, make it so. */
2020 if (aggregate_value_p (DECL_RESULT (fndecl), fndecl)
2021 && ! current_function_returns_pcc_struct
2022 && targetm.calls.struct_value_rtx (TREE_TYPE (fndecl), 1) == 0)
2024 tree type = build_pointer_type (TREE_TYPE (fntype));
2025 tree decl;
2027 decl = build_decl (PARM_DECL, NULL_TREE, type);
2028 DECL_ARG_TYPE (decl) = type;
2029 DECL_ARTIFICIAL (decl) = 1;
2030 DECL_IGNORED_P (decl) = 1;
2032 TREE_CHAIN (decl) = fnargs;
2033 fnargs = decl;
2034 all->function_result_decl = decl;
2037 all->orig_fnargs = fnargs;
2039 /* If the target wants to split complex arguments into scalars, do so. */
2040 if (targetm.calls.split_complex_arg)
2041 fnargs = split_complex_args (fnargs);
2043 return fnargs;
2046 /* A subroutine of assign_parms. Examine PARM and pull out type and mode
2047 data for the parameter. Incorporate ABI specifics such as pass-by-
2048 reference and type promotion. */
2050 static void
2051 assign_parm_find_data_types (struct assign_parm_data_all *all, tree parm,
2052 struct assign_parm_data_one *data)
2054 tree nominal_type, passed_type;
2055 enum machine_mode nominal_mode, passed_mode, promoted_mode;
2057 memset (data, 0, sizeof (*data));
2059 /* NAMED_ARG is a mis-nomer. We really mean 'non-varadic'. */
2060 if (!current_function_stdarg)
2061 data->named_arg = 1; /* No varadic parms. */
2062 else if (TREE_CHAIN (parm))
2063 data->named_arg = 1; /* Not the last non-varadic parm. */
2064 else if (targetm.calls.strict_argument_naming (&all->args_so_far))
2065 data->named_arg = 1; /* Only varadic ones are unnamed. */
2066 else
2067 data->named_arg = 0; /* Treat as varadic. */
2069 nominal_type = TREE_TYPE (parm);
2070 passed_type = DECL_ARG_TYPE (parm);
2072 /* Look out for errors propagating this far. Also, if the parameter's
2073 type is void then its value doesn't matter. */
2074 if (TREE_TYPE (parm) == error_mark_node
2075 /* This can happen after weird syntax errors
2076 or if an enum type is defined among the parms. */
2077 || TREE_CODE (parm) != PARM_DECL
2078 || passed_type == NULL
2079 || VOID_TYPE_P (nominal_type))
2081 nominal_type = passed_type = void_type_node;
2082 nominal_mode = passed_mode = promoted_mode = VOIDmode;
2083 goto egress;
2086 /* Find mode of arg as it is passed, and mode of arg as it should be
2087 during execution of this function. */
2088 passed_mode = TYPE_MODE (passed_type);
2089 nominal_mode = TYPE_MODE (nominal_type);
2091 /* If the parm is to be passed as a transparent union, use the type of
2092 the first field for the tests below. We have already verified that
2093 the modes are the same. */
2094 if (TREE_CODE (passed_type) == UNION_TYPE
2095 && TYPE_TRANSPARENT_UNION (passed_type))
2096 passed_type = TREE_TYPE (TYPE_FIELDS (passed_type));
2098 /* See if this arg was passed by invisible reference. */
2099 if (pass_by_reference (&all->args_so_far, passed_mode,
2100 passed_type, data->named_arg))
2102 passed_type = nominal_type = build_pointer_type (passed_type);
2103 data->passed_pointer = true;
2104 passed_mode = nominal_mode = Pmode;
2107 /* Find mode as it is passed by the ABI. */
2108 promoted_mode = passed_mode;
2109 if (targetm.calls.promote_function_args (TREE_TYPE (current_function_decl)))
2111 int unsignedp = TYPE_UNSIGNED (passed_type);
2112 promoted_mode = promote_mode (passed_type, promoted_mode,
2113 &unsignedp, 1);
2116 egress:
2117 data->nominal_type = nominal_type;
2118 data->passed_type = passed_type;
2119 data->nominal_mode = nominal_mode;
2120 data->passed_mode = passed_mode;
2121 data->promoted_mode = promoted_mode;
2124 /* A subroutine of assign_parms. Invoke setup_incoming_varargs. */
2126 static void
2127 assign_parms_setup_varargs (struct assign_parm_data_all *all,
2128 struct assign_parm_data_one *data, bool no_rtl)
2130 int varargs_pretend_bytes = 0;
2132 targetm.calls.setup_incoming_varargs (&all->args_so_far,
2133 data->promoted_mode,
2134 data->passed_type,
2135 &varargs_pretend_bytes, no_rtl);
2137 /* If the back-end has requested extra stack space, record how much is
2138 needed. Do not change pretend_args_size otherwise since it may be
2139 nonzero from an earlier partial argument. */
2140 if (varargs_pretend_bytes > 0)
2141 all->pretend_args_size = varargs_pretend_bytes;
2144 /* A subroutine of assign_parms. Set DATA->ENTRY_PARM corresponding to
2145 the incoming location of the current parameter. */
2147 static void
2148 assign_parm_find_entry_rtl (struct assign_parm_data_all *all,
2149 struct assign_parm_data_one *data)
2151 HOST_WIDE_INT pretend_bytes = 0;
2152 rtx entry_parm;
2153 bool in_regs;
2155 if (data->promoted_mode == VOIDmode)
2157 data->entry_parm = data->stack_parm = const0_rtx;
2158 return;
2161 #ifdef FUNCTION_INCOMING_ARG
2162 entry_parm = FUNCTION_INCOMING_ARG (all->args_so_far, data->promoted_mode,
2163 data->passed_type, data->named_arg);
2164 #else
2165 entry_parm = FUNCTION_ARG (all->args_so_far, data->promoted_mode,
2166 data->passed_type, data->named_arg);
2167 #endif
2169 if (entry_parm == 0)
2170 data->promoted_mode = data->passed_mode;
2172 /* Determine parm's home in the stack, in case it arrives in the stack
2173 or we should pretend it did. Compute the stack position and rtx where
2174 the argument arrives and its size.
2176 There is one complexity here: If this was a parameter that would
2177 have been passed in registers, but wasn't only because it is
2178 __builtin_va_alist, we want locate_and_pad_parm to treat it as if
2179 it came in a register so that REG_PARM_STACK_SPACE isn't skipped.
2180 In this case, we call FUNCTION_ARG with NAMED set to 1 instead of 0
2181 as it was the previous time. */
2182 in_regs = entry_parm != 0;
2183 #ifdef STACK_PARMS_IN_REG_PARM_AREA
2184 in_regs = true;
2185 #endif
2186 if (!in_regs && !data->named_arg)
2188 if (targetm.calls.pretend_outgoing_varargs_named (&all->args_so_far))
2190 rtx tem;
2191 #ifdef FUNCTION_INCOMING_ARG
2192 tem = FUNCTION_INCOMING_ARG (all->args_so_far, data->promoted_mode,
2193 data->passed_type, true);
2194 #else
2195 tem = FUNCTION_ARG (all->args_so_far, data->promoted_mode,
2196 data->passed_type, true);
2197 #endif
2198 in_regs = tem != NULL;
2202 /* If this parameter was passed both in registers and in the stack, use
2203 the copy on the stack. */
2204 if (targetm.calls.must_pass_in_stack (data->promoted_mode,
2205 data->passed_type))
2206 entry_parm = 0;
2208 if (entry_parm)
2210 int partial;
2212 partial = targetm.calls.arg_partial_bytes (&all->args_so_far,
2213 data->promoted_mode,
2214 data->passed_type,
2215 data->named_arg);
2216 data->partial = partial;
2218 /* The caller might already have allocated stack space for the
2219 register parameters. */
2220 if (partial != 0 && all->reg_parm_stack_space == 0)
2222 /* Part of this argument is passed in registers and part
2223 is passed on the stack. Ask the prologue code to extend
2224 the stack part so that we can recreate the full value.
2226 PRETEND_BYTES is the size of the registers we need to store.
2227 CURRENT_FUNCTION_PRETEND_ARGS_SIZE is the amount of extra
2228 stack space that the prologue should allocate.
2230 Internally, gcc assumes that the argument pointer is aligned
2231 to STACK_BOUNDARY bits. This is used both for alignment
2232 optimizations (see init_emit) and to locate arguments that are
2233 aligned to more than PARM_BOUNDARY bits. We must preserve this
2234 invariant by rounding CURRENT_FUNCTION_PRETEND_ARGS_SIZE up to
2235 a stack boundary. */
2237 /* We assume at most one partial arg, and it must be the first
2238 argument on the stack. */
2239 gcc_assert (!all->extra_pretend_bytes && !all->pretend_args_size);
2241 pretend_bytes = partial;
2242 all->pretend_args_size = CEIL_ROUND (pretend_bytes, STACK_BYTES);
2244 /* We want to align relative to the actual stack pointer, so
2245 don't include this in the stack size until later. */
2246 all->extra_pretend_bytes = all->pretend_args_size;
2250 locate_and_pad_parm (data->promoted_mode, data->passed_type, in_regs,
2251 entry_parm ? data->partial : 0, current_function_decl,
2252 &all->stack_args_size, &data->locate);
2254 /* Adjust offsets to include the pretend args. */
2255 pretend_bytes = all->extra_pretend_bytes - pretend_bytes;
2256 data->locate.slot_offset.constant += pretend_bytes;
2257 data->locate.offset.constant += pretend_bytes;
2259 data->entry_parm = entry_parm;
2262 /* A subroutine of assign_parms. If there is actually space on the stack
2263 for this parm, count it in stack_args_size and return true. */
2265 static bool
2266 assign_parm_is_stack_parm (struct assign_parm_data_all *all,
2267 struct assign_parm_data_one *data)
2269 /* Trivially true if we've no incoming register. */
2270 if (data->entry_parm == NULL)
2272 /* Also true if we're partially in registers and partially not,
2273 since we've arranged to drop the entire argument on the stack. */
2274 else if (data->partial != 0)
2276 /* Also true if the target says that it's passed in both registers
2277 and on the stack. */
2278 else if (GET_CODE (data->entry_parm) == PARALLEL
2279 && XEXP (XVECEXP (data->entry_parm, 0, 0), 0) == NULL_RTX)
2281 /* Also true if the target says that there's stack allocated for
2282 all register parameters. */
2283 else if (all->reg_parm_stack_space > 0)
2285 /* Otherwise, no, this parameter has no ABI defined stack slot. */
2286 else
2287 return false;
2289 all->stack_args_size.constant += data->locate.size.constant;
2290 if (data->locate.size.var)
2291 ADD_PARM_SIZE (all->stack_args_size, data->locate.size.var);
2293 return true;
2296 /* A subroutine of assign_parms. Given that this parameter is allocated
2297 stack space by the ABI, find it. */
2299 static void
2300 assign_parm_find_stack_rtl (tree parm, struct assign_parm_data_one *data)
2302 rtx offset_rtx, stack_parm;
2303 unsigned int align, boundary;
2305 /* If we're passing this arg using a reg, make its stack home the
2306 aligned stack slot. */
2307 if (data->entry_parm)
2308 offset_rtx = ARGS_SIZE_RTX (data->locate.slot_offset);
2309 else
2310 offset_rtx = ARGS_SIZE_RTX (data->locate.offset);
2312 stack_parm = current_function_internal_arg_pointer;
2313 if (offset_rtx != const0_rtx)
2314 stack_parm = gen_rtx_PLUS (Pmode, stack_parm, offset_rtx);
2315 stack_parm = gen_rtx_MEM (data->promoted_mode, stack_parm);
2317 set_mem_attributes (stack_parm, parm, 1);
2319 boundary = data->locate.boundary;
2320 align = BITS_PER_UNIT;
2322 /* If we're padding upward, we know that the alignment of the slot
2323 is FUNCTION_ARG_BOUNDARY. If we're using slot_offset, we're
2324 intentionally forcing upward padding. Otherwise we have to come
2325 up with a guess at the alignment based on OFFSET_RTX. */
2326 if (data->locate.where_pad != downward || data->entry_parm)
2327 align = boundary;
2328 else if (GET_CODE (offset_rtx) == CONST_INT)
2330 align = INTVAL (offset_rtx) * BITS_PER_UNIT | boundary;
2331 align = align & -align;
2333 set_mem_align (stack_parm, align);
2335 if (data->entry_parm)
2336 set_reg_attrs_for_parm (data->entry_parm, stack_parm);
2338 data->stack_parm = stack_parm;
2341 /* A subroutine of assign_parms. Adjust DATA->ENTRY_RTL such that it's
2342 always valid and contiguous. */
2344 static void
2345 assign_parm_adjust_entry_rtl (struct assign_parm_data_one *data)
2347 rtx entry_parm = data->entry_parm;
2348 rtx stack_parm = data->stack_parm;
2350 /* If this parm was passed part in regs and part in memory, pretend it
2351 arrived entirely in memory by pushing the register-part onto the stack.
2352 In the special case of a DImode or DFmode that is split, we could put
2353 it together in a pseudoreg directly, but for now that's not worth
2354 bothering with. */
2355 if (data->partial != 0)
2357 /* Handle calls that pass values in multiple non-contiguous
2358 locations. The Irix 6 ABI has examples of this. */
2359 if (GET_CODE (entry_parm) == PARALLEL)
2360 emit_group_store (validize_mem (stack_parm), entry_parm,
2361 data->passed_type,
2362 int_size_in_bytes (data->passed_type));
2363 else
2365 gcc_assert (data->partial % UNITS_PER_WORD == 0);
2366 move_block_from_reg (REGNO (entry_parm), validize_mem (stack_parm),
2367 data->partial / UNITS_PER_WORD);
2370 entry_parm = stack_parm;
2373 /* If we didn't decide this parm came in a register, by default it came
2374 on the stack. */
2375 else if (entry_parm == NULL)
2376 entry_parm = stack_parm;
2378 /* When an argument is passed in multiple locations, we can't make use
2379 of this information, but we can save some copying if the whole argument
2380 is passed in a single register. */
2381 else if (GET_CODE (entry_parm) == PARALLEL
2382 && data->nominal_mode != BLKmode
2383 && data->passed_mode != BLKmode)
2385 size_t i, len = XVECLEN (entry_parm, 0);
2387 for (i = 0; i < len; i++)
2388 if (XEXP (XVECEXP (entry_parm, 0, i), 0) != NULL_RTX
2389 && REG_P (XEXP (XVECEXP (entry_parm, 0, i), 0))
2390 && (GET_MODE (XEXP (XVECEXP (entry_parm, 0, i), 0))
2391 == data->passed_mode)
2392 && INTVAL (XEXP (XVECEXP (entry_parm, 0, i), 1)) == 0)
2394 entry_parm = XEXP (XVECEXP (entry_parm, 0, i), 0);
2395 break;
2399 data->entry_parm = entry_parm;
2402 /* A subroutine of assign_parms. Adjust DATA->STACK_RTL such that it's
2403 always valid and properly aligned. */
2405 static void
2406 assign_parm_adjust_stack_rtl (struct assign_parm_data_one *data)
2408 rtx stack_parm = data->stack_parm;
2410 /* If we can't trust the parm stack slot to be aligned enough for its
2411 ultimate type, don't use that slot after entry. We'll make another
2412 stack slot, if we need one. */
2413 if (stack_parm
2414 && ((STRICT_ALIGNMENT
2415 && GET_MODE_ALIGNMENT (data->nominal_mode) > MEM_ALIGN (stack_parm))
2416 || (data->nominal_type
2417 && TYPE_ALIGN (data->nominal_type) > MEM_ALIGN (stack_parm)
2418 && MEM_ALIGN (stack_parm) < PREFERRED_STACK_BOUNDARY)))
2419 stack_parm = NULL;
2421 /* If parm was passed in memory, and we need to convert it on entry,
2422 don't store it back in that same slot. */
2423 else if (data->entry_parm == stack_parm
2424 && data->nominal_mode != BLKmode
2425 && data->nominal_mode != data->passed_mode)
2426 stack_parm = NULL;
2428 /* If stack protection is in effect for this function, don't leave any
2429 pointers in their passed stack slots. */
2430 else if (cfun->stack_protect_guard
2431 && (flag_stack_protect == 2
2432 || data->passed_pointer
2433 || POINTER_TYPE_P (data->nominal_type)))
2434 stack_parm = NULL;
2436 data->stack_parm = stack_parm;
2439 /* A subroutine of assign_parms. Return true if the current parameter
2440 should be stored as a BLKmode in the current frame. */
2442 static bool
2443 assign_parm_setup_block_p (struct assign_parm_data_one *data)
2445 if (data->nominal_mode == BLKmode)
2446 return true;
2447 if (GET_CODE (data->entry_parm) == PARALLEL)
2448 return true;
2450 #ifdef BLOCK_REG_PADDING
2451 /* Only assign_parm_setup_block knows how to deal with register arguments
2452 that are padded at the least significant end. */
2453 if (REG_P (data->entry_parm)
2454 && GET_MODE_SIZE (data->promoted_mode) < UNITS_PER_WORD
2455 && (BLOCK_REG_PADDING (data->passed_mode, data->passed_type, 1)
2456 == (BYTES_BIG_ENDIAN ? upward : downward)))
2457 return true;
2458 #endif
2460 return false;
2463 /* A subroutine of assign_parms. Arrange for the parameter to be
2464 present and valid in DATA->STACK_RTL. */
2466 static void
2467 assign_parm_setup_block (struct assign_parm_data_all *all,
2468 tree parm, struct assign_parm_data_one *data)
2470 rtx entry_parm = data->entry_parm;
2471 rtx stack_parm = data->stack_parm;
2472 HOST_WIDE_INT size;
2473 HOST_WIDE_INT size_stored;
2474 rtx orig_entry_parm = entry_parm;
2476 if (GET_CODE (entry_parm) == PARALLEL)
2477 entry_parm = emit_group_move_into_temps (entry_parm);
2479 /* If we've a non-block object that's nevertheless passed in parts,
2480 reconstitute it in register operations rather than on the stack. */
2481 if (GET_CODE (entry_parm) == PARALLEL
2482 && data->nominal_mode != BLKmode)
2484 rtx elt0 = XEXP (XVECEXP (orig_entry_parm, 0, 0), 0);
2486 if ((XVECLEN (entry_parm, 0) > 1
2487 || hard_regno_nregs[REGNO (elt0)][GET_MODE (elt0)] > 1)
2488 && use_register_for_decl (parm))
2490 rtx parmreg = gen_reg_rtx (data->nominal_mode);
2492 push_to_sequence (all->conversion_insns);
2494 /* For values returned in multiple registers, handle possible
2495 incompatible calls to emit_group_store.
2497 For example, the following would be invalid, and would have to
2498 be fixed by the conditional below:
2500 emit_group_store ((reg:SF), (parallel:DF))
2501 emit_group_store ((reg:SI), (parallel:DI))
2503 An example of this are doubles in e500 v2:
2504 (parallel:DF (expr_list (reg:SI) (const_int 0))
2505 (expr_list (reg:SI) (const_int 4))). */
2506 if (data->nominal_mode != data->passed_mode)
2508 rtx t = gen_reg_rtx (GET_MODE (entry_parm));
2509 emit_group_store (t, entry_parm, NULL_TREE,
2510 GET_MODE_SIZE (GET_MODE (entry_parm)));
2511 convert_move (parmreg, t, 0);
2513 else
2514 emit_group_store (parmreg, entry_parm, data->nominal_type,
2515 int_size_in_bytes (data->nominal_type));
2517 all->conversion_insns = get_insns ();
2518 end_sequence ();
2520 SET_DECL_RTL (parm, parmreg);
2521 return;
2525 size = int_size_in_bytes (data->passed_type);
2526 size_stored = CEIL_ROUND (size, UNITS_PER_WORD);
2527 if (stack_parm == 0)
2529 DECL_ALIGN (parm) = MAX (DECL_ALIGN (parm), BITS_PER_WORD);
2530 stack_parm = assign_stack_local (BLKmode, size_stored,
2531 DECL_ALIGN (parm));
2532 if (GET_MODE_SIZE (GET_MODE (entry_parm)) == size)
2533 PUT_MODE (stack_parm, GET_MODE (entry_parm));
2534 set_mem_attributes (stack_parm, parm, 1);
2537 /* If a BLKmode arrives in registers, copy it to a stack slot. Handle
2538 calls that pass values in multiple non-contiguous locations. */
2539 if (REG_P (entry_parm) || GET_CODE (entry_parm) == PARALLEL)
2541 rtx mem;
2543 /* Note that we will be storing an integral number of words.
2544 So we have to be careful to ensure that we allocate an
2545 integral number of words. We do this above when we call
2546 assign_stack_local if space was not allocated in the argument
2547 list. If it was, this will not work if PARM_BOUNDARY is not
2548 a multiple of BITS_PER_WORD. It isn't clear how to fix this
2549 if it becomes a problem. Exception is when BLKmode arrives
2550 with arguments not conforming to word_mode. */
2552 if (data->stack_parm == 0)
2554 else if (GET_CODE (entry_parm) == PARALLEL)
2556 else
2557 gcc_assert (!size || !(PARM_BOUNDARY % BITS_PER_WORD));
2559 mem = validize_mem (stack_parm);
2561 /* Handle values in multiple non-contiguous locations. */
2562 if (GET_CODE (entry_parm) == PARALLEL)
2564 push_to_sequence (all->conversion_insns);
2565 emit_group_store (mem, entry_parm, data->passed_type, size);
2566 all->conversion_insns = get_insns ();
2567 end_sequence ();
2570 else if (size == 0)
2573 /* If SIZE is that of a mode no bigger than a word, just use
2574 that mode's store operation. */
2575 else if (size <= UNITS_PER_WORD)
2577 enum machine_mode mode
2578 = mode_for_size (size * BITS_PER_UNIT, MODE_INT, 0);
2580 if (mode != BLKmode
2581 #ifdef BLOCK_REG_PADDING
2582 && (size == UNITS_PER_WORD
2583 || (BLOCK_REG_PADDING (mode, data->passed_type, 1)
2584 != (BYTES_BIG_ENDIAN ? upward : downward)))
2585 #endif
2588 rtx reg = gen_rtx_REG (mode, REGNO (entry_parm));
2589 emit_move_insn (change_address (mem, mode, 0), reg);
2592 /* Blocks smaller than a word on a BYTES_BIG_ENDIAN
2593 machine must be aligned to the left before storing
2594 to memory. Note that the previous test doesn't
2595 handle all cases (e.g. SIZE == 3). */
2596 else if (size != UNITS_PER_WORD
2597 #ifdef BLOCK_REG_PADDING
2598 && (BLOCK_REG_PADDING (mode, data->passed_type, 1)
2599 == downward)
2600 #else
2601 && BYTES_BIG_ENDIAN
2602 #endif
2605 rtx tem, x;
2606 int by = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
2607 rtx reg = gen_rtx_REG (word_mode, REGNO (entry_parm));
2609 x = expand_shift (LSHIFT_EXPR, word_mode, reg,
2610 build_int_cst (NULL_TREE, by),
2611 NULL_RTX, 1);
2612 tem = change_address (mem, word_mode, 0);
2613 emit_move_insn (tem, x);
2615 else
2616 move_block_from_reg (REGNO (entry_parm), mem,
2617 size_stored / UNITS_PER_WORD);
2619 else
2620 move_block_from_reg (REGNO (entry_parm), mem,
2621 size_stored / UNITS_PER_WORD);
2623 else if (data->stack_parm == 0)
2625 push_to_sequence (all->conversion_insns);
2626 emit_block_move (stack_parm, data->entry_parm, GEN_INT (size),
2627 BLOCK_OP_NORMAL);
2628 all->conversion_insns = get_insns ();
2629 end_sequence ();
2632 data->stack_parm = stack_parm;
2633 SET_DECL_RTL (parm, stack_parm);
2636 /* A subroutine of assign_parms. Allocate a pseudo to hold the current
2637 parameter. Get it there. Perform all ABI specified conversions. */
2639 static void
2640 assign_parm_setup_reg (struct assign_parm_data_all *all, tree parm,
2641 struct assign_parm_data_one *data)
2643 rtx parmreg;
2644 enum machine_mode promoted_nominal_mode;
2645 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (parm));
2646 bool did_conversion = false;
2648 /* Store the parm in a pseudoregister during the function, but we may
2649 need to do it in a wider mode. */
2651 /* This is not really promoting for a call. However we need to be
2652 consistent with assign_parm_find_data_types and expand_expr_real_1. */
2653 promoted_nominal_mode
2654 = promote_mode (data->nominal_type, data->nominal_mode, &unsignedp, 1);
2656 parmreg = gen_reg_rtx (promoted_nominal_mode);
2658 if (!DECL_ARTIFICIAL (parm))
2659 mark_user_reg (parmreg);
2661 /* If this was an item that we received a pointer to,
2662 set DECL_RTL appropriately. */
2663 if (data->passed_pointer)
2665 rtx x = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (data->passed_type)), parmreg);
2666 set_mem_attributes (x, parm, 1);
2667 SET_DECL_RTL (parm, x);
2669 else
2670 SET_DECL_RTL (parm, parmreg);
2672 /* Copy the value into the register. */
2673 if (data->nominal_mode != data->passed_mode
2674 || promoted_nominal_mode != data->promoted_mode)
2676 int save_tree_used;
2678 /* ENTRY_PARM has been converted to PROMOTED_MODE, its
2679 mode, by the caller. We now have to convert it to
2680 NOMINAL_MODE, if different. However, PARMREG may be in
2681 a different mode than NOMINAL_MODE if it is being stored
2682 promoted.
2684 If ENTRY_PARM is a hard register, it might be in a register
2685 not valid for operating in its mode (e.g., an odd-numbered
2686 register for a DFmode). In that case, moves are the only
2687 thing valid, so we can't do a convert from there. This
2688 occurs when the calling sequence allow such misaligned
2689 usages.
2691 In addition, the conversion may involve a call, which could
2692 clobber parameters which haven't been copied to pseudo
2693 registers yet. Therefore, we must first copy the parm to
2694 a pseudo reg here, and save the conversion until after all
2695 parameters have been moved. */
2697 rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm));
2699 emit_move_insn (tempreg, validize_mem (data->entry_parm));
2701 push_to_sequence (all->conversion_insns);
2702 tempreg = convert_to_mode (data->nominal_mode, tempreg, unsignedp);
2704 if (GET_CODE (tempreg) == SUBREG
2705 && GET_MODE (tempreg) == data->nominal_mode
2706 && REG_P (SUBREG_REG (tempreg))
2707 && data->nominal_mode == data->passed_mode
2708 && GET_MODE (SUBREG_REG (tempreg)) == GET_MODE (data->entry_parm)
2709 && GET_MODE_SIZE (GET_MODE (tempreg))
2710 < GET_MODE_SIZE (GET_MODE (data->entry_parm)))
2712 /* The argument is already sign/zero extended, so note it
2713 into the subreg. */
2714 SUBREG_PROMOTED_VAR_P (tempreg) = 1;
2715 SUBREG_PROMOTED_UNSIGNED_SET (tempreg, unsignedp);
2718 /* TREE_USED gets set erroneously during expand_assignment. */
2719 save_tree_used = TREE_USED (parm);
2720 expand_assignment (parm, make_tree (data->nominal_type, tempreg));
2721 TREE_USED (parm) = save_tree_used;
2722 all->conversion_insns = get_insns ();
2723 end_sequence ();
2725 did_conversion = true;
2727 else
2728 emit_move_insn (parmreg, validize_mem (data->entry_parm));
2730 /* If we were passed a pointer but the actual value can safely live
2731 in a register, put it in one. */
2732 if (data->passed_pointer
2733 && TYPE_MODE (TREE_TYPE (parm)) != BLKmode
2734 /* If by-reference argument was promoted, demote it. */
2735 && (TYPE_MODE (TREE_TYPE (parm)) != GET_MODE (DECL_RTL (parm))
2736 || use_register_for_decl (parm)))
2738 /* We can't use nominal_mode, because it will have been set to
2739 Pmode above. We must use the actual mode of the parm. */
2740 parmreg = gen_reg_rtx (TYPE_MODE (TREE_TYPE (parm)));
2741 mark_user_reg (parmreg);
2743 if (GET_MODE (parmreg) != GET_MODE (DECL_RTL (parm)))
2745 rtx tempreg = gen_reg_rtx (GET_MODE (DECL_RTL (parm)));
2746 int unsigned_p = TYPE_UNSIGNED (TREE_TYPE (parm));
2748 push_to_sequence (all->conversion_insns);
2749 emit_move_insn (tempreg, DECL_RTL (parm));
2750 tempreg = convert_to_mode (GET_MODE (parmreg), tempreg, unsigned_p);
2751 emit_move_insn (parmreg, tempreg);
2752 all->conversion_insns = get_insns ();
2753 end_sequence ();
2755 did_conversion = true;
2757 else
2758 emit_move_insn (parmreg, DECL_RTL (parm));
2760 SET_DECL_RTL (parm, parmreg);
2762 /* STACK_PARM is the pointer, not the parm, and PARMREG is
2763 now the parm. */
2764 data->stack_parm = NULL;
2767 /* Mark the register as eliminable if we did no conversion and it was
2768 copied from memory at a fixed offset, and the arg pointer was not
2769 copied to a pseudo-reg. If the arg pointer is a pseudo reg or the
2770 offset formed an invalid address, such memory-equivalences as we
2771 make here would screw up life analysis for it. */
2772 if (data->nominal_mode == data->passed_mode
2773 && !did_conversion
2774 && data->stack_parm != 0
2775 && MEM_P (data->stack_parm)
2776 && data->locate.offset.var == 0
2777 && reg_mentioned_p (virtual_incoming_args_rtx,
2778 XEXP (data->stack_parm, 0)))
2780 rtx linsn = get_last_insn ();
2781 rtx sinsn, set;
2783 /* Mark complex types separately. */
2784 if (GET_CODE (parmreg) == CONCAT)
2786 enum machine_mode submode
2787 = GET_MODE_INNER (GET_MODE (parmreg));
2788 int regnor = REGNO (XEXP (parmreg, 0));
2789 int regnoi = REGNO (XEXP (parmreg, 1));
2790 rtx stackr = adjust_address_nv (data->stack_parm, submode, 0);
2791 rtx stacki = adjust_address_nv (data->stack_parm, submode,
2792 GET_MODE_SIZE (submode));
2794 /* Scan backwards for the set of the real and
2795 imaginary parts. */
2796 for (sinsn = linsn; sinsn != 0;
2797 sinsn = prev_nonnote_insn (sinsn))
2799 set = single_set (sinsn);
2800 if (set == 0)
2801 continue;
2803 if (SET_DEST (set) == regno_reg_rtx [regnoi])
2804 set_unique_reg_note (sinsn, REG_EQUIV, stacki);
2805 else if (SET_DEST (set) == regno_reg_rtx [regnor])
2806 set_unique_reg_note (sinsn, REG_EQUIV, stackr);
2809 else if ((set = single_set (linsn)) != 0
2810 && SET_DEST (set) == parmreg)
2811 set_unique_reg_note (linsn, REG_EQUIV, data->stack_parm);
2814 /* For pointer data type, suggest pointer register. */
2815 if (POINTER_TYPE_P (TREE_TYPE (parm)))
2816 mark_reg_pointer (parmreg,
2817 TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm))));
2820 /* A subroutine of assign_parms. Allocate stack space to hold the current
2821 parameter. Get it there. Perform all ABI specified conversions. */
2823 static void
2824 assign_parm_setup_stack (struct assign_parm_data_all *all, tree parm,
2825 struct assign_parm_data_one *data)
2827 /* Value must be stored in the stack slot STACK_PARM during function
2828 execution. */
2829 bool to_conversion = false;
2831 if (data->promoted_mode != data->nominal_mode)
2833 /* Conversion is required. */
2834 rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm));
2836 emit_move_insn (tempreg, validize_mem (data->entry_parm));
2838 push_to_sequence (all->conversion_insns);
2839 to_conversion = true;
2841 data->entry_parm = convert_to_mode (data->nominal_mode, tempreg,
2842 TYPE_UNSIGNED (TREE_TYPE (parm)));
2844 if (data->stack_parm)
2845 /* ??? This may need a big-endian conversion on sparc64. */
2846 data->stack_parm
2847 = adjust_address (data->stack_parm, data->nominal_mode, 0);
2850 if (data->entry_parm != data->stack_parm)
2852 rtx src, dest;
2854 if (data->stack_parm == 0)
2856 data->stack_parm
2857 = assign_stack_local (GET_MODE (data->entry_parm),
2858 GET_MODE_SIZE (GET_MODE (data->entry_parm)),
2859 TYPE_ALIGN (data->passed_type));
2860 set_mem_attributes (data->stack_parm, parm, 1);
2863 dest = validize_mem (data->stack_parm);
2864 src = validize_mem (data->entry_parm);
2866 if (MEM_P (src))
2868 /* Use a block move to handle potentially misaligned entry_parm. */
2869 if (!to_conversion)
2870 push_to_sequence (all->conversion_insns);
2871 to_conversion = true;
2873 emit_block_move (dest, src,
2874 GEN_INT (int_size_in_bytes (data->passed_type)),
2875 BLOCK_OP_NORMAL);
2877 else
2878 emit_move_insn (dest, src);
2881 if (to_conversion)
2883 all->conversion_insns = get_insns ();
2884 end_sequence ();
2887 SET_DECL_RTL (parm, data->stack_parm);
2890 /* A subroutine of assign_parms. If the ABI splits complex arguments, then
2891 undo the frobbing that we did in assign_parms_augmented_arg_list. */
2893 static void
2894 assign_parms_unsplit_complex (struct assign_parm_data_all *all, tree fnargs)
2896 tree parm;
2897 tree orig_fnargs = all->orig_fnargs;
2899 for (parm = orig_fnargs; parm; parm = TREE_CHAIN (parm))
2901 if (TREE_CODE (TREE_TYPE (parm)) == COMPLEX_TYPE
2902 && targetm.calls.split_complex_arg (TREE_TYPE (parm)))
2904 rtx tmp, real, imag;
2905 enum machine_mode inner = GET_MODE_INNER (DECL_MODE (parm));
2907 real = DECL_RTL (fnargs);
2908 imag = DECL_RTL (TREE_CHAIN (fnargs));
2909 if (inner != GET_MODE (real))
2911 real = gen_lowpart_SUBREG (inner, real);
2912 imag = gen_lowpart_SUBREG (inner, imag);
2915 if (TREE_ADDRESSABLE (parm))
2917 rtx rmem, imem;
2918 HOST_WIDE_INT size = int_size_in_bytes (TREE_TYPE (parm));
2920 /* split_complex_arg put the real and imag parts in
2921 pseudos. Move them to memory. */
2922 tmp = assign_stack_local (DECL_MODE (parm), size,
2923 TYPE_ALIGN (TREE_TYPE (parm)));
2924 set_mem_attributes (tmp, parm, 1);
2925 rmem = adjust_address_nv (tmp, inner, 0);
2926 imem = adjust_address_nv (tmp, inner, GET_MODE_SIZE (inner));
2927 push_to_sequence (all->conversion_insns);
2928 emit_move_insn (rmem, real);
2929 emit_move_insn (imem, imag);
2930 all->conversion_insns = get_insns ();
2931 end_sequence ();
2933 else
2934 tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag);
2935 SET_DECL_RTL (parm, tmp);
2937 real = DECL_INCOMING_RTL (fnargs);
2938 imag = DECL_INCOMING_RTL (TREE_CHAIN (fnargs));
2939 if (inner != GET_MODE (real))
2941 real = gen_lowpart_SUBREG (inner, real);
2942 imag = gen_lowpart_SUBREG (inner, imag);
2944 tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag);
2945 set_decl_incoming_rtl (parm, tmp);
2946 fnargs = TREE_CHAIN (fnargs);
2948 else
2950 SET_DECL_RTL (parm, DECL_RTL (fnargs));
2951 set_decl_incoming_rtl (parm, DECL_INCOMING_RTL (fnargs));
2953 /* Set MEM_EXPR to the original decl, i.e. to PARM,
2954 instead of the copy of decl, i.e. FNARGS. */
2955 if (DECL_INCOMING_RTL (parm) && MEM_P (DECL_INCOMING_RTL (parm)))
2956 set_mem_expr (DECL_INCOMING_RTL (parm), parm);
2959 fnargs = TREE_CHAIN (fnargs);
2963 /* Assign RTL expressions to the function's parameters. This may involve
2964 copying them into registers and using those registers as the DECL_RTL. */
2966 static void
2967 assign_parms (tree fndecl)
2969 struct assign_parm_data_all all;
2970 tree fnargs, parm;
2972 current_function_internal_arg_pointer
2973 = targetm.calls.internal_arg_pointer ();
2975 assign_parms_initialize_all (&all);
2976 fnargs = assign_parms_augmented_arg_list (&all);
2978 for (parm = fnargs; parm; parm = TREE_CHAIN (parm))
2980 struct assign_parm_data_one data;
2982 /* Extract the type of PARM; adjust it according to ABI. */
2983 assign_parm_find_data_types (&all, parm, &data);
2985 /* Early out for errors and void parameters. */
2986 if (data.passed_mode == VOIDmode)
2988 SET_DECL_RTL (parm, const0_rtx);
2989 DECL_INCOMING_RTL (parm) = DECL_RTL (parm);
2990 continue;
2993 if (current_function_stdarg && !TREE_CHAIN (parm))
2994 assign_parms_setup_varargs (&all, &data, false);
2996 /* Find out where the parameter arrives in this function. */
2997 assign_parm_find_entry_rtl (&all, &data);
2999 /* Find out where stack space for this parameter might be. */
3000 if (assign_parm_is_stack_parm (&all, &data))
3002 assign_parm_find_stack_rtl (parm, &data);
3003 assign_parm_adjust_entry_rtl (&data);
3006 /* Record permanently how this parm was passed. */
3007 set_decl_incoming_rtl (parm, data.entry_parm);
3009 /* Update info on where next arg arrives in registers. */
3010 FUNCTION_ARG_ADVANCE (all.args_so_far, data.promoted_mode,
3011 data.passed_type, data.named_arg);
3013 assign_parm_adjust_stack_rtl (&data);
3015 if (assign_parm_setup_block_p (&data))
3016 assign_parm_setup_block (&all, parm, &data);
3017 else if (data.passed_pointer || use_register_for_decl (parm))
3018 assign_parm_setup_reg (&all, parm, &data);
3019 else
3020 assign_parm_setup_stack (&all, parm, &data);
3023 if (targetm.calls.split_complex_arg && fnargs != all.orig_fnargs)
3024 assign_parms_unsplit_complex (&all, fnargs);
3026 /* Output all parameter conversion instructions (possibly including calls)
3027 now that all parameters have been copied out of hard registers. */
3028 emit_insn (all.conversion_insns);
3030 /* If we are receiving a struct value address as the first argument, set up
3031 the RTL for the function result. As this might require code to convert
3032 the transmitted address to Pmode, we do this here to ensure that possible
3033 preliminary conversions of the address have been emitted already. */
3034 if (all.function_result_decl)
3036 tree result = DECL_RESULT (current_function_decl);
3037 rtx addr = DECL_RTL (all.function_result_decl);
3038 rtx x;
3040 if (DECL_BY_REFERENCE (result))
3041 x = addr;
3042 else
3044 addr = convert_memory_address (Pmode, addr);
3045 x = gen_rtx_MEM (DECL_MODE (result), addr);
3046 set_mem_attributes (x, result, 1);
3048 SET_DECL_RTL (result, x);
3051 /* We have aligned all the args, so add space for the pretend args. */
3052 current_function_pretend_args_size = all.pretend_args_size;
3053 all.stack_args_size.constant += all.extra_pretend_bytes;
3054 current_function_args_size = all.stack_args_size.constant;
3056 /* Adjust function incoming argument size for alignment and
3057 minimum length. */
3059 #ifdef REG_PARM_STACK_SPACE
3060 current_function_args_size = MAX (current_function_args_size,
3061 REG_PARM_STACK_SPACE (fndecl));
3062 #endif
3064 current_function_args_size = CEIL_ROUND (current_function_args_size,
3065 PARM_BOUNDARY / BITS_PER_UNIT);
3067 #ifdef ARGS_GROW_DOWNWARD
3068 current_function_arg_offset_rtx
3069 = (all.stack_args_size.var == 0 ? GEN_INT (-all.stack_args_size.constant)
3070 : expand_expr (size_diffop (all.stack_args_size.var,
3071 size_int (-all.stack_args_size.constant)),
3072 NULL_RTX, VOIDmode, 0));
3073 #else
3074 current_function_arg_offset_rtx = ARGS_SIZE_RTX (all.stack_args_size);
3075 #endif
3077 /* See how many bytes, if any, of its args a function should try to pop
3078 on return. */
3080 current_function_pops_args = RETURN_POPS_ARGS (fndecl, TREE_TYPE (fndecl),
3081 current_function_args_size);
3083 /* For stdarg.h function, save info about
3084 regs and stack space used by the named args. */
3086 current_function_args_info = all.args_so_far;
3088 /* Set the rtx used for the function return value. Put this in its
3089 own variable so any optimizers that need this information don't have
3090 to include tree.h. Do this here so it gets done when an inlined
3091 function gets output. */
3093 current_function_return_rtx
3094 = (DECL_RTL_SET_P (DECL_RESULT (fndecl))
3095 ? DECL_RTL (DECL_RESULT (fndecl)) : NULL_RTX);
3097 /* If scalar return value was computed in a pseudo-reg, or was a named
3098 return value that got dumped to the stack, copy that to the hard
3099 return register. */
3100 if (DECL_RTL_SET_P (DECL_RESULT (fndecl)))
3102 tree decl_result = DECL_RESULT (fndecl);
3103 rtx decl_rtl = DECL_RTL (decl_result);
3105 if (REG_P (decl_rtl)
3106 ? REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER
3107 : DECL_REGISTER (decl_result))
3109 rtx real_decl_rtl;
3111 real_decl_rtl = targetm.calls.function_value (TREE_TYPE (decl_result),
3112 fndecl, true);
3113 REG_FUNCTION_VALUE_P (real_decl_rtl) = 1;
3114 /* The delay slot scheduler assumes that current_function_return_rtx
3115 holds the hard register containing the return value, not a
3116 temporary pseudo. */
3117 current_function_return_rtx = real_decl_rtl;
3122 /* A subroutine of gimplify_parameters, invoked via walk_tree.
3123 For all seen types, gimplify their sizes. */
3125 static tree
3126 gimplify_parm_type (tree *tp, int *walk_subtrees, void *data)
3128 tree t = *tp;
3130 *walk_subtrees = 0;
3131 if (TYPE_P (t))
3133 if (POINTER_TYPE_P (t))
3134 *walk_subtrees = 1;
3135 else if (TYPE_SIZE (t) && !TREE_CONSTANT (TYPE_SIZE (t))
3136 && !TYPE_SIZES_GIMPLIFIED (t))
3138 gimplify_type_sizes (t, (tree *) data);
3139 *walk_subtrees = 1;
3143 return NULL;
3146 /* Gimplify the parameter list for current_function_decl. This involves
3147 evaluating SAVE_EXPRs of variable sized parameters and generating code
3148 to implement callee-copies reference parameters. Returns a list of
3149 statements to add to the beginning of the function, or NULL if nothing
3150 to do. */
3152 tree
3153 gimplify_parameters (void)
/* STMTS accumulates every statement generated below and is the value
   returned; it is still NULL if no parameter required any work.  */
3155 struct assign_parm_data_all all;
3156 tree fnargs, parm, stmts = NULL;
3158 assign_parms_initialize_all (&all);
3159 fnargs = assign_parms_augmented_arg_list (&all);
3161 for (parm = fnargs; parm; parm = TREE_CHAIN (parm))
3163 struct assign_parm_data_one data;
3165 /* Extract the type of PARM; adjust it according to ABI. */
3166 assign_parm_find_data_types (&all, parm, &data);
3168 /* Early out for errors and void parameters. */
3169 if (data.passed_mode == VOIDmode || DECL_SIZE (parm) == NULL)
3170 continue;
3172 /* Update info on where next arg arrives in registers. */
3173 FUNCTION_ARG_ADVANCE (all.args_so_far, data.promoted_mode,
3174 data.passed_type, data.named_arg);
3176 /* ??? Once upon a time variable_size stuffed parameter list
3177 SAVE_EXPRs (amongst others) onto a pending sizes list. This
3178 turned out to be less than manageable in the gimple world.
3179 Now we have to hunt them down ourselves. */
3180 walk_tree_without_duplicates (&data.passed_type,
3181 gimplify_parm_type, &stmts);
/* A non-constant DECL_SIZE means both the bit size and the unit size of
   PARM have to be gimplified.  */
3183 if (!TREE_CONSTANT (DECL_SIZE (parm)))
3185 gimplify_one_sizepos (&DECL_SIZE (parm), &stmts);
3186 gimplify_one_sizepos (&DECL_SIZE_UNIT (parm), &stmts);
/* Callee-copies handling: when reference_callee_copied says so, copy PARM
   into a fresh temporary and make that temporary PARM's
   DECL_VALUE_EXPR.  */
3189 if (data.passed_pointer)
3191 tree type = TREE_TYPE (data.passed_type);
3192 if (reference_callee_copied (&all.args_so_far, TYPE_MODE (type),
3193 type, data.named_arg))
3195 tree local, t;
3197 /* For constant sized objects, this is trivial; for
3198 variable-sized objects, we have to play games. */
3199 if (TREE_CONSTANT (DECL_SIZE (parm)))
3201 local = create_tmp_var (type, get_name (parm));
3202 DECL_IGNORED_P (local) = 0;
3204 else
3206 tree ptr_type, addr;
/* Variable size: ADDR is a pointer temporary assigned the result of a
   call to the alloca builtin for DECL_SIZE_UNIT (parm) bytes, and LOCAL
   is the dereference of ADDR.  */
3208 ptr_type = build_pointer_type (type);
3209 addr = create_tmp_var (ptr_type, get_name (parm));
3210 DECL_IGNORED_P (addr) = 0;
3211 local = build_fold_indirect_ref (addr);
3213 t = built_in_decls[BUILT_IN_ALLOCA];
3214 t = build_call_expr (t, 1, DECL_SIZE_UNIT (parm));
3215 t = fold_convert (ptr_type, t);
3216 t = build_gimple_modify_stmt (addr, t);
3217 gimplify_and_add (t, &stmts);
/* Emit LOCAL = PARM, then redirect uses of PARM to LOCAL.  */
3220 t = build_gimple_modify_stmt (local, parm);
3221 gimplify_and_add (t, &stmts);
3223 SET_DECL_VALUE_EXPR (parm, local);
3224 DECL_HAS_VALUE_EXPR_P (parm) = 1;
3229 return stmts;
3232 /* Compute the size and offset from the start of the stacked arguments for a
3233 parm passed in mode PASSED_MODE and with type TYPE.
3235 INITIAL_OFFSET_PTR points to the current offset into the stacked
3236 arguments.
3238 The starting offset and size for this parm are returned in
3239 LOCATE->OFFSET and LOCATE->SIZE, respectively. When IN_REGS is
3240 nonzero, the offset is that of stack slot, which is returned in
3241 LOCATE->SLOT_OFFSET. LOCATE->ALIGNMENT_PAD is the amount of
3242 padding required from the initial offset ptr to the stack slot.
3244 IN_REGS is nonzero if the argument will be passed in registers. It will
3245 never be set if REG_PARM_STACK_SPACE is not defined.
3247 FNDECL is the function in which the argument was defined.
3249 There are two types of rounding that are done. The first, controlled by
3250 FUNCTION_ARG_BOUNDARY, forces the offset from the start of the argument
3251 list to be aligned to the specific boundary (in bits). This rounding
3252 affects the initial and starting offsets, but not the argument size.
3254 The second, controlled by FUNCTION_ARG_PADDING and PARM_BOUNDARY,
3255 optionally rounds the size of the parm to PARM_BOUNDARY. The
3256 initial offset is not affected by this rounding, while the size always
3257 is and the starting offset may be. */
3259 /* LOCATE->OFFSET will be negative for ARGS_GROW_DOWNWARD case;
3260 INITIAL_OFFSET_PTR is positive because locate_and_pad_parm's
3261 callers pass in the total size of args so far as
3262 INITIAL_OFFSET_PTR. LOCATE->SIZE is always positive. */
/* PARTIAL is not described above.  It is used below only to compute
   part_size_in_regs -- presumably the number of bytes of the argument
   that are passed in registers; confirm against the callers.

   Side effects visible here: *INITIAL_OFFSET_PTR may be modified, the
   padding direction and boundary are recorded in LOCATE->WHERE_PAD and
   LOCATE->BOUNDARY, and cfun->stack_alignment_needed is raised to the
   boundary (capped at PREFERRED_STACK_BOUNDARY) if it was smaller.  */
3264 void
3265 locate_and_pad_parm (enum machine_mode passed_mode, tree type, int in_regs,
3266 int partial, tree fndecl ATTRIBUTE_UNUSED,
3267 struct args_size *initial_offset_ptr,
3268 struct locate_and_pad_arg_data *locate)
3270 tree sizetree;
3271 enum direction where_pad;
3272 unsigned int boundary;
3273 int reg_parm_stack_space = 0;
3274 int part_size_in_regs;
3276 #ifdef REG_PARM_STACK_SPACE
3277 reg_parm_stack_space = REG_PARM_STACK_SPACE (fndecl);
3279 /* If we have found a stack parm before we reach the end of the
3280 area reserved for registers, skip that area. */
3281 if (! in_regs)
3283 if (reg_parm_stack_space > 0)
3285 if (initial_offset_ptr->var)
3287 initial_offset_ptr->var
3288 = size_binop (MAX_EXPR, ARGS_SIZE_TREE (*initial_offset_ptr),
3289 ssize_int (reg_parm_stack_space));
3290 initial_offset_ptr->constant = 0;
3292 else if (initial_offset_ptr->constant < reg_parm_stack_space)
3293 initial_offset_ptr->constant = reg_parm_stack_space;
3296 #endif /* REG_PARM_STACK_SPACE */
/* PARTIAL is taken into account only when no register-parameter stack
   space is reserved (reg_parm_stack_space == 0).  */
3298 part_size_in_regs = (reg_parm_stack_space == 0 ? partial : 0);
/* The size comes from TYPE when it is given, otherwise from the size of
   PASSED_MODE.  */
3300 sizetree
3301 = type ? size_in_bytes (type) : size_int (GET_MODE_SIZE (passed_mode));
3302 where_pad = FUNCTION_ARG_PADDING (passed_mode, type);
3303 boundary = FUNCTION_ARG_BOUNDARY (passed_mode, type);
3304 locate->where_pad = where_pad;
3305 locate->boundary = boundary;
3307 /* Remember if the outgoing parameter requires extra alignment on the
3308 calling function side. */
3309 if (boundary > PREFERRED_STACK_BOUNDARY)
3310 boundary = PREFERRED_STACK_BOUNDARY;
3311 if (cfun->stack_alignment_needed < boundary)
3312 cfun->stack_alignment_needed = boundary;
3314 #ifdef ARGS_GROW_DOWNWARD
/* Downward-growing arguments: the slot offset starts as the negated
   initial offset and the (possibly rounded) size is subtracted from it.  */
3315 locate->slot_offset.constant = -initial_offset_ptr->constant;
3316 if (initial_offset_ptr->var)
3317 locate->slot_offset.var = size_binop (MINUS_EXPR, ssize_int (0),
3318 initial_offset_ptr->var);
3321 tree s2 = sizetree;
3322 if (where_pad != none
3323 && (!host_integerp (sizetree, 1)
3324 || (tree_low_cst (sizetree, 1) * BITS_PER_UNIT) % PARM_BOUNDARY))
3325 s2 = round_up (s2, PARM_BOUNDARY / BITS_PER_UNIT);
3326 SUB_PARM_SIZE (locate->slot_offset, s2);
3329 locate->slot_offset.constant += part_size_in_regs;
3331 if (!in_regs
3332 #ifdef REG_PARM_STACK_SPACE
3333 || REG_PARM_STACK_SPACE (fndecl) > 0
3334 #endif
3336 pad_to_arg_alignment (&locate->slot_offset, boundary,
3337 &locate->alignment_pad);
/* The size is the distance between the negated initial offset and the
   slot offset computed above.  */
3339 locate->size.constant = (-initial_offset_ptr->constant
3340 - locate->slot_offset.constant);
3341 if (initial_offset_ptr->var)
3342 locate->size.var = size_binop (MINUS_EXPR,
3343 size_binop (MINUS_EXPR,
3344 ssize_int (0),
3345 initial_offset_ptr->var),
3346 locate->slot_offset.var);
3348 /* Pad_below needs the pre-rounded size to know how much to pad
3349 below. */
3350 locate->offset = locate->slot_offset;
3351 if (where_pad == downward)
3352 pad_below (&locate->offset, passed_mode, sizetree);
3354 #else /* !ARGS_GROW_DOWNWARD */
/* Upward-growing arguments: align *INITIAL_OFFSET_PTR itself and use the
   result as the slot offset.  */
3355 if (!in_regs
3356 #ifdef REG_PARM_STACK_SPACE
3357 || REG_PARM_STACK_SPACE (fndecl) > 0
3358 #endif
3360 pad_to_arg_alignment (initial_offset_ptr, boundary,
3361 &locate->alignment_pad);
3362 locate->slot_offset = *initial_offset_ptr;
3364 #ifdef PUSH_ROUNDING
3365 if (passed_mode != BLKmode)
3366 sizetree = size_int (PUSH_ROUNDING (TREE_INT_CST_LOW (sizetree)));
3367 #endif
3369 /* Pad_below needs the pre-rounded size to know how much to pad below
3370 so this must be done before rounding up. */
3371 locate->offset = locate->slot_offset;
3372 if (where_pad == downward)
3373 pad_below (&locate->offset, passed_mode, sizetree);
3375 if (where_pad != none
3376 && (!host_integerp (sizetree, 1)
3377 || (tree_low_cst (sizetree, 1) * BITS_PER_UNIT) % PARM_BOUNDARY))
3378 sizetree = round_up (sizetree, PARM_BOUNDARY / BITS_PER_UNIT);
3380 ADD_PARM_SIZE (locate->size, sizetree);
/* Remove the bytes counted in part_size_in_regs from the size.  */
3382 locate->size.constant -= part_size_in_regs;
3383 #endif /* ARGS_GROW_DOWNWARD */
3386 /* Round the stack offset in *OFFSET_PTR up to a multiple of BOUNDARY.
3387 BOUNDARY is measured in bits, but must be a multiple of a storage unit. */
/* Details visible in the body: the rounding is applied to the offset plus
   SP_OFFSET (STACK_POINTER_OFFSET, or 0 under SPARC_STACK_BOUNDARY_HACK)
   and SP_OFFSET is subtracted again afterwards.  When ARGS_GROW_DOWNWARD
   is defined the offset is rounded down instead of up.  Nothing is
   rounded unless BOUNDARY exceeds BITS_PER_UNIT.

   *ALIGNMENT_PAD is always reset to zero; it is then set to the change
   made to *OFFSET_PTR only when BOUNDARY exceeds both PARM_BOUNDARY and
   STACK_BOUNDARY.  */
3389 static void
3390 pad_to_arg_alignment (struct args_size *offset_ptr, int boundary,
3391 struct args_size *alignment_pad)
3393 tree save_var = NULL_TREE;
3394 HOST_WIDE_INT save_constant = 0;
3395 int boundary_in_bytes = boundary / BITS_PER_UNIT;
3396 HOST_WIDE_INT sp_offset = STACK_POINTER_OFFSET;
3398 #ifdef SPARC_STACK_BOUNDARY_HACK
3399 /* ??? The SPARC port may claim a STACK_BOUNDARY higher than
3400 the real alignment of %sp. However, when it does this, the
3401 alignment of %sp+STACK_POINTER_OFFSET is STACK_BOUNDARY. */
3402 if (SPARC_STACK_BOUNDARY_HACK)
3403 sp_offset = 0;
3404 #endif
/* Remember the incoming offset so the padding can be computed later.  */
3406 if (boundary > PARM_BOUNDARY && boundary > STACK_BOUNDARY)
3408 save_var = offset_ptr->var;
3409 save_constant = offset_ptr->constant;
3412 alignment_pad->var = NULL_TREE;
3413 alignment_pad->constant = 0;
3415 if (boundary > BITS_PER_UNIT)
/* Variable offset: do the rounding on trees.  */
3417 if (offset_ptr->var)
3419 tree sp_offset_tree = ssize_int (sp_offset);
3420 tree offset = size_binop (PLUS_EXPR,
3421 ARGS_SIZE_TREE (*offset_ptr),
3422 sp_offset_tree);
3423 #ifdef ARGS_GROW_DOWNWARD
3424 tree rounded = round_down (offset, boundary / BITS_PER_UNIT);
3425 #else
3426 tree rounded = round_up (offset, boundary / BITS_PER_UNIT);
3427 #endif
3429 offset_ptr->var = size_binop (MINUS_EXPR, rounded, sp_offset_tree);
3430 /* ARGS_SIZE_TREE includes constant term. */
3431 offset_ptr->constant = 0;
3432 if (boundary > PARM_BOUNDARY && boundary > STACK_BOUNDARY)
3433 alignment_pad->var = size_binop (MINUS_EXPR, offset_ptr->var,
3434 save_var);
/* Constant offset: do the rounding on integers.  */
3436 else
3438 offset_ptr->constant = -sp_offset +
3439 #ifdef ARGS_GROW_DOWNWARD
3440 FLOOR_ROUND (offset_ptr->constant + sp_offset, boundary_in_bytes);
3441 #else
3442 CEIL_ROUND (offset_ptr->constant + sp_offset, boundary_in_bytes);
3443 #endif
3444 if (boundary > PARM_BOUNDARY && boundary > STACK_BOUNDARY)
3445 alignment_pad->constant = offset_ptr->constant - save_constant;
3450 static void
3451 pad_below (struct args_size *offset_ptr, enum machine_mode passed_mode, tree sizetree)
3453 if (passed_mode != BLKmode)
3455 if (GET_MODE_BITSIZE (passed_mode) % PARM_BOUNDARY)
3456 offset_ptr->constant
3457 += (((GET_MODE_BITSIZE (passed_mode) + PARM_BOUNDARY - 1)
3458 / PARM_BOUNDARY * PARM_BOUNDARY / BITS_PER_UNIT)
3459 - GET_MODE_SIZE (passed_mode));
3461 else
3463 if (TREE_CODE (sizetree) != INTEGER_CST
3464 || (TREE_INT_CST_LOW (sizetree) * BITS_PER_UNIT) % PARM_BOUNDARY)
3466 /* Round the size up to multiple of PARM_BOUNDARY bits. */
3467 tree s2 = round_up (sizetree, PARM_BOUNDARY / BITS_PER_UNIT);
3468 /* Add it in. */
3469 ADD_PARM_SIZE (*offset_ptr, s2);
3470 SUB_PARM_SIZE (*offset_ptr, sizetree);
3475 /* Walk the tree of blocks describing the binding levels within a function
3476 and warn about variables the might be killed by setjmp or vfork.
3477 This is done after calling flow_analysis and before global_alloc
3478 clobbers the pseudo-regs to hard regs. */
3480 void
3481 setjmp_vars_warning (tree block)
3483 tree decl, sub;
3485 for (decl = BLOCK_VARS (block); decl; decl = TREE_CHAIN (decl))
3487 if (TREE_CODE (decl) == VAR_DECL
3488 && DECL_RTL_SET_P (decl)
3489 && REG_P (DECL_RTL (decl))
3490 && regno_clobbered_at_setjmp (REGNO (DECL_RTL (decl))))
3491 warning (OPT_Wclobbered, "variable %q+D might be clobbered by"
3492 " %<longjmp%> or %<vfork%>", decl);
3495 for (sub = BLOCK_SUBBLOCKS (block); sub; sub = TREE_CHAIN (sub))
3496 setjmp_vars_warning (sub);
3499 /* Do the appropriate part of setjmp_vars_warning
3500 but for arguments instead of local variables. */
3502 void
3503 setjmp_args_warning (void)
3505 tree decl;
3506 for (decl = DECL_ARGUMENTS (current_function_decl);
3507 decl; decl = TREE_CHAIN (decl))
3508 if (DECL_RTL (decl) != 0
3509 && REG_P (DECL_RTL (decl))
3510 && regno_clobbered_at_setjmp (REGNO (DECL_RTL (decl))))
3511 warning (OPT_Wclobbered,
3512 "argument %q+D might be clobbered by %<longjmp%> or %<vfork%>",
3513 decl);
3517 /* Identify BLOCKs referenced by more than one NOTE_INSN_BLOCK_{BEG,END},
3518 and create duplicate blocks. */
3519 /* ??? Need an option to either create block fragments or to create
3520 abstract origin duplicates of a source block. It really depends
3521 on what optimization has been performed. */
3523 void
3524 reorder_blocks (void)
3526 tree block = DECL_INITIAL (current_function_decl);
3527 VEC(tree,heap) *block_stack;
3529 if (block == NULL_TREE)
3530 return;
3532 block_stack = VEC_alloc (tree, heap, 10);
3534 /* Reset the TREE_ASM_WRITTEN bit for all blocks. */
3535 clear_block_marks (block);
3537 /* Prune the old trees away, so that they don't get in the way. */
3538 BLOCK_SUBBLOCKS (block) = NULL_TREE;
3539 BLOCK_CHAIN (block) = NULL_TREE;
3541 /* Recreate the block tree from the note nesting. */
3542 reorder_blocks_1 (get_insns (), block, &block_stack);
3543 BLOCK_SUBBLOCKS (block) = blocks_nreverse (BLOCK_SUBBLOCKS (block));
3545 VEC_free (tree, heap, block_stack);
3548 /* Helper function for reorder_blocks. Reset TREE_ASM_WRITTEN. */
3550 void
3551 clear_block_marks (tree block)
3553 while (block)
3555 TREE_ASM_WRITTEN (block) = 0;
3556 clear_block_marks (BLOCK_SUBBLOCKS (block));
3557 block = BLOCK_CHAIN (block);
/* Worker for reorder_blocks.  Walk the insn chain INSNS and rebuild the
   BLOCK tree below CURRENT_BLOCK from the nesting of the
   NOTE_INSN_BLOCK_BEG and NOTE_INSN_BLOCK_END notes found there.
   *P_BLOCK_STACK holds the blocks whose BEG note has been seen; each END
   note pops one entry and is made to refer to it.  TREE_ASM_WRITTEN is
   used as the "already seen" mark on blocks.  */
3561 static void
3562 reorder_blocks_1 (rtx insns, tree current_block, VEC(tree,heap) **p_block_stack)
3564 rtx insn;
3566 for (insn = insns; insn; insn = NEXT_INSN (insn))
3568 if (NOTE_P (insn))
3570 if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_BLOCK_BEG)
3572 tree block = NOTE_BLOCK (insn);
3573 tree origin;
/* ORIGIN is the block this one is a fragment of, or BLOCK itself when it
   has no fragment origin.  */
3575 origin = (BLOCK_FRAGMENT_ORIGIN (block)
3576 ? BLOCK_FRAGMENT_ORIGIN (block)
3577 : block);
3579 /* If we have seen this block before, that means it now
3580 spans multiple address regions. Create a new fragment. */
3581 if (TREE_ASM_WRITTEN (block))
3583 tree new_block = copy_node (block);
/* Link the copy at the head of ORIGIN's fragment chain and make the note
   refer to the copy.  */
3585 BLOCK_FRAGMENT_ORIGIN (new_block) = origin;
3586 BLOCK_FRAGMENT_CHAIN (new_block)
3587 = BLOCK_FRAGMENT_CHAIN (origin);
3588 BLOCK_FRAGMENT_CHAIN (origin) = new_block;
3590 NOTE_BLOCK (insn) = new_block;
3591 block = new_block;
3594 BLOCK_SUBBLOCKS (block) = 0;
3595 TREE_ASM_WRITTEN (block) = 1;
3596 /* When there's only one block for the entire function,
3597 current_block == block and we mustn't do this, it
3598 will cause infinite recursion. */
3599 if (block != current_block)
3601 if (block != origin)
3602 gcc_assert (BLOCK_SUPERCONTEXT (origin) == current_block);
/* Push BLOCK onto the front of CURRENT_BLOCK's subblock list (the list is
   reversed again when the matching END note is reached) and descend.  */
3604 BLOCK_SUPERCONTEXT (block) = current_block;
3605 BLOCK_CHAIN (block) = BLOCK_SUBBLOCKS (current_block);
3606 BLOCK_SUBBLOCKS (current_block) = block;
3607 current_block = origin;
3609 VEC_safe_push (tree, heap, *p_block_stack, block);
3611 else if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_BLOCK_END)
/* Close the innermost open block: restore the order of its subblocks and
   return to its parent.  */
3613 NOTE_BLOCK (insn) = VEC_pop (tree, *p_block_stack);
3614 BLOCK_SUBBLOCKS (current_block)
3615 = blocks_nreverse (BLOCK_SUBBLOCKS (current_block));
3616 current_block = BLOCK_SUPERCONTEXT (current_block);
3622 /* Reverse the order of elements in the chain T of blocks,
3623 and return the new head of the chain (old last element). */
3625 tree
3626 blocks_nreverse (tree t)
3628 tree prev = 0, decl, next;
3629 for (decl = t; decl; decl = next)
3631 next = BLOCK_CHAIN (decl);
3632 BLOCK_CHAIN (decl) = prev;
3633 prev = decl;
3635 return prev;
3638 /* Count the subblocks of the list starting with BLOCK. If VECTOR is
3639 non-NULL, list them all into VECTOR, in a depth-first preorder
3640 traversal of the block tree. Also clear TREE_ASM_WRITTEN in all
3641 blocks. */
3643 static int
3644 all_blocks (tree block, tree *vector)
3646 int n_blocks = 0;
3648 while (block)
3650 TREE_ASM_WRITTEN (block) = 0;
3652 /* Record this block. */
3653 if (vector)
3654 vector[n_blocks] = block;
3656 ++n_blocks;
3658 /* Record the subblocks, and their subblocks... */
3659 n_blocks += all_blocks (BLOCK_SUBBLOCKS (block),
3660 vector ? vector + n_blocks : 0);
3661 block = BLOCK_CHAIN (block);
3664 return n_blocks;
3667 /* Return a vector containing all the blocks rooted at BLOCK. The
3668 number of elements in the vector is stored in N_BLOCKS_P. The
3669 vector is dynamically allocated; it is the caller's responsibility
3670 to call `free' on the pointer returned. */
3672 static tree *
3673 get_block_vector (tree block, int *n_blocks_p)
3675 tree *block_vector;
3677 *n_blocks_p = all_blocks (block, NULL);
3678 block_vector = XNEWVEC (tree, *n_blocks_p);
3679 all_blocks (block, block_vector);
3681 return block_vector;
3684 static GTY(()) int next_block_index = 2;
3686 /* Set BLOCK_NUMBER for all the blocks in FN. */
3688 void
3689 number_blocks (tree fn)
3691 int i;
3692 int n_blocks;
3693 tree *block_vector;
3695 /* For SDB and XCOFF debugging output, we start numbering the blocks
3696 from 1 within each function, rather than keeping a running
3697 count. */
3698 #if defined (SDB_DEBUGGING_INFO) || defined (XCOFF_DEBUGGING_INFO)
3699 if (write_symbols == SDB_DEBUG || write_symbols == XCOFF_DEBUG)
3700 next_block_index = 1;
3701 #endif
3703 block_vector = get_block_vector (DECL_INITIAL (fn), &n_blocks);
3705 /* The top-level BLOCK isn't numbered at all. */
3706 for (i = 1; i < n_blocks; ++i)
3707 /* We number the blocks from two. */
3708 BLOCK_NUMBER (block_vector[i]) = next_block_index++;
3710 free (block_vector);
3712 return;
3715 /* If VAR is present in a subblock of BLOCK, return the subblock. */
3717 tree
3718 debug_find_var_in_block_tree (tree var, tree block)
3720 tree t;
3722 for (t = BLOCK_VARS (block); t; t = TREE_CHAIN (t))
3723 if (t == var)
3724 return block;
3726 for (t = BLOCK_SUBBLOCKS (block); t; t = TREE_CHAIN (t))
3728 tree ret = debug_find_var_in_block_tree (var, t);
3729 if (ret)
3730 return ret;
3733 return NULL_TREE;
3737 /* Return value of funcdef and increase it. */
3739 get_next_funcdef_no (void)
3741 return funcdef_no++;
3744 /* Allocate a function structure for FNDECL and set its contents
3745 to the defaults. */
/* The new structure becomes cfun.  FNDECL may be NULL (see the early
   return below); in that case only the decl-independent defaults are
   installed.  Otherwise the structure is also attached to FNDECL and the
   return-value and stdarg flags are derived from FNDECL's result and
   type.  */
3747 void
3748 allocate_struct_function (tree fndecl)
3750 tree result;
3751 tree fntype = fndecl ? TREE_TYPE (fndecl) : NULL_TREE;
3753 cfun = ggc_alloc_cleared (sizeof (struct function));
3755 cfun->stack_alignment_needed = STACK_BOUNDARY;
3756 cfun->preferred_stack_boundary = STACK_BOUNDARY;
3758 current_function_funcdef_no = get_next_funcdef_no ();
3760 cfun->function_frequency = FUNCTION_FREQUENCY_NORMAL;
3762 init_eh_for_function ();
/* Give the language front end and, when the hook is set, the target a
   chance to initialize their own per-function data.  */
3764 lang_hooks.function.init (cfun);
3765 if (init_machine_status)
3766 cfun->machine = (*init_machine_status) ();
/* Everything below needs a real FUNCTION_DECL.  */
3768 if (fndecl == NULL)
3769 return;
3771 DECL_STRUCT_FUNCTION (fndecl) = cfun;
3772 cfun->decl = fndecl;
3774 result = DECL_RESULT (fndecl);
3775 if (aggregate_value_p (result, fndecl))
3777 #ifdef PCC_STATIC_STRUCT_RETURN
3778 current_function_returns_pcc_struct = 1;
3779 #endif
3780 current_function_returns_struct = 1;
3783 current_function_returns_pointer = POINTER_TYPE_P (TREE_TYPE (result));
/* stdarg: the function type has an argument type list whose last entry
   is not void_type_node.  */
3785 current_function_stdarg
3786 = (fntype
3787 && TYPE_ARG_TYPES (fntype) != 0
3788 && (TREE_VALUE (tree_last (TYPE_ARG_TYPES (fntype)))
3789 != void_type_node));
3791 /* Assume all registers in stdarg functions need to be saved. */
3792 cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
3793 cfun->va_list_fpr_size = VA_LIST_MAX_FPR_SIZE;
3796 /* Reset cfun, and other non-struct-function variables to defaults as
3797 appropriate for emitting rtl at the start of a function. */
3799 static void
3800 prepare_function_start (tree fndecl)
3802 if (fndecl && DECL_STRUCT_FUNCTION (fndecl))
3803 cfun = DECL_STRUCT_FUNCTION (fndecl);
3804 else
3805 allocate_struct_function (fndecl);
3806 init_emit ();
3807 init_varasm_status (cfun);
3808 init_expr ();
3810 cse_not_expected = ! optimize;
3812 /* Caller save not needed yet. */
3813 caller_save_needed = 0;
3815 /* We haven't done register allocation yet. */
3816 reg_renumber = 0;
3818 /* Indicate that we have not instantiated virtual registers yet. */
3819 virtuals_instantiated = 0;
3821 /* Indicate that we want CONCATs now. */
3822 generating_concat_p = 1;
3824 /* Indicate we have no need of a frame pointer yet. */
3825 frame_pointer_needed = 0;
3828 /* Initialize the rtl expansion mechanism so that we can do simple things
3829 like generate sequences. This is used to provide a context during global
3830 initialization of some passes. */
3831 void
3832 init_dummy_function_start (void)
3834 prepare_function_start (NULL);
3837 /* Generate RTL for the start of the function SUBR (a FUNCTION_DECL tree node)
3838 and initialize static variables for generating RTL for the statements
3839 of the function. */
3841 void
3842 init_function_start (tree subr)
3844 prepare_function_start (subr);
3846 /* Prevent ever trying to delete the first instruction of a
3847 function. Also tell final how to output a linenum before the
3848 function prologue. Note linenums could be missing, e.g. when
3849 compiling a Java .class file. */
3850 if (! DECL_IS_BUILTIN (subr))
3851 emit_line_note (DECL_SOURCE_LOCATION (subr));
3853 /* Make sure first insn is a note even if we don't want linenums.
3854 This makes sure the first insn will never be deleted.
3855 Also, final expects a note to appear there. */
3856 emit_note (NOTE_INSN_DELETED);
3858 /* Warn if this value is an aggregate type,
3859 regardless of which calling convention we are using for it. */
3860 if (AGGREGATE_TYPE_P (TREE_TYPE (DECL_RESULT (subr))))
3861 warning (OPT_Waggregate_return, "function returns an aggregate");
3864 /* Make sure all values used by the optimization passes have sane
3865 defaults. */
3866 unsigned int
3867 init_function_for_compilation (void)
3869 reg_renumber = 0;
3871 /* No prologue/epilogue insns yet. Make sure that these vectors are
3872 empty. */
3873 gcc_assert (VEC_length (int, prologue) == 0);
3874 gcc_assert (VEC_length (int, epilogue) == 0);
3875 gcc_assert (VEC_length (int, sibcall_epilogue) == 0);
3876 return 0;
/* Pass descriptor that runs init_function_for_compilation as its execute
   hook.  It has no name and no gate, and all of its property and todo
   fields are zero.  */
3879 struct tree_opt_pass pass_init_function =
3881 NULL, /* name */
3882 NULL, /* gate */
3883 init_function_for_compilation, /* execute */
3884 NULL, /* sub */
3885 NULL, /* next */
3886 0, /* static_pass_number */
3887 0, /* tv_id */
3888 0, /* properties_required */
3889 0, /* properties_provided */
3890 0, /* properties_destroyed */
3891 0, /* todo_flags_start */
3892 0, /* todo_flags_finish */
3893 0 /* letter */
3897 void
3898 expand_main_function (void)
3900 #if (defined(INVOKE__main) \
3901 || (!defined(HAS_INIT_SECTION) \
3902 && !defined(INIT_SECTION_ASM_OP) \
3903 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
3904 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
3905 #endif
3908 /* Expand code to initialize the stack_protect_guard. This is invoked at
3909 the beginning of a function to be protected. */
3911 #ifndef HAVE_stack_protect_set
3912 # define HAVE_stack_protect_set 0
3913 # define gen_stack_protect_set(x,y) (gcc_unreachable (), NULL_RTX)
3914 #endif
3916 void
3917 stack_protect_prologue (void)
3919 tree guard_decl = targetm.stack_protect_guard ();
3920 rtx x, y;
3922 /* Avoid expand_expr here, because we don't want guard_decl pulled
3923 into registers unless absolutely necessary. And we know that
3924 cfun->stack_protect_guard is a local stack slot, so this skips
3925 all the fluff. */
3926 x = validize_mem (DECL_RTL (cfun->stack_protect_guard));
3927 y = validize_mem (DECL_RTL (guard_decl));
3929 /* Allow the target to copy from Y to X without leaking Y into a
3930 register. */
3931 if (HAVE_stack_protect_set)
3933 rtx insn = gen_stack_protect_set (x, y);
3934 if (insn)
3936 emit_insn (insn);
3937 return;
3941 /* Otherwise do a straight move. */
3942 emit_move_insn (x, y);
3945 /* Expand code to verify the stack_protect_guard. This is invoked at
3946 the end of a function to be protected. */
/* Shape of the emitted code: a conditional jump to LABEL that is taken
   when the stack slot still equals the guard, followed by the expansion
   of targetm.stack_protect_fail (), followed by LABEL itself.  */
3948 #ifndef HAVE_stack_protect_test
3949 # define HAVE_stack_protect_test 0
3950 # define gen_stack_protect_test(x, y, z) (gcc_unreachable (), NULL_RTX)
3951 #endif
3953 void
3954 stack_protect_epilogue (void)
3956 tree guard_decl = targetm.stack_protect_guard ();
3957 rtx label = gen_label_rtx ();
3958 rtx x, y, tmp;
3960 /* Avoid expand_expr here, because we don't want guard_decl pulled
3961 into registers unless absolutely necessary. And we know that
3962 cfun->stack_protect_guard is a local stack slot, so this skips
3963 all the fluff. */
3964 x = validize_mem (DECL_RTL (cfun->stack_protect_guard));
3965 y = validize_mem (DECL_RTL (guard_decl));
3967 /* Allow the target to compare Y with X without leaking either into
3968 a register. */
/* Case 1 is selected when HAVE_stack_protect_test is nonzero.  If the
   target generator returns a null insn, control falls through to the
   generic compare-and-jump in the default case.  */
3969 switch (HAVE_stack_protect_test != 0)
3971 case 1:
3972 tmp = gen_stack_protect_test (x, y, label);
3973 if (tmp)
3975 emit_insn (tmp);
3976 break;
3978 /* FALLTHRU */
3980 default:
3981 emit_cmp_and_jump_insns (x, y, EQ, NULL_RTX, ptr_mode, 1, label);
3982 break;
3985 /* The noreturn predictor has been moved to the tree level. The rtl-level
3986 predictors estimate this branch about 20%, which isn't enough to get
3987 things moved out of line. Since this is the only extant case of adding
3988 a noreturn function at the rtl level, it doesn't seem worth doing ought
3989 except adding the prediction by hand. */
3990 tmp = get_last_insn ();
3991 if (JUMP_P (tmp))
3992 predict_insn_def (tmp, PRED_NORETURN, TAKEN);
/* Reached only when the jump above is not taken: expand the failure
   handler, then place LABEL for the normal path.  */
3994 expand_expr_stmt (targetm.stack_protect_fail ());
3995 emit_label (label);
3998 /* Start the RTL for a new function, and set variables used for
3999 emitting RTL.
4000 SUBR is the FUNCTION_DECL node.
4001 PARMS_HAVE_CLEANUPS is nonzero if there are cleanups associated with
4002 the function's parameters, which must be run at any return statement. */
/* NOTE(review): PARMS_HAVE_CLEANUPS is described above but is not a
   parameter of this function as defined here; that sentence looks
   stale.  */
4004 void
4005 expand_function_start (tree subr)
4007 /* Make sure volatile mem refs aren't considered
4008 valid operands of arithmetic insns. */
4009 init_recog_no_volatile ();
/* Profiling is enabled when profile_flag is set and SUBR does not opt out
   of entry/exit instrumentation.  */
4011 current_function_profile
4012 = (profile_flag
4013 && ! DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (subr));
/* Stack limiting is enabled when a stack limit rtx exists and SUBR does
   not opt out of it.  */
4015 current_function_limit_stack
4016 = (stack_limit_rtx != NULL_RTX && ! DECL_NO_LIMIT_STACK (subr));
4018 /* Make the label for return statements to jump to. Do not special
4019 case machines with special return instructions -- they will be
4020 handled later during jump, ifcvt, or epilogue creation. */
4021 return_label = gen_label_rtx ();
4023 /* Initialize rtx used to return the value. */
4024 /* Do this before assign_parms so that we copy the struct value address
4025 before any library calls that assign parms might generate. */
4027 /* Decide whether to return the value in memory or in a register. */
4028 if (aggregate_value_p (DECL_RESULT (subr), subr))
4030 /* Returning something that won't go in a register. */
4031 rtx value_address = 0;
4033 #ifdef PCC_STATIC_STRUCT_RETURN
4034 if (current_function_returns_pcc_struct)
4036 int size = int_size_in_bytes (TREE_TYPE (DECL_RESULT (subr)));
4037 value_address = assemble_static_space (size);
4039 else
4040 #endif
4042 rtx sv = targetm.calls.struct_value_rtx (TREE_TYPE (subr), 2);
4043 /* Expect to be passed the address of a place to store the value.
4044 If it is passed as an argument, assign_parms will take care of
4045 it. */
4046 if (sv)
4048 value_address = gen_reg_rtx (Pmode);
4049 emit_move_insn (value_address, sv);
/* When an address was obtained above, the result's rtl is either that
   address itself (DECL_BY_REFERENCE results) or a MEM at that address.  */
4052 if (value_address)
4054 rtx x = value_address;
4055 if (!DECL_BY_REFERENCE (DECL_RESULT (subr)))
4057 x = gen_rtx_MEM (DECL_MODE (DECL_RESULT (subr)), x);
4058 set_mem_attributes (x, DECL_RESULT (subr), 1);
4060 SET_DECL_RTL (DECL_RESULT (subr), x);
4063 else if (DECL_MODE (DECL_RESULT (subr)) == VOIDmode)
4064 /* If return mode is void, this decl rtl should not be used. */
4065 SET_DECL_RTL (DECL_RESULT (subr), NULL_RTX);
4066 else
4068 /* Compute the return values into a pseudo reg, which we will copy
4069 into the true return register after the cleanups are done. */
4070 tree return_type = TREE_TYPE (DECL_RESULT (subr));
4071 if (TYPE_MODE (return_type) != BLKmode
4072 && targetm.calls.return_in_msb (return_type))
4073 /* expand_function_end will insert the appropriate padding in
4074 this case. Use the return value's natural (unpadded) mode
4075 within the function proper. */
4076 SET_DECL_RTL (DECL_RESULT (subr),
4077 gen_reg_rtx (TYPE_MODE (return_type)));
4078 else
4080 /* In order to figure out what mode to use for the pseudo, we
4081 figure out what the mode of the eventual return register will
4082 actually be, and use that. */
4083 rtx hard_reg = hard_function_value (return_type, subr, 0, 1);
4085 /* Structures that are returned in registers are not
4086 aggregate_value_p, so we may see a PARALLEL or a REG. */
4087 if (REG_P (hard_reg))
4088 SET_DECL_RTL (DECL_RESULT (subr),
4089 gen_reg_rtx (GET_MODE (hard_reg)));
4090 else
4092 gcc_assert (GET_CODE (hard_reg) == PARALLEL);
4093 SET_DECL_RTL (DECL_RESULT (subr), gen_group_rtx (hard_reg));
4097 /* Set DECL_REGISTER flag so that expand_function_end will copy the
4098 result to the real return register(s). */
4099 DECL_REGISTER (DECL_RESULT (subr)) = 1;
4102 /* Initialize rtx for parameters and local variables.
4103 In some cases this requires emitting insns. */
4104 assign_parms (subr);
4106 /* If function gets a static chain arg, store it. */
4107 if (cfun->static_chain_decl)
4109 tree parm = cfun->static_chain_decl;
4110 rtx local = gen_reg_rtx (Pmode);
/* The chain arrives in static_chain_incoming_rtx and is copied into the
   fresh pseudo LOCAL, which becomes PARM's rtl.  */
4112 set_decl_incoming_rtl (parm, static_chain_incoming_rtx);
4113 SET_DECL_RTL (parm, local);
4114 mark_reg_pointer (local, TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm))));
4116 emit_move_insn (local, static_chain_incoming_rtx);
4119 /* If the function receives a non-local goto, then store the
4120 bits we need to restore the frame pointer. */
4121 if (cfun->nonlocal_goto_save_area)
4123 tree t_save;
4124 rtx r_save;
4126 /* ??? We need to do this save early. Unfortunately here is
4127 before the frame variable gets declared. Help out... */
4128 expand_var (TREE_OPERAND (cfun->nonlocal_goto_save_area, 0));
/* Element 0 of the save area receives virtual_stack_vars_rtx.  */
4130 t_save = build4 (ARRAY_REF, ptr_type_node,
4131 cfun->nonlocal_goto_save_area,
4132 integer_zero_node, NULL_TREE, NULL_TREE);
4133 r_save = expand_expr (t_save, NULL_RTX, VOIDmode, EXPAND_WRITE);
4134 r_save = convert_memory_address (Pmode, r_save);
4136 emit_move_insn (r_save, virtual_stack_vars_rtx);
4137 update_nonlocal_goto_save_area ();
4140 /* The following was moved from init_function_start.
4141 The move is supposed to make sdb output more accurate. */
4142 /* Indicate the beginning of the function body,
4143 as opposed to parm setup. */
4144 emit_note (NOTE_INSN_FUNCTION_BEG);
/* The note just emitted must be the last insn; it is recorded as
   parm_birth_insn.  */
4146 gcc_assert (NOTE_P (get_last_insn ()));
4148 parm_birth_insn = get_last_insn ();
/* When profiling, invoke the target's PROFILE_HOOK (if it defines one)
   with this function's funcdef number.  */
4150 if (current_function_profile)
4152 #ifdef PROFILE_HOOK
4153 PROFILE_HOOK (current_function_funcdef_no);
4154 #endif
4157 /* After the display initializations is where the stack checking
4158 probe should go. */
4159 if(flag_stack_check)
4160 stack_check_probe_note = emit_note (NOTE_INSN_DELETED);
4162 /* Make sure there is a line number after the function entry setup code. */
4163 force_next_line_note ();
4166 /* Undo the effects of init_dummy_function_start. */
4167 void
4168 expand_dummy_function_end (void)
4170 /* End any sequences that failed to be closed due to syntax errors. */
4171 while (in_sequence_p ())
4172 end_sequence ();
4174 /* Outside function body, can't compute type's actual size
4175 until next function's body starts. */
4177 free_after_parsing (cfun);
4178 free_after_compilation (cfun);
4179 cfun = 0;
4182 /* Call DOIT for each hard register used as a return value from
4183 the current function. */
4185 void
4186 diddle_return_value (void (*doit) (rtx, void *), void *arg)
4188 rtx outgoing = current_function_return_rtx;
4190 if (! outgoing)
4191 return;
4193 if (REG_P (outgoing))
4194 (*doit) (outgoing, arg);
4195 else if (GET_CODE (outgoing) == PARALLEL)
4197 int i;
4199 for (i = 0; i < XVECLEN (outgoing, 0); i++)
4201 rtx x = XEXP (XVECEXP (outgoing, 0, i), 0);
4203 if (REG_P (x) && REGNO (x) < FIRST_PSEUDO_REGISTER)
4204 (*doit) (x, arg);
4209 static void
4210 do_clobber_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
4212 emit_insn (gen_rtx_CLOBBER (VOIDmode, reg));
4215 void
4216 clobber_return_register (void)
4218 diddle_return_value (do_clobber_return_reg, NULL);
4220 /* In case we do use pseudo to return value, clobber it too. */
4221 if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
4223 tree decl_result = DECL_RESULT (current_function_decl);
4224 rtx decl_rtl = DECL_RTL (decl_result);
4225 if (REG_P (decl_rtl) && REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER)
4227 do_clobber_return_reg (decl_rtl, NULL);
4232 static void
4233 do_use_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
4235 emit_insn (gen_rtx_USE (VOIDmode, reg));
4238 static void
4239 use_return_register (void)
4241 diddle_return_value (do_use_return_reg, NULL);
4244 /* Possibly warn about unused parameters. */
4245 void
4246 do_warn_unused_parameter (tree fn)
4248 tree decl;
4250 for (decl = DECL_ARGUMENTS (fn);
4251 decl; decl = TREE_CHAIN (decl))
4252 if (!TREE_USED (decl) && TREE_CODE (decl) == PARM_DECL
4253 && DECL_NAME (decl) && !DECL_ARTIFICIAL (decl))
4254 warning (OPT_Wunused_parameter, "unused parameter %q+D", decl);
/* NOTE(review): this variable is not referenced in the surrounding
   functions; presumably it is used by trampoline code elsewhere in the
   file -- confirm before relying on it.  */
4257 static GTY(()) rtx initial_trampoline;
4259 /* Generate RTL for the end of the current function. */
/* In order, this routine: initializes the arg pointer save area if that
   is still pending; when stack checking is enabled and the function
   contains a call, inserts a stack probe before stack_check_probe_note;
   optionally warns about unused parameters; closes any sequences left
   open; emits the end-of-function line note and return_label; copies
   the return value into current_function_return_rtx; emits the clobber
   of the return registers ahead of return_label; emits
   naked_return_label; and finally emits the blockage, the stack
   protector check, the alloca stack save/restore and the USE of the
   return registers.  */
4261 void
4262 expand_function_end (void)
4264 rtx clobber_after;
4266 /* If arg_pointer_save_area was referenced only from a nested
4267 function, we will not have initialized it yet. Do that now. */
4268 if (arg_pointer_save_area && ! cfun->arg_pointer_save_area_init)
4269 get_arg_pointer_save_area (cfun);
4271 /* If we are doing stack checking and this function makes calls,
4272 do a stack probe at the start of the function to ensure we have enough
4273 space for another stack frame. */
4274 if (flag_stack_check && ! STACK_CHECK_BUILTIN)
4276 rtx insn, seq;
/* Scan for the first call insn; one probe is enough, hence the break
   once it has been inserted before stack_check_probe_note.  */
4278 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
4279 if (CALL_P (insn))
4281 start_sequence ();
4282 probe_stack_range (STACK_CHECK_PROTECT,
4283 GEN_INT (STACK_CHECK_MAX_FRAME_SIZE));
4284 seq = get_insns ();
4285 end_sequence ();
4286 emit_insn_before (seq, stack_check_probe_note);
4287 break;
4291 /* Possibly warn about unused parameters.
4292 When frontend does unit-at-a-time, the warning is already
4293 issued at finalization time. */
4294 if (warn_unused_parameter
4295 && !lang_hooks.callgraph.expand_function)
4296 do_warn_unused_parameter (current_function_decl);
4298 /* End any sequences that failed to be closed due to syntax errors. */
4299 while (in_sequence_p ())
4300 end_sequence ();
4302 clear_pending_stack_adjust ();
4303 do_pending_stack_adjust ();
4305 /* Output a linenumber for the end of the function.
4306 SDB depends on this. */
4307 force_next_line_note ();
4308 emit_line_note (input_location);
4310 /* Before the return label (if any), clobber the return
4311 registers so that they are not propagated live to the rest of
4312 the function. This can only happen with functions that drop
4313 through; if there had been a return statement, there would
4314 have either been a return rtx, or a jump to the return label.
4316 We delay actual code generation after the current_function_value_rtx
4317 is computed. */
4318 clobber_after = get_last_insn ();
4320 /* Output the label for the actual return from the function. */
4321 emit_label (return_label);
4323 if (USING_SJLJ_EXCEPTIONS)
4325 /* Let except.c know where it should emit the call to unregister
4326 the function context for sjlj exceptions. */
4327 if (flag_exceptions)
4328 sjlj_emit_function_exit_after (get_last_insn ());
4331 /* If this is an implementation of throw, do what's necessary to
4332 communicate between __builtin_eh_return and the epilogue. */
4333 expand_eh_return ();
4335 /* If scalar return value was computed in a pseudo-reg, or was a named
4336 return value that got dumped to the stack, copy that to the hard
4337 return register. */
4338 if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
4340 tree decl_result = DECL_RESULT (current_function_decl);
4341 rtx decl_rtl = DECL_RTL (decl_result);
/* A copy is needed when the result lives in a pseudo register, or when
   it is not in a register at all but DECL_REGISTER is set on it.  */
4343 if (REG_P (decl_rtl)
4344 ? REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER
4345 : DECL_REGISTER (decl_result))
4347 rtx real_decl_rtl = current_function_return_rtx;
4349 /* This should be set in assign_parms. */
4350 gcc_assert (REG_FUNCTION_VALUE_P (real_decl_rtl));
4352 /* If this is a BLKmode structure being returned in registers,
4353 then use the mode computed in expand_return. Note that if
4354 decl_rtl is memory, then its mode may have been changed,
4355 but that current_function_return_rtx has not. */
4356 if (GET_MODE (real_decl_rtl) == BLKmode)
4357 PUT_MODE (real_decl_rtl, GET_MODE (decl_rtl));
4359 /* If a non-BLKmode return value should be padded at the least
4360 significant end of the register, shift it left by the appropriate
4361 amount. BLKmode results are handled using the group load/store
4362 machinery. */
4363 if (TYPE_MODE (TREE_TYPE (decl_result)) != BLKmode
4364 && targetm.calls.return_in_msb (TREE_TYPE (decl_result)))
4366 emit_move_insn (gen_rtx_REG (GET_MODE (decl_rtl),
4367 REGNO (real_decl_rtl)),
4368 decl_rtl);
4369 shift_return_value (GET_MODE (decl_rtl), true, real_decl_rtl);
4371 /* If a named return value dumped decl_return to memory, then
4372 we may need to re-do the PROMOTE_MODE signed/unsigned
4373 extension. */
4374 else if (GET_MODE (real_decl_rtl) != GET_MODE (decl_rtl))
4376 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (decl_result));
4378 if (targetm.calls.promote_function_return (TREE_TYPE (current_function_decl)))
4379 promote_mode (TREE_TYPE (decl_result), GET_MODE (decl_rtl),
4380 &unsignedp, 1);
4382 convert_move (real_decl_rtl, decl_rtl, unsignedp);
4384 else if (GET_CODE (real_decl_rtl) == PARALLEL)
4386 /* If expand_function_start has created a PARALLEL for decl_rtl,
4387 move the result to the real return registers. Otherwise, do
4388 a group load from decl_rtl for a named return. */
4389 if (GET_CODE (decl_rtl) == PARALLEL)
4390 emit_group_move (real_decl_rtl, decl_rtl);
4391 else
4392 emit_group_load (real_decl_rtl, decl_rtl,
4393 TREE_TYPE (decl_result),
4394 int_size_in_bytes (TREE_TYPE (decl_result)));
4396 /* In the case of complex integer modes smaller than a word, we'll
4397 need to generate some non-trivial bitfield insertions. Do that
4398 on a pseudo and not the hard register. */
4399 else if (GET_CODE (decl_rtl) == CONCAT
4400 && GET_MODE_CLASS (GET_MODE (decl_rtl)) == MODE_COMPLEX_INT
4401 && GET_MODE_BITSIZE (GET_MODE (decl_rtl)) <= BITS_PER_WORD)
4403 int old_generating_concat_p;
4404 rtx tmp;
/* generating_concat_p is cleared only around the gen_reg_rtx call and
   then restored to its previous value.  */
4406 old_generating_concat_p = generating_concat_p;
4407 generating_concat_p = 0;
4408 tmp = gen_reg_rtx (GET_MODE (decl_rtl));
4409 generating_concat_p = old_generating_concat_p;
4411 emit_move_insn (tmp, decl_rtl);
4412 emit_move_insn (real_decl_rtl, tmp);
4414 else
4415 emit_move_insn (real_decl_rtl, decl_rtl);
4419 /* If returning a structure, arrange to return the address of the value
4420 in a place where debuggers expect to find it.
4422 If returning a structure PCC style,
4423 the caller also depends on this value.
4424 And current_function_returns_pcc_struct is not necessarily set. */
4425 if (current_function_returns_struct
4426 || current_function_returns_pcc_struct)
4428 rtx value_address = DECL_RTL (DECL_RESULT (current_function_decl));
4429 tree type = TREE_TYPE (DECL_RESULT (current_function_decl));
4430 rtx outgoing;
/* When the result is passed by reference its rtl is used as the address
   directly; otherwise the address is taken from operand 0 of the
   result's rtl.  */
4432 if (DECL_BY_REFERENCE (DECL_RESULT (current_function_decl)))
4433 type = TREE_TYPE (type);
4434 else
4435 value_address = XEXP (value_address, 0);
4437 outgoing = targetm.calls.function_value (build_pointer_type (type),
4438 current_function_decl, true);
4440 /* Mark this as a function return value so integrate will delete the
4441 assignment and USE below when inlining this function. */
4442 REG_FUNCTION_VALUE_P (outgoing) = 1;
4444 /* The address may be ptr_mode and OUTGOING may be Pmode. */
4445 value_address = convert_memory_address (GET_MODE (outgoing),
4446 value_address);
4448 emit_move_insn (outgoing, value_address);
4450 /* Show return register used to hold result (in this case the address
4451 of the result). */
4452 current_function_return_rtx = outgoing;
4455 /* Emit the actual code to clobber return register. */
/* The insns are built in a separate sequence and inserted after
   CLOBBER_AFTER, which was captured before return_label was emitted, so
   they end up ahead of that label.  */
4457 rtx seq;
4459 start_sequence ();
4460 clobber_return_register ();
4461 expand_naked_return ();
4462 seq = get_insns ();
4463 end_sequence ();
4465 emit_insn_after (seq, clobber_after);
4468 /* Output the label for the naked return from the function. */
4469 emit_label (naked_return_label);
4471 /* @@@ This is a kludge. We want to ensure that instructions that
4472 may trap are not moved into the epilogue by scheduling, because
4473 we don't always emit unwind information for the epilogue.
4474 However, not all machine descriptions define a blockage insn, so
4475 emit an ASM_INPUT to act as one. */
4476 if (! USING_SJLJ_EXCEPTIONS && flag_non_call_exceptions)
4477 emit_insn (gen_rtx_ASM_INPUT (VOIDmode, ""));
4479 /* If stack protection is enabled for this function, check the guard. */
4480 if (cfun->stack_protect_guard)
4481 stack_protect_epilogue ();
4483 /* If we had calls to alloca, and this machine needs
4484 an accurate stack pointer to exit the function,
4485 insert some code to save and restore the stack pointer. */
4486 if (! EXIT_IGNORE_STACK
4487 && current_function_calls_alloca)
4489 rtx tem = 0;
/* The save is handed parm_birth_insn as its position argument, the
   restore NULL_RTX; TEM carries the save area from one call to the
   other.  */
4491 emit_stack_save (SAVE_FUNCTION, &tem, parm_birth_insn);
4492 emit_stack_restore (SAVE_FUNCTION, tem, NULL_RTX);
4495 /* ??? This should no longer be necessary since stupid is no longer with
4496 us, but there are some parts of the compiler (eg reload_combine, and
4497 sh mach_dep_reorg) that still try and compute their own lifetime info
4498 instead of using the general framework. */
4499 use_return_register ();
4503 get_arg_pointer_save_area (struct function *f)
4505 rtx ret = f->x_arg_pointer_save_area;
4507 if (! ret)
4509 ret = assign_stack_local_1 (Pmode, GET_MODE_SIZE (Pmode), 0, f);
4510 f->x_arg_pointer_save_area = ret;
4513 if (f == cfun && ! f->arg_pointer_save_area_init)
4515 rtx seq;
4517 /* Save the arg pointer at the beginning of the function. The
4518 generated stack slot may not be a valid memory address, so we
4519 have to check it and fix it if necessary. */
4520 start_sequence ();
4521 emit_move_insn (validize_mem (ret), virtual_incoming_args_rtx);
4522 seq = get_insns ();
4523 end_sequence ();
4525 push_topmost_sequence ();
4526 emit_insn_after (seq, entry_of_function ());
4527 pop_topmost_sequence ();
4530 return ret;
4533 /* Extend a vector that records the INSN_UIDs of INSNS
4534 (a list of one or more insns). */
4536 static void
4537 record_insns (rtx insns, VEC(int,heap) **vecp)
4539 rtx tmp;
4541 for (tmp = insns; tmp != NULL_RTX; tmp = NEXT_INSN (tmp))
4542 VEC_safe_push (int, heap, *vecp, INSN_UID (tmp));
4545 /* Set the locator of the insn chain starting at INSN to LOC. */
4546 static void
4547 set_insn_locators (rtx insn, int loc)
4549 while (insn != NULL_RTX)
4551 if (INSN_P (insn))
4552 INSN_LOCATOR (insn) = loc;
4553 insn = NEXT_INSN (insn);
4557 /* Determine how many INSN_UIDs in VEC are part of INSN. Because we can
4558 be running after reorg, SEQUENCE rtl is possible. */
4560 static int
4561 contains (rtx insn, VEC(int,heap) **vec)
4563 int i, j;
4565 if (NONJUMP_INSN_P (insn)
4566 && GET_CODE (PATTERN (insn)) == SEQUENCE)
4568 int count = 0;
4569 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
4570 for (j = VEC_length (int, *vec) - 1; j >= 0; --j)
4571 if (INSN_UID (XVECEXP (PATTERN (insn), 0, i))
4572 == VEC_index (int, *vec, j))
4573 count++;
4574 return count;
4576 else
4578 for (j = VEC_length (int, *vec) - 1; j >= 0; --j)
4579 if (INSN_UID (insn) == VEC_index (int, *vec, j))
4580 return 1;
4582 return 0;
4586 prologue_epilogue_contains (rtx insn)
4588 if (contains (insn, &prologue))
4589 return 1;
4590 if (contains (insn, &epilogue))
4591 return 1;
4592 return 0;
4596 sibcall_epilogue_contains (rtx insn)
4598 if (sibcall_epilogue)
4599 return contains (insn, &sibcall_epilogue);
4600 return 0;
4603 #ifdef HAVE_return
4604 /* Insert gen_return at the end of block BB. This also means updating
4605 block_for_insn appropriately. */
4607 static void
4608 emit_return_into_block (basic_block bb)
4610 emit_jump_insn_after (gen_return (), BB_END (bb));
4612 #endif /* HAVE_return */
4614 #if defined(HAVE_epilogue) && defined(INCOMING_RETURN_ADDR_RTX)
4616 /* These functions convert the epilogue into a variant that does not
4617 modify the stack pointer. This is used in cases where a function
4618 returns an object whose size is not known until it is computed.
4619 The called function leaves the object on the stack, leaves the
4620 stack depressed, and returns a pointer to the object.
4622 What we need to do is track all modifications and references to the
4623 stack pointer, deleting the modifications and changing the
4624 references to point to the location the stack pointer would have
4625 pointed to had the modifications taken place.
4627 These functions need to be portable so we need to make as few
4628 assumptions about the epilogue as we can. However, the epilogue
4629 basically contains three things: instructions to reset the stack
4630 pointer, instructions to reload registers, possibly including the
4631 frame pointer, and an instruction to return to the caller.
4633 We must be sure of what a relevant epilogue insn is doing. We also
4634 make no attempt to validate the insns we make since if they are
4635 invalid, we probably can't do anything valid. The intent is that
4636 these routines get "smarter" as more and more machines start to use
4637 them and they try operating on different epilogues.
4639 We use the following structure to track what the part of the
4640 epilogue that we've already processed has done. We keep two copies
4641 of the SP equivalence, one for use during the insn we are
4642 processing and one for use in the next insn. The difference is
4643 because one part of a PARALLEL may adjust SP and the other may use
4644 it. */
4646 struct epi_info
4648 rtx sp_equiv_reg; /* REG that SP is set from, perhaps SP. */
4649 HOST_WIDE_INT sp_offset; /* Offset from SP_EQUIV_REG of present SP. */
4650 rtx new_sp_equiv_reg; /* REG to be used at end of insn. */
4651 HOST_WIDE_INT new_sp_offset; /* Offset to be used at end of insn. */
4652 rtx equiv_reg_src; /* If nonzero, the value that SP_EQUIV_REG
4653 should be set to once we no longer need
4654 its value. */
4655 rtx const_equiv[FIRST_PSEUDO_REGISTER]; /* Any known constant equivalences
4656 for registers. */
4659 static void handle_epilogue_set (rtx, struct epi_info *);
4660 static void update_epilogue_consts (rtx, rtx, void *);
4661 static void emit_equiv_load (struct epi_info *);
4663 /* Modify INSNS, a list of one or more insns that is part of the epilogue, to
4664 make no modifications to the stack pointer. Return the new list of insns. */
/* A single-insn list is returned unchanged.  Otherwise the list is
   rebuilt inside a fresh sequence: each insn is either re-added as is,
   re-added with SP replaced by its tracked equivalent, or handed to
   handle_epilogue_set, and the rebuilt list is returned.  */
4666 static rtx
4667 keep_stack_depressed (rtx insns)
4669 int j;
4670 struct epi_info info;
4671 rtx insn, next;
4673 /* If the epilogue is just a single instruction, it must be OK as is. */
4674 if (NEXT_INSN (insns) == NULL_RTX)
4675 return insns;
4677 /* Otherwise, start a sequence, initialize the information we have, and
4678 process all the insns we were given. */
4679 start_sequence ();
4681 info.sp_equiv_reg = stack_pointer_rtx;
4682 info.sp_offset = 0;
4683 info.equiv_reg_src = 0;
4685 for (j = 0; j < FIRST_PSEUDO_REGISTER; j++)
4686 info.const_equiv[j] = 0;
4688 insn = insns;
4689 next = NULL_RTX;
4690 while (insn != NULL_RTX)
/* NEXT is fetched up front because INSN is about to be re-linked into
   the new sequence.  */
4692 next = NEXT_INSN (insn);
/* Anything that is not a real insn is passed through untouched.  */
4694 if (!INSN_P (insn))
4696 add_insn (insn);
4697 insn = next;
4698 continue;
4701 /* If this insn references the register that SP is equivalent to and
4702 we have a pending load to that register, we must force out the load
4703 first and then indicate we no longer know what SP's equivalent is. */
4704 if (info.equiv_reg_src != 0
4705 && reg_referenced_p (info.sp_equiv_reg, PATTERN (insn)))
4707 emit_equiv_load (&info);
4708 info.sp_equiv_reg = 0;
4711 info.new_sp_equiv_reg = info.sp_equiv_reg;
4712 info.new_sp_offset = info.sp_offset;
4714 /* If this is a (RETURN) and the return address is on the stack,
4715 update the address and change to an indirect jump. */
4716 if (GET_CODE (PATTERN (insn)) == RETURN
4717 || (GET_CODE (PATTERN (insn)) == PARALLEL
4718 && GET_CODE (XVECEXP (PATTERN (insn), 0, 0)) == RETURN))
4720 rtx retaddr = INCOMING_RETURN_ADDR_RTX;
4721 rtx base = 0;
4722 HOST_WIDE_INT offset = 0;
4723 rtx jump_insn, jump_set;
4725 /* If the return address is in a register, we can emit the insn
4726 unchanged. Otherwise, it must be a MEM and we see what the
4727 base register and offset are. In any case, we have to emit any
4728 pending load to the equivalent reg of SP, if any. */
4729 if (REG_P (retaddr))
4731 emit_equiv_load (&info);
4732 add_insn (insn);
4733 insn = next;
4734 continue;
4736 else
4738 rtx ret_ptr;
4739 gcc_assert (MEM_P (retaddr));
4741 ret_ptr = XEXP (retaddr, 0);
/* Only two address shapes are accepted: a bare register, or a register
   plus a CONST_INT; anything else trips the assertion below.  */
4743 if (REG_P (ret_ptr))
4745 base = gen_rtx_REG (Pmode, REGNO (ret_ptr));
4746 offset = 0;
4748 else
4750 gcc_assert (GET_CODE (ret_ptr) == PLUS
4751 && REG_P (XEXP (ret_ptr, 0))
4752 && GET_CODE (XEXP (ret_ptr, 1)) == CONST_INT);
4753 base = gen_rtx_REG (Pmode, REGNO (XEXP (ret_ptr, 0)));
4754 offset = INTVAL (XEXP (ret_ptr, 1));
4758 /* If the base of the location containing the return pointer
4759 is SP, we must update it with the replacement address. Otherwise,
4760 just build the necessary MEM. */
4761 retaddr = plus_constant (base, offset);
4762 if (base == stack_pointer_rtx)
4763 retaddr = simplify_replace_rtx (retaddr, stack_pointer_rtx,
4764 plus_constant (info.sp_equiv_reg,
4765 info.sp_offset));
4767 retaddr = gen_rtx_MEM (Pmode, retaddr);
4768 MEM_NOTRAP_P (retaddr) = 1;
4770 /* If there is a pending load to the equivalent register for SP
4771 and we reference that register, we must load our address into
4772 a scratch register and then do that load. */
4773 if (info.equiv_reg_src
4774 && reg_overlap_mentioned_p (info.equiv_reg_src, retaddr))
4776 unsigned int regno;
4777 rtx reg;
/* Pick the first hard register that is valid for Pmode, not fixed,
   marked in regs_invalidated_by_call, not live at the start of the exit
   block, not referenced by the pending load and without a tracked
   constant.  The assertion after the loop requires that one exists.  */
4779 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
4780 if (HARD_REGNO_MODE_OK (regno, Pmode)
4781 && !fixed_regs[regno]
4782 && TEST_HARD_REG_BIT (regs_invalidated_by_call, regno)
4783 && !REGNO_REG_SET_P
4784 (EXIT_BLOCK_PTR->il.rtl->global_live_at_start, regno)
4785 && !refers_to_regno_p (regno,
4786 regno + hard_regno_nregs[regno]
4787 [Pmode],
4788 info.equiv_reg_src, NULL)
4789 && info.const_equiv[regno] == 0)
4790 break;
4792 gcc_assert (regno < FIRST_PSEUDO_REGISTER);
4794 reg = gen_rtx_REG (Pmode, regno);
4795 emit_move_insn (reg, retaddr);
4796 retaddr = reg;
4799 emit_equiv_load (&info);
4800 jump_insn = emit_jump_insn (gen_indirect_jump (retaddr));
4802 /* Show the SET in the above insn is a RETURN. */
4803 jump_set = single_set (jump_insn);
4804 gcc_assert (jump_set);
4805 SET_IS_RETURN_P (jump_set) = 1;
4808 /* If SP is not mentioned in the pattern and its equivalent register, if
4809 any, is not modified, just emit it. Otherwise, if neither is set,
4810 replace the reference to SP and emit the insn. If none of those are
4811 true, handle each SET individually. */
4812 else if (!reg_mentioned_p (stack_pointer_rtx, PATTERN (insn))
4813 && (info.sp_equiv_reg == stack_pointer_rtx
4814 || !reg_set_p (info.sp_equiv_reg, insn)))
4815 add_insn (insn);
4816 else if (! reg_set_p (stack_pointer_rtx, insn)
4817 && (info.sp_equiv_reg == stack_pointer_rtx
4818 || !reg_set_p (info.sp_equiv_reg, insn)))
4820 int changed;
4822 changed = validate_replace_rtx (stack_pointer_rtx,
4823 plus_constant (info.sp_equiv_reg,
4824 info.sp_offset),
4825 insn);
4826 gcc_assert (changed);
4828 add_insn (insn);
4830 else if (GET_CODE (PATTERN (insn)) == SET)
4831 handle_epilogue_set (PATTERN (insn), &info);
4832 else if (GET_CODE (PATTERN (insn)) == PARALLEL)
4834 for (j = 0; j < XVECLEN (PATTERN (insn), 0); j++)
4835 if (GET_CODE (XVECEXP (PATTERN (insn), 0, j)) == SET)
4836 handle_epilogue_set (XVECEXP (PATTERN (insn), 0, j), &info);
4838 else
4839 add_insn (insn);
/* The equivalence computed for the end of this insn becomes the current
   one for the next insn.  */
4841 info.sp_equiv_reg = info.new_sp_equiv_reg;
4842 info.sp_offset = info.new_sp_offset;
4844 /* Now update any constants this insn sets. */
4845 note_stores (PATTERN (insn), update_epilogue_consts, &info);
4846 insn = next;
4849 insns = get_insns ();
4850 end_sequence ();
4851 return insns;
4854 /* SET is a SET from an insn in the epilogue. P is a pointer to the epi_info
4855 structure that contains information about what we've seen so far. We
4856 process this SET by either updating that data or by emitting one or
4857 more insns. */
/* Three cases are distinguished: SET assigns SP (only the tracking data
   in P is updated), SET assigns the register SP is currently equivalent
   to (the source is remembered in P->equiv_reg_src as a pending load),
   or anything else (SP references are replaced and SET is emitted).  */
4859 static void
4860 handle_epilogue_set (rtx set, struct epi_info *p)
4862 /* First handle the case where we are setting SP. Record what it is being
4863 set from, which we must be able to determine. */
4864 if (reg_set_p (stack_pointer_rtx, set))
4866 gcc_assert (SET_DEST (set) == stack_pointer_rtx);
4868 if (GET_CODE (SET_SRC (set)) == PLUS)
4870 p->new_sp_equiv_reg = XEXP (SET_SRC (set), 0);
4871 if (GET_CODE (XEXP (SET_SRC (set), 1)) == CONST_INT)
4872 p->new_sp_offset = INTVAL (XEXP (SET_SRC (set), 1));
4873 else
/* A non-constant addend is accepted only if it is a hard register whose
   constant value is being tracked in P->const_equiv.  */
4875 gcc_assert (REG_P (XEXP (SET_SRC (set), 1))
4876 && (REGNO (XEXP (SET_SRC (set), 1))
4877 < FIRST_PSEUDO_REGISTER)
4878 && p->const_equiv[REGNO (XEXP (SET_SRC (set), 1))]);
4879 p->new_sp_offset
4880 = INTVAL (p->const_equiv[REGNO (XEXP (SET_SRC (set), 1))]);
4883 else
/* Plain copy into SP: the source itself is the new equivalent, at
   offset zero (both assignments are joined by a comma operator).  */
4884 p->new_sp_equiv_reg = SET_SRC (set), p->new_sp_offset = 0;
4886 /* If we are adjusting SP, we adjust from the old data. */
4887 if (p->new_sp_equiv_reg == stack_pointer_rtx)
4889 p->new_sp_equiv_reg = p->sp_equiv_reg;
4890 p->new_sp_offset += p->sp_offset;
4893 gcc_assert (p->new_sp_equiv_reg && REG_P (p->new_sp_equiv_reg));
4895 return;
4898 /* Next handle the case where we are setting SP's equivalent
4899 register. We must not already have a value to set it to. We
4900 could update, but there seems little point in handling that case.
4901 Note that we have to allow for the case where we are setting the
4902 register set in the previous part of a PARALLEL inside a single
4903 insn. But use the old offset for any updates within this insn.
4904 We must allow for the case where the register is being set in a
4905 different (usually wider) mode than Pmode. */
4906 else if (p->new_sp_equiv_reg != 0 && reg_set_p (p->new_sp_equiv_reg, set))
4908 gcc_assert (!p->equiv_reg_src
4909 && REG_P (p->new_sp_equiv_reg)
4910 && REG_P (SET_DEST (set))
4911 && (GET_MODE_BITSIZE (GET_MODE (SET_DEST (set)))
4912 <= BITS_PER_WORD)
4913 && REGNO (p->new_sp_equiv_reg) == REGNO (SET_DEST (set)));
/* Nothing is emitted here; the source, with SP rewritten, is only
   recorded so that emit_equiv_load can emit the load later.  */
4914 p->equiv_reg_src
4915 = simplify_replace_rtx (SET_SRC (set), stack_pointer_rtx,
4916 plus_constant (p->sp_equiv_reg,
4917 p->sp_offset));
4920 /* Otherwise, replace any references to SP in the insn to its new value
4921 and emit the insn. */
4922 else
4924 SET_SRC (set) = simplify_replace_rtx (SET_SRC (set), stack_pointer_rtx,
4925 plus_constant (p->sp_equiv_reg,
4926 p->sp_offset));
4927 SET_DEST (set) = simplify_replace_rtx (SET_DEST (set), stack_pointer_rtx,
4928 plus_constant (p->sp_equiv_reg,
4929 p->sp_offset));
4930 emit_insn (set);
4934 /* Update the tracking information for registers set to constants. */
4936 static void
4937 update_epilogue_consts (rtx dest, rtx x, void *data)
4939 struct epi_info *p = (struct epi_info *) data;
4940 rtx new;
4942 if (!REG_P (dest) || REGNO (dest) >= FIRST_PSEUDO_REGISTER)
4943 return;
4945 /* If we are either clobbering a register or doing a partial set,
4946 show we don't know the value. */
4947 else if (GET_CODE (x) == CLOBBER || ! rtx_equal_p (dest, SET_DEST (x)))
4948 p->const_equiv[REGNO (dest)] = 0;
4950 /* If we are setting it to a constant, record that constant. */
4951 else if (GET_CODE (SET_SRC (x)) == CONST_INT)
4952 p->const_equiv[REGNO (dest)] = SET_SRC (x);
4954 /* If this is a binary operation between a register we have been tracking
4955 and a constant, see if we can compute a new constant value. */
4956 else if (ARITHMETIC_P (SET_SRC (x))
4957 && REG_P (XEXP (SET_SRC (x), 0))
4958 && REGNO (XEXP (SET_SRC (x), 0)) < FIRST_PSEUDO_REGISTER
4959 && p->const_equiv[REGNO (XEXP (SET_SRC (x), 0))] != 0
4960 && GET_CODE (XEXP (SET_SRC (x), 1)) == CONST_INT
4961 && 0 != (new = simplify_binary_operation
4962 (GET_CODE (SET_SRC (x)), GET_MODE (dest),
4963 p->const_equiv[REGNO (XEXP (SET_SRC (x), 0))],
4964 XEXP (SET_SRC (x), 1)))
4965 && GET_CODE (new) == CONST_INT)
4966 p->const_equiv[REGNO (dest)] = new;
4968 /* Otherwise, we can't do anything with this value. */
4969 else
4970 p->const_equiv[REGNO (dest)] = 0;
4973 /* Emit an insn to do the load shown in p->equiv_reg_src, if needed. */
4975 static void
4976 emit_equiv_load (struct epi_info *p)
4978 if (p->equiv_reg_src != 0)
4980 rtx dest = p->sp_equiv_reg;
4982 if (GET_MODE (p->equiv_reg_src) != GET_MODE (dest))
4983 dest = gen_rtx_REG (GET_MODE (p->equiv_reg_src),
4984 REGNO (p->sp_equiv_reg));
4986 emit_move_insn (dest, p->equiv_reg_src);
4987 p->equiv_reg_src = 0;
4990 #endif
4992 /* Generate the prologue and epilogue RTL if the machine supports it. Thread
4993 this into place with notes indicating where the prologue ends and where
4994 the epilogue begins. Update the basic block information when possible. */
/* F is not used here.  INSERTED records whether anything was queued
   with insert_insn_on_edge, so that commit_edge_insertions is only run
   when there is something to commit.  Every early exit from the
   epilogue logic goes through the epilogue_done label.  */
4996 void
4997 thread_prologue_and_epilogue_insns (rtx f ATTRIBUTE_UNUSED)
4999 int inserted = 0;
5000 edge e;
5001 #if defined (HAVE_sibcall_epilogue) || defined (HAVE_epilogue) || defined (HAVE_return) || defined (HAVE_prologue)
5002 rtx seq;
5003 #endif
5004 #ifdef HAVE_prologue
5005 rtx prologue_end = NULL_RTX;
5006 #endif
5007 #if defined (HAVE_epilogue) || defined(HAVE_return)
5008 rtx epilogue_end = NULL_RTX;
5009 #endif
5010 edge_iterator ei;
5012 #ifdef HAVE_prologue
5013 if (HAVE_prologue)
/* Build the prologue in its own sequence, terminated by a
   NOTE_INSN_PROLOGUE_END note, and queue it on the single edge leaving
   the entry block.  */
5015 start_sequence ();
5016 seq = gen_prologue ();
5017 emit_insn (seq);
5019 /* Retain a map of the prologue insns. */
5020 record_insns (seq, &prologue);
5021 prologue_end = emit_note (NOTE_INSN_PROLOGUE_END);
5023 seq = get_insns ();
5024 end_sequence ();
5025 set_insn_locators (seq, prologue_locator);
5027 /* Can't deal with multiple successors of the entry block
5028 at the moment. Function should always have at least one
5029 entry point. */
5030 gcc_assert (single_succ_p (ENTRY_BLOCK_PTR));
5032 insert_insn_on_edge (seq, single_succ_edge (ENTRY_BLOCK_PTR));
5033 inserted = 1;
5035 #endif
5037 /* If the exit block has no non-fake predecessors, we don't need
5038 an epilogue. */
5039 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
5040 if ((e->flags & EDGE_FAKE) == 0)
5041 break;
5042 if (e == NULL)
5043 goto epilogue_done;
5045 #ifdef HAVE_return
5046 if (optimize && HAVE_return)
5048 /* If we're allowed to generate a simple return instruction,
5049 then by definition we don't need a full epilogue. Examine
5050 the block that falls through to EXIT. If it does not
5051 contain any code, examine its predecessors and try to
5052 emit (conditional) return instructions. */
5054 basic_block last;
5055 rtx label;
5057 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
5058 if (e->flags & EDGE_FALLTHRU)
5059 break;
5060 if (e == NULL)
5061 goto epilogue_done;
5062 last = e->src;
5064 /* Verify that there are no active instructions in the last block. */
5065 label = BB_END (last);
5066 while (label && !LABEL_P (label))
5068 if (active_insn_p (label))
5069 break;
5070 label = PREV_INSN (label);
5073 if (BB_HEAD (last) == label && LABEL_P (label))
5075 edge_iterator ei2;
/* The iterator is advanced by hand: ei_next is called on every path
   that leaves E in place, but not after redirect_edge_succ (presumably
   because E has then left last->preds -- confirm).  */
5077 for (ei2 = ei_start (last->preds); (e = ei_safe_edge (ei2)); )
5079 basic_block bb = e->src;
5080 rtx jump;
5082 if (bb == ENTRY_BLOCK_PTR)
5084 ei_next (&ei2);
5085 continue;
5088 jump = BB_END (bb);
5089 if (!JUMP_P (jump) || JUMP_LABEL (jump) != label)
5091 ei_next (&ei2);
5092 continue;
5095 /* If we have an unconditional jump, we can replace that
5096 with a simple return instruction. */
5097 if (simplejump_p (jump))
5099 emit_return_into_block (bb);
5100 delete_insn (jump);
5103 /* If we have a conditional jump, we can try to replace
5104 that with a conditional return instruction. */
5105 else if (condjump_p (jump))
5107 if (! redirect_jump (jump, 0, 0))
5109 ei_next (&ei2);
5110 continue;
5113 /* If this block has only one successor, it both jumps
5114 and falls through to the fallthru block, so we can't
5115 delete the edge. */
5116 if (single_succ_p (bb))
5118 ei_next (&ei2);
5119 continue;
5122 else
5124 ei_next (&ei2);
5125 continue;
5128 /* Fix up the CFG for the successful change we just made. */
5129 redirect_edge_succ (e, EXIT_BLOCK_PTR);
5132 /* Emit a return insn for the exit fallthru block. Whether
5133 this is still reachable will be determined later. */
5135 emit_barrier_after (BB_END (last));
5136 emit_return_into_block (last);
5137 epilogue_end = BB_END (last);
5138 single_succ_edge (last)->flags &= ~EDGE_FALLTHRU;
5139 goto epilogue_done;
5142 #endif
5143 /* Find the edge that falls through to EXIT. Other edges may exist
5144 due to RETURN instructions, but those don't need epilogues.
5145 There really shouldn't be a mixture -- either all should have
5146 been converted or none, however... */
5148 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
5149 if (e->flags & EDGE_FALLTHRU)
5150 break;
5151 if (e == NULL)
5152 goto epilogue_done;
5154 #ifdef HAVE_epilogue
5155 if (HAVE_epilogue)
/* Build the epilogue in its own sequence, headed by a
   NOTE_INSN_EPILOGUE_BEG note, and queue it on the fallthru edge E
   found above.  */
5157 start_sequence ();
5158 epilogue_end = emit_note (NOTE_INSN_EPILOGUE_BEG);
5160 seq = gen_epilogue ();
5162 #ifdef INCOMING_RETURN_ADDR_RTX
5163 /* If this function returns with the stack depressed and we can support
5164 it, massage the epilogue to actually do that. */
5165 if (TREE_CODE (TREE_TYPE (current_function_decl)) == FUNCTION_TYPE
5166 && TYPE_RETURNS_STACK_DEPRESSED (TREE_TYPE (current_function_decl)))
5167 seq = keep_stack_depressed (seq);
5168 #endif
5170 emit_jump_insn (seq);
5172 /* Retain a map of the epilogue insns. */
5173 record_insns (seq, &epilogue);
5174 set_insn_locators (seq, epilogue_locator);
5176 seq = get_insns ();
5177 end_sequence ();
5179 insert_insn_on_edge (seq, e);
5180 inserted = 1;
5182 else
5183 #endif
5185 basic_block cur_bb;
5187 if (! next_active_insn (BB_END (e->src)))
5188 goto epilogue_done;
5189 /* We have a fall-through edge to the exit block, the source is not
5190 at the end of the function, and there will be an assembler epilogue
5191 at the end of the function.
5192 We can't use force_nonfallthru here, because that would try to
5193 use return. Inserting a jump 'by hand' is extremely messy, so
5194 we take advantage of cfg_layout_finalize using
5195 fixup_fallthru_exit_predecessor. */
5196 cfg_layout_initialize (0);
/* Chain each non-fixed block to its successor in the current order
   through the aux field before finalizing the layout.  */
5197 FOR_EACH_BB (cur_bb)
5198 if (cur_bb->index >= NUM_FIXED_BLOCKS
5199 && cur_bb->next_bb->index >= NUM_FIXED_BLOCKS)
5200 cur_bb->aux = cur_bb->next_bb;
5201 cfg_layout_finalize ();
5203 epilogue_done:
5205 if (inserted)
5206 commit_edge_insertions ();
5208 #ifdef HAVE_sibcall_epilogue
5209 /* Emit sibling epilogues before any sibling call sites. */
5210 for (ei = ei_start (EXIT_BLOCK_PTR->preds); (e = ei_safe_edge (ei)); )
5212 basic_block bb = e->src;
5213 rtx insn = BB_END (bb);
/* Only exit predecessors whose last insn is a sibling call get a
   sibcall epilogue.  */
5215 if (!CALL_P (insn)
5216 || ! SIBLING_CALL_P (insn))
5218 ei_next (&ei);
5219 continue;
5222 start_sequence ();
5223 emit_insn (gen_sibcall_epilogue ());
5224 seq = get_insns ();
5225 end_sequence ();
5227 /* Retain a map of the epilogue insns. Used in life analysis to
5228 avoid getting rid of sibcall epilogue insns. Do this before we
5229 actually emit the sequence. */
5230 record_insns (seq, &sibcall_epilogue);
5231 set_insn_locators (seq, epilogue_locator);
5233 emit_insn_before (seq, insn);
5234 ei_next (&ei);
5236 #endif
5238 #ifdef HAVE_epilogue
5239 if (epilogue_end)
5241 rtx insn, next;
5243 /* Similarly, move any line notes that appear after the epilogue.
5244 There is no need, however, to be quite so anal about the existence
5245 of such a note. Also possibly move
5246 NOTE_INSN_FUNCTION_BEG notes, as those can be relevant for debug
5247 info generation. */
/* NEXT is fetched before the possible reorder_insns call, which moves
   INSN in front of epilogue_end.  */
5248 for (insn = epilogue_end; insn; insn = next)
5250 next = NEXT_INSN (insn);
5251 if (NOTE_P (insn)
5252 && (NOTE_LINE_NUMBER (insn) == NOTE_INSN_FUNCTION_BEG))
5253 reorder_insns (insn, insn, PREV_INSN (epilogue_end));
5256 #endif
5259 /* Reposition the prologue-end and epilogue-begin notes after instruction
5260 scheduling and delayed branch scheduling. */
5262 void
5263 reposition_prologue_and_epilogue_notes (rtx f ATTRIBUTE_UNUSED)
5265 #if defined (HAVE_prologue) || defined (HAVE_epilogue)
5266 rtx insn, last, note;
5267 int len;
5269 if ((len = VEC_length (int, prologue)) > 0)
5271 last = 0, note = 0;
5273 /* Scan from the beginning until we reach the last prologue insn.
5274 We apparently can't depend on basic_block_{head,end} after
5275 reorg has run. */
5276 for (insn = f; insn; insn = NEXT_INSN (insn))
5278 if (NOTE_P (insn))
5280 if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_PROLOGUE_END)
5281 note = insn;
5283 else if (contains (insn, &prologue))
5285 last = insn;
5286 if (--len == 0)
5287 break;
5291 if (last)
5293 /* Find the prologue-end note if we haven't already, and
5294 move it to just after the last prologue insn. */
5295 if (note == 0)
5297 for (note = last; (note = NEXT_INSN (note));)
5298 if (NOTE_P (note)
5299 && NOTE_LINE_NUMBER (note) == NOTE_INSN_PROLOGUE_END)
5300 break;
5303 /* Avoid placing note between CODE_LABEL and BASIC_BLOCK note. */
5304 if (LABEL_P (last))
5305 last = NEXT_INSN (last);
5306 reorder_insns (note, note, last);
5310 if ((len = VEC_length (int, epilogue)) > 0)
5312 last = 0, note = 0;
5314 /* Scan from the end until we reach the first epilogue insn.
5315 We apparently can't depend on basic_block_{head,end} after
5316 reorg has run. */
5317 for (insn = get_last_insn (); insn; insn = PREV_INSN (insn))
5319 if (NOTE_P (insn))
5321 if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_EPILOGUE_BEG)
5322 note = insn;
5324 else if (contains (insn, &epilogue))
5326 last = insn;
5327 if (--len == 0)
5328 break;
5332 if (last)
5334 /* Find the epilogue-begin note if we haven't already, and
5335 move it to just before the first epilogue insn. */
5336 if (note == 0)
5338 for (note = insn; (note = PREV_INSN (note));)
5339 if (NOTE_P (note)
5340 && NOTE_LINE_NUMBER (note) == NOTE_INSN_EPILOGUE_BEG)
5341 break;
5344 if (PREV_INSN (last) != note)
5345 reorder_insns (note, note, PREV_INSN (last));
5348 #endif /* HAVE_prologue or HAVE_epilogue */
5351 /* Resets insn_block_boundaries array. */
5353 void
5354 reset_block_changes (void)
5356 cfun->ib_boundaries_block = VEC_alloc (tree, gc, 100);
5357 VEC_quick_push (tree, cfun->ib_boundaries_block, NULL_TREE);
5360 /* Record the boundary for BLOCK. */
5361 void
5362 record_block_change (tree block)
5364 int i, n;
5365 tree last_block;
5367 if (!block)
5368 return;
5370 if(!cfun->ib_boundaries_block)
5371 return;
5373 last_block = VEC_pop (tree, cfun->ib_boundaries_block);
5374 n = get_max_uid ();
5375 for (i = VEC_length (tree, cfun->ib_boundaries_block); i < n; i++)
5376 VEC_safe_push (tree, gc, cfun->ib_boundaries_block, last_block);
5378 VEC_safe_push (tree, gc, cfun->ib_boundaries_block, block);
5381 /* Finishes record of boundaries. */
5382 void
5383 finalize_block_changes (void)
5385 record_block_change (DECL_INITIAL (current_function_decl));
5388 /* For INSN return the BLOCK it belongs to. */
5389 void
5390 check_block_change (rtx insn, tree *block)
5392 unsigned uid = INSN_UID (insn);
5394 if (uid >= VEC_length (tree, cfun->ib_boundaries_block))
5395 return;
5397 *block = VEC_index (tree, cfun->ib_boundaries_block, uid);
5400 /* Releases the ib_boundaries_block records. */
5401 void
5402 free_block_changes (void)
5404 VEC_free (tree, gc, cfun->ib_boundaries_block);
5407 /* Returns the name of the current function. */
5408 const char *
5409 current_function_name (void)
5411 return lang_hooks.decl_printable_name (cfun->decl, 2);
/* Execute function of pass_leaf_regs.

   When the target defines LEAF_REGISTERS, set
   current_function_uses_only_leaf_regs to whether we are optimizing,
   only_leaf_regs_used () holds and leaf_function_p () holds.  Without
   LEAF_REGISTERS this does nothing.  Always returns 0.  */

static unsigned int
rest_of_handle_check_leaf_regs (void)
{
#ifdef LEAF_REGISTERS
  current_function_uses_only_leaf_regs
    = optimize > 0 && only_leaf_regs_used () && leaf_function_p ();
#endif
  return 0;
}
5425 /* Insert a TYPE into the used types hash table of CFUN. */
5426 static void
5427 used_types_insert_helper (tree type, struct function *func)
5429 if (type != NULL && func != NULL)
5431 void **slot;
5433 if (func->used_types_hash == NULL)
5434 func->used_types_hash = htab_create_ggc (37, htab_hash_pointer,
5435 htab_eq_pointer, NULL);
5436 slot = htab_find_slot (func->used_types_hash, type, INSERT);
5437 if (*slot == NULL)
5438 *slot = type;
5442 /* Given a type, insert it into the used hash table in cfun. */
5443 void
5444 used_types_insert (tree t)
5446 while (POINTER_TYPE_P (t) || TREE_CODE (t) == ARRAY_TYPE)
5447 t = TREE_TYPE (t);
5448 t = TYPE_MAIN_VARIANT (t);
5449 if (debug_info_level > DINFO_LEVEL_NONE)
5450 used_types_insert_helper (t, cfun);
5453 struct tree_opt_pass pass_leaf_regs =
5455 NULL, /* name */
5456 NULL, /* gate */
5457 rest_of_handle_check_leaf_regs, /* execute */
5458 NULL, /* sub */
5459 NULL, /* next */
5460 0, /* static_pass_number */
5461 0, /* tv_id */
5462 0, /* properties_required */
5463 0, /* properties_provided */
5464 0, /* properties_destroyed */
5465 0, /* todo_flags_start */
5466 0, /* todo_flags_finish */
5467 0 /* letter */
5471 #include "gt-function.h"