/* Convert function calls to rtl insns, for GNU C compiler.
   Copyright (C) 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998,
   1999, 2000, 2001, 2002, 2003, 2004 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 2, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING.  If not, write to the Free
Software Foundation, 59 Temple Place - Suite 330, Boston, MA
02111-1307, USA.  */
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "tm.h"
#include "rtl.h"
#include "tree.h"
#include "flags.h"
#include "expr.h"
#include "optabs.h"
#include "libfuncs.h"
#include "function.h"
#include "regs.h"
#include "toplev.h"
#include "output.h"
#include "tm_p.h"
#include "timevar.h"
#include "sbitmap.h"
#include "langhooks.h"
#include "target.h"
#include "cgraph.h"
#include "except.h"

/* Like PREFERRED_STACK_BOUNDARY but in units of bytes, not bits.  */
#define STACK_BYTES (PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT)
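
/* As a quick illustration (figures are target-dependent and chosen for
   the example only): with PREFERRED_STACK_BOUNDARY == 128 and
   BITS_PER_UNIT == 8, STACK_BYTES is 16, i.e. argument blocks are
   rounded to 16-byte multiples.  */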

/* Data structure and subroutines used within expand_call.  */

struct arg_data
{
  /* Tree node for this argument.  */
  tree tree_value;
  /* Mode for value; TYPE_MODE unless promoted.  */
  enum machine_mode mode;
  /* Current RTL value for argument, or 0 if it isn't precomputed.  */
  rtx value;
  /* Initially-computed RTL value for argument; only for const functions.  */
  rtx initial_value;
  /* Register to pass this argument in, 0 if passed on stack, or a
     PARALLEL if the arg is to be copied into multiple non-contiguous
     registers.  */
  rtx reg;
  /* Register to pass this argument in when generating tail call sequence.
     This is not the same register as for normal calls on machines with
     register windows.  */
  rtx tail_call_reg;
  /* If REG was promoted from the actual mode of the argument expression,
     indicates whether the promotion is sign- or zero-extended.  */
  int unsignedp;
  /* Number of registers to use.  0 means put the whole arg in registers.
     Also 0 if not passed in registers.  */
  int partial;
  /* Nonzero if argument must be passed on stack.
     Note that some arguments may be passed on the stack
     even though pass_on_stack is zero, just because FUNCTION_ARG says so.
     pass_on_stack identifies arguments that *cannot* go in registers.  */
  int pass_on_stack;
  /* Some fields packaged up for locate_and_pad_parm.  */
  struct locate_and_pad_arg_data locate;
  /* Location on the stack at which parameter should be stored.  The store
     has already been done if STACK == VALUE.  */
  rtx stack;
  /* Location on the stack of the start of this argument slot.  This can
     differ from STACK if this arg pads downward.  This location is known
     to be aligned to FUNCTION_ARG_BOUNDARY.  */
  rtx stack_slot;
  /* Place that this stack area has been saved, if needed.  */
  rtx save_area;
  /* If an argument's alignment does not permit direct copying into registers,
     copy in smaller-sized pieces into pseudos.  These are stored in a
     block pointed to by this field.  The next field says how many
     word-sized pseudos we made.  */
  rtx *aligned_regs;
  int n_aligned_regs;
};

/* A vector of one char per byte of stack space.  A byte is nonzero if
   the corresponding stack location has been used.
   This vector is used to prevent a function call within an argument from
   clobbering any stack already set up.  */
static char *stack_usage_map;

/* Size of STACK_USAGE_MAP.  */
static int highest_outgoing_arg_in_use;
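
/* For example (hypothetical state): if earlier arguments already occupy
   bytes 0..15 of the outgoing argument area, highest_outgoing_arg_in_use
   is 16 and stack_usage_map[0] through stack_usage_map[15] are nonzero,
   so a call expanded while computing a later argument knows that region
   must not be clobbered (see save_fixed_argument_area below).  */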

/* A bitmap of virtual-incoming stack space.  A bit is set if the
   corresponding stack location's tail call argument has already been
   stored into the stack.  This bitmap is used to prevent sibling call
   optimization if the function tries to use the parent's incoming
   argument slots when they have already been overwritten with tail call
   arguments.  */
static sbitmap stored_args_map;

/* stack_arg_under_construction is nonzero when an argument may be
   initialized with a constructor call (including a C function that
   returns a BLKmode struct) and expand_call must take special action
   to make sure the object being constructed does not overlap the
   argument list for the constructor call.  */
int stack_arg_under_construction;

static void emit_call_1 (rtx, tree, tree, tree, HOST_WIDE_INT, HOST_WIDE_INT,
			 HOST_WIDE_INT, rtx, rtx, int, rtx, int,
			 CUMULATIVE_ARGS *);
static void precompute_register_parameters (int, struct arg_data *, int *);
static int store_one_arg (struct arg_data *, rtx, int, int, int);
static void store_unaligned_arguments_into_pseudos (struct arg_data *, int);
static int finalize_must_preallocate (int, int, struct arg_data *,
				      struct args_size *);
static void precompute_arguments (int, int, struct arg_data *);
static int compute_argument_block_size (int, struct args_size *, int);
static void initialize_argument_information (int, struct arg_data *,
					     struct args_size *, int, tree,
					     tree, CUMULATIVE_ARGS *, int,
					     rtx *, int *, int *, int *,
					     bool *, bool);
static void compute_argument_addresses (struct arg_data *, rtx, int);
static rtx rtx_for_function_call (tree, tree);
static void load_register_parameters (struct arg_data *, int, rtx *, int,
				      int, int *);
static rtx emit_library_call_value_1 (int, rtx, rtx, enum libcall_type,
				      enum machine_mode, int, va_list);
static int special_function_p (tree, int);
static int check_sibcall_argument_overlap_1 (rtx);
static int check_sibcall_argument_overlap (rtx, struct arg_data *, int);

static int combine_pending_stack_adjustment_and_call (int, struct args_size *,
						      unsigned int);
static bool shift_returned_value (tree, rtx *);
static tree split_complex_values (tree);
static tree split_complex_types (tree);

#ifdef REG_PARM_STACK_SPACE
static rtx save_fixed_argument_area (int, rtx, int *, int *);
static void restore_fixed_argument_area (rtx, rtx, int, int);
#endif

/* Force FUNEXP into a form suitable for the address of a CALL,
   and return that as an rtx.  Also load the static chain register
   if FNDECL is a nested function.

   CALL_FUSAGE points to a variable holding the prospective
   CALL_INSN_FUNCTION_USAGE information.  */

rtx
prepare_call_address (rtx funexp, rtx static_chain_value,
		      rtx *call_fusage, int reg_parm_seen, int sibcallp)
{
  /* Make a valid memory address and copy constants through pseudo-regs,
     but not for a constant address if -fno-function-cse.  */
  if (GET_CODE (funexp) != SYMBOL_REF)
    /* If we are using registers for parameters, force the
       function address into a register now.  */
    funexp = ((SMALL_REGISTER_CLASSES && reg_parm_seen)
	      ? force_not_mem (memory_address (FUNCTION_MODE, funexp))
	      : memory_address (FUNCTION_MODE, funexp));
  else if (! sibcallp)
    {
#ifndef NO_FUNCTION_CSE
      if (optimize && ! flag_no_function_cse)
	funexp = force_reg (Pmode, funexp);
#endif
    }

  if (static_chain_value != 0)
    {
      static_chain_value = convert_memory_address (Pmode, static_chain_value);
      emit_move_insn (static_chain_rtx, static_chain_value);

      if (REG_P (static_chain_rtx))
	use_reg (call_fusage, static_chain_rtx);
    }

  return funexp;
}

/* Generate instructions to call function FUNEXP,
   and optionally pop the results.
   The CALL_INSN is the first insn generated.

   FNDECL is the declaration node of the function.  This is given to the
   macro RETURN_POPS_ARGS to determine whether this function pops its own args.

   FUNTYPE is the data type of the function.  This is given to the macro
   RETURN_POPS_ARGS to determine whether this function pops its own args.
   We used to allow an identifier for library functions, but that doesn't
   work when the return type is an aggregate type and the calling convention
   says that the pointer to this aggregate is to be popped by the callee.

   STACK_SIZE is the number of bytes of arguments on the stack,
   ROUNDED_STACK_SIZE is that number rounded up to
   PREFERRED_STACK_BOUNDARY; zero if the size is variable.  This is
   both to put into the call insn and to generate explicit popping
   code if necessary.

   STRUCT_VALUE_SIZE is the number of bytes wanted in a structure value.
   It is zero if this call doesn't want a structure value.

   NEXT_ARG_REG is the rtx that results from executing
     FUNCTION_ARG (args_so_far, VOIDmode, void_type_node, 1)
   just after all the args have had their registers assigned.
   This could be whatever you like, but normally it is the first
   arg-register beyond those used for args in this call,
   or 0 if all the arg-registers are used in this call.
   It is passed on to `gen_call' so you can put this info in the call insn.

   VALREG is a hard register in which a value is returned,
   or 0 if the call does not return a value.

   OLD_INHIBIT_DEFER_POP is the value that `inhibit_defer_pop' had before
   the args to this call were processed.
   We restore `inhibit_defer_pop' to that value.

   CALL_FUSAGE is either empty or an EXPR_LIST of USE expressions that
   denote registers used by the called function.  */

static void
emit_call_1 (rtx funexp, tree fntree, tree fndecl ATTRIBUTE_UNUSED,
	     tree funtype ATTRIBUTE_UNUSED,
	     HOST_WIDE_INT stack_size ATTRIBUTE_UNUSED,
	     HOST_WIDE_INT rounded_stack_size,
	     HOST_WIDE_INT struct_value_size ATTRIBUTE_UNUSED,
	     rtx next_arg_reg ATTRIBUTE_UNUSED, rtx valreg,
	     int old_inhibit_defer_pop, rtx call_fusage, int ecf_flags,
	     CUMULATIVE_ARGS *args_so_far ATTRIBUTE_UNUSED)
{
  rtx rounded_stack_size_rtx = GEN_INT (rounded_stack_size);
  rtx call_insn;
  int already_popped = 0;
  HOST_WIDE_INT n_popped = RETURN_POPS_ARGS (fndecl, funtype, stack_size);
#if defined (HAVE_call) && defined (HAVE_call_value)
  rtx struct_value_size_rtx;
  struct_value_size_rtx = GEN_INT (struct_value_size);
#endif

#ifdef CALL_POPS_ARGS
  n_popped += CALL_POPS_ARGS (* args_so_far);
#endif

  /* Ensure address is valid.  SYMBOL_REF is already valid, so no need,
     and we don't want to load it into a register as an optimization,
     because prepare_call_address already did it if it should be done.  */
  if (GET_CODE (funexp) != SYMBOL_REF)
    funexp = memory_address (FUNCTION_MODE, funexp);

#if defined (HAVE_sibcall_pop) && defined (HAVE_sibcall_value_pop)
  if ((ecf_flags & ECF_SIBCALL)
      && HAVE_sibcall_pop && HAVE_sibcall_value_pop
      && (n_popped > 0 || stack_size == 0))
    {
      rtx n_pop = GEN_INT (n_popped);
      rtx pat;

      /* If this subroutine pops its own args, record that in the call insn
	 if possible, for the sake of frame pointer elimination.  */

      if (valreg)
	pat = GEN_SIBCALL_VALUE_POP (valreg,
				     gen_rtx_MEM (FUNCTION_MODE, funexp),
				     rounded_stack_size_rtx, next_arg_reg,
				     n_pop);
      else
	pat = GEN_SIBCALL_POP (gen_rtx_MEM (FUNCTION_MODE, funexp),
			       rounded_stack_size_rtx, next_arg_reg, n_pop);

      emit_call_insn (pat);
      already_popped = 1;
    }
  else
#endif

#if defined (HAVE_call_pop) && defined (HAVE_call_value_pop)
  /* If the target has "call" or "call_value" insns, then prefer them
     if no arguments are actually popped.  If the target does not have
     "call" or "call_value" insns, then we must use the popping versions
     even if the call has no arguments to pop.  */
#if defined (HAVE_call) && defined (HAVE_call_value)
  if (HAVE_call && HAVE_call_value && HAVE_call_pop && HAVE_call_value_pop
      && n_popped > 0 && ! (ecf_flags & ECF_SP_DEPRESSED))
#else
  if (HAVE_call_pop && HAVE_call_value_pop)
#endif
    {
      rtx n_pop = GEN_INT (n_popped);
      rtx pat;

      /* If this subroutine pops its own args, record that in the call insn
	 if possible, for the sake of frame pointer elimination.  */

      if (valreg)
	pat = GEN_CALL_VALUE_POP (valreg,
				  gen_rtx_MEM (FUNCTION_MODE, funexp),
				  rounded_stack_size_rtx, next_arg_reg, n_pop);
      else
	pat = GEN_CALL_POP (gen_rtx_MEM (FUNCTION_MODE, funexp),
			    rounded_stack_size_rtx, next_arg_reg, n_pop);

      emit_call_insn (pat);
      already_popped = 1;
    }
  else
#endif

#if defined (HAVE_sibcall) && defined (HAVE_sibcall_value)
  if ((ecf_flags & ECF_SIBCALL)
      && HAVE_sibcall && HAVE_sibcall_value)
    {
      if (valreg)
	emit_call_insn (GEN_SIBCALL_VALUE (valreg,
					   gen_rtx_MEM (FUNCTION_MODE, funexp),
					   rounded_stack_size_rtx,
					   next_arg_reg, NULL_RTX));
      else
	emit_call_insn (GEN_SIBCALL (gen_rtx_MEM (FUNCTION_MODE, funexp),
				     rounded_stack_size_rtx, next_arg_reg,
				     struct_value_size_rtx));
    }
  else
#endif

#if defined (HAVE_call) && defined (HAVE_call_value)
  if (HAVE_call && HAVE_call_value)
    {
      if (valreg)
	emit_call_insn (GEN_CALL_VALUE (valreg,
					gen_rtx_MEM (FUNCTION_MODE, funexp),
					rounded_stack_size_rtx, next_arg_reg,
					NULL_RTX));
      else
	emit_call_insn (GEN_CALL (gen_rtx_MEM (FUNCTION_MODE, funexp),
				  rounded_stack_size_rtx, next_arg_reg,
				  struct_value_size_rtx));
    }
  else
#endif
    gcc_unreachable ();

  /* Find the call we just emitted.  */
  call_insn = last_call_insn ();

  /* Mark memory as used for "pure" function call.  */
  if (ecf_flags & ECF_PURE)
    call_fusage
      = gen_rtx_EXPR_LIST
	(VOIDmode,
	 gen_rtx_USE (VOIDmode,
		      gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode))),
	 call_fusage);

  /* Put the register usage information there.  */
  add_function_usage_to (call_insn, call_fusage);

  /* If this is a const call, then set the insn's unchanging bit.  */
  if (ecf_flags & (ECF_CONST | ECF_PURE))
    CONST_OR_PURE_CALL_P (call_insn) = 1;

  /* If this call can't throw, attach a REG_EH_REGION reg note to that
     effect.  */
  if (ecf_flags & ECF_NOTHROW)
    REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_EH_REGION, const0_rtx,
					       REG_NOTES (call_insn));
  else
    {
      int rn = lookup_stmt_eh_region (fntree);

      /* If rn < 0, then either (1) tree-ssa not used or (2) doesn't
	 throw, which we already took care of.  */
      if (rn > 0)
	REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_EH_REGION, GEN_INT (rn),
						   REG_NOTES (call_insn));
      note_current_region_may_contain_throw ();
    }

  if (ecf_flags & ECF_NORETURN)
    REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_NORETURN, const0_rtx,
					       REG_NOTES (call_insn));
  if (ecf_flags & ECF_ALWAYS_RETURN)
    REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_ALWAYS_RETURN, const0_rtx,
					       REG_NOTES (call_insn));

  if (ecf_flags & ECF_RETURNS_TWICE)
    {
      REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_SETJMP, const0_rtx,
						 REG_NOTES (call_insn));
      current_function_calls_setjmp = 1;
    }

  SIBLING_CALL_P (call_insn) = ((ecf_flags & ECF_SIBCALL) != 0);

  /* Restore this now, so that we do defer pops for this call's args
     if the context of the call as a whole permits.  */
  inhibit_defer_pop = old_inhibit_defer_pop;

  if (n_popped > 0)
    {
      if (!already_popped)
	CALL_INSN_FUNCTION_USAGE (call_insn)
	  = gen_rtx_EXPR_LIST (VOIDmode,
			       gen_rtx_CLOBBER (VOIDmode, stack_pointer_rtx),
			       CALL_INSN_FUNCTION_USAGE (call_insn));
      rounded_stack_size -= n_popped;
      rounded_stack_size_rtx = GEN_INT (rounded_stack_size);
      stack_pointer_delta -= n_popped;
    }

  if (!ACCUMULATE_OUTGOING_ARGS)
    {
      /* If returning from the subroutine does not automatically pop the args,
	 we need an instruction to pop them sooner or later.
	 Perhaps do it now; perhaps just record how much space to pop later.

	 If returning from the subroutine does pop the args, indicate that the
	 stack pointer will be changed.  */

      if (rounded_stack_size != 0)
	{
	  if (ecf_flags & (ECF_SP_DEPRESSED | ECF_NORETURN | ECF_LONGJMP))
	    /* Just pretend we did the pop.  */
	    stack_pointer_delta -= rounded_stack_size;
	  else if (flag_defer_pop && inhibit_defer_pop == 0
		   && ! (ecf_flags & (ECF_CONST | ECF_PURE)))
	    pending_stack_adjust += rounded_stack_size;
	  else
	    adjust_stack (rounded_stack_size_rtx);
	}
    }
  /* When we accumulate outgoing args, we must avoid any stack manipulations.
     Restore the stack pointer to its original value now.  Usually
     ACCUMULATE_OUTGOING_ARGS targets don't get here, but there are exceptions.
     On i386 ACCUMULATE_OUTGOING_ARGS can be enabled on demand, and
     popping variants of functions exist as well.

     ??? We may optimize similar to defer_pop above, but it is
     probably not worthwhile.

     ??? It will be worthwhile to enable combine_stack_adjustments even for
     such machines.  */
  else if (n_popped)
    anti_adjust_stack (GEN_INT (n_popped));
}

/* Determine if the function identified by NAME and FNDECL is one with
   special properties we wish to know about.

   For example, if the function might return more than one time (setjmp), then
   set RETURNS_TWICE to a nonzero value.

   Similarly set LONGJMP if the function is in the longjmp family.

   Set MAY_BE_ALLOCA for any memory allocation function that might allocate
   space from the stack such as alloca.  */
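
/* A sketch of the matching done below, on hypothetical inputs: "alloca"
   and "__builtin_alloca" yield ECF_MAY_BE_ALLOCA; after the _/__/__x
   prefix is stripped, "setjmp", "_setjmp" and "__setjmp" all match, as
   do "sigsetjmp", "savectx", "qsetjmp" and "vfork" (ECF_RETURNS_TWICE),
   while "longjmp" and "siglongjmp" yield ECF_LONGJMP.  */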

static int
special_function_p (tree fndecl, int flags)
{
  if (fndecl && DECL_NAME (fndecl)
      && IDENTIFIER_LENGTH (DECL_NAME (fndecl)) <= 17
      /* Exclude functions not at the file scope, or not `extern',
	 since they are not the magic functions we would otherwise
	 think they are.
	 FIXME: this should be handled with attributes, not with this
	 hacky imitation of DECL_ASSEMBLER_NAME.  It's (also) wrong
	 because you can declare fork() inside a function if you
	 wish.  */
      && (DECL_CONTEXT (fndecl) == NULL_TREE
	  || TREE_CODE (DECL_CONTEXT (fndecl)) == TRANSLATION_UNIT_DECL)
      && TREE_PUBLIC (fndecl))
    {
      const char *name = IDENTIFIER_POINTER (DECL_NAME (fndecl));
      const char *tname = name;

      /* We assume that alloca will always be called by name.  It
	 makes no sense to pass it as a pointer-to-function to
	 anything that does not understand its behavior.  */
      if (((IDENTIFIER_LENGTH (DECL_NAME (fndecl)) == 6
	    && name[0] == 'a'
	    && ! strcmp (name, "alloca"))
	   || (IDENTIFIER_LENGTH (DECL_NAME (fndecl)) == 16
	       && name[0] == '_'
	       && ! strcmp (name, "__builtin_alloca"))))
	flags |= ECF_MAY_BE_ALLOCA;

      /* Disregard prefix _, __ or __x.  */
      if (name[0] == '_')
	{
	  if (name[1] == '_' && name[2] == 'x')
	    tname += 3;
	  else if (name[1] == '_')
	    tname += 2;
	  else
	    tname += 1;
	}

      if (tname[0] == 's')
	{
	  if ((tname[1] == 'e'
	       && (! strcmp (tname, "setjmp")
		   || ! strcmp (tname, "setjmp_syscall")))
	      || (tname[1] == 'i'
		  && ! strcmp (tname, "sigsetjmp"))
	      || (tname[1] == 'a'
		  && ! strcmp (tname, "savectx")))
	    flags |= ECF_RETURNS_TWICE;

	  if (tname[1] == 'i'
	      && ! strcmp (tname, "siglongjmp"))
	    flags |= ECF_LONGJMP;
	}
      else if ((tname[0] == 'q' && tname[1] == 's'
		&& ! strcmp (tname, "qsetjmp"))
	       || (tname[0] == 'v' && tname[1] == 'f'
		   && ! strcmp (tname, "vfork")))
	flags |= ECF_RETURNS_TWICE;

      else if (tname[0] == 'l' && tname[1] == 'o'
	       && ! strcmp (tname, "longjmp"))
	flags |= ECF_LONGJMP;
    }

  return flags;
}

/* Return nonzero when FNDECL represents a call to setjmp or another
   function that may return more than once.  */

int
setjmp_call_p (tree fndecl)
{
  return special_function_p (fndecl, 0) & ECF_RETURNS_TWICE;
}

/* Return true when EXP contains an alloca call.  */
bool
alloca_call_p (tree exp)
{
  if (TREE_CODE (exp) == CALL_EXPR
      && TREE_CODE (TREE_OPERAND (exp, 0)) == ADDR_EXPR
      && (TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
	  == FUNCTION_DECL)
      && (special_function_p (TREE_OPERAND (TREE_OPERAND (exp, 0), 0),
			      0) & ECF_MAY_BE_ALLOCA))
    return true;
  return false;
}

/* Detect flags (function attributes) from the function decl or type node.  */

int
flags_from_decl_or_type (tree exp)
{
  int flags = 0;
  tree type = exp;

  if (DECL_P (exp))
    {
      struct cgraph_rtl_info *i = cgraph_rtl_info (exp);
      type = TREE_TYPE (exp);

      if (i)
	{
	  if (i->pure_function)
	    flags |= ECF_PURE | ECF_LIBCALL_BLOCK;
	  if (i->const_function)
	    flags |= ECF_CONST | ECF_LIBCALL_BLOCK;
	}

      /* The function exp may have the `malloc' attribute.  */
      if (DECL_IS_MALLOC (exp))
	flags |= ECF_MALLOC;

      /* The function exp may have the `pure' attribute.  */
      if (DECL_IS_PURE (exp))
	flags |= ECF_PURE | ECF_LIBCALL_BLOCK;

      if (TREE_NOTHROW (exp))
	flags |= ECF_NOTHROW;

      if (TREE_READONLY (exp) && ! TREE_THIS_VOLATILE (exp))
	flags |= ECF_LIBCALL_BLOCK | ECF_CONST;

      flags = special_function_p (exp, flags);
    }
  else if (TYPE_P (exp) && TYPE_READONLY (exp) && ! TREE_THIS_VOLATILE (exp))
    flags |= ECF_CONST;

  if (TREE_THIS_VOLATILE (exp))
    flags |= ECF_NORETURN;

  /* Mark if the function returns with the stack pointer depressed.  We
     cannot consider it pure or constant in that case.  */
  if (TREE_CODE (type) == FUNCTION_TYPE && TYPE_RETURNS_STACK_DEPRESSED (type))
    {
      flags |= ECF_SP_DEPRESSED;
      flags &= ~(ECF_PURE | ECF_CONST | ECF_LIBCALL_BLOCK);
    }

  return flags;
}

/* Detect flags from a CALL_EXPR.  */

int
call_expr_flags (tree t)
{
  int flags;
  tree decl = get_callee_fndecl (t);

  if (decl)
    flags = flags_from_decl_or_type (decl);
  else
    {
      t = TREE_TYPE (TREE_OPERAND (t, 0));
      if (t && TREE_CODE (t) == POINTER_TYPE)
	flags = flags_from_decl_or_type (TREE_TYPE (t));
      else
	flags = 0;
    }

  return flags;
}

/* Precompute all register parameters as described by ARGS, storing values
   into fields within the ARGS array.

   NUM_ACTUALS indicates the total number of elements in the ARGS array.

   Set REG_PARM_SEEN if we encounter a register parameter.  */

static void
precompute_register_parameters (int num_actuals, struct arg_data *args,
				int *reg_parm_seen)
{
  int i;

  *reg_parm_seen = 0;

  for (i = 0; i < num_actuals; i++)
    if (args[i].reg != 0 && ! args[i].pass_on_stack)
      {
	*reg_parm_seen = 1;

	if (args[i].value == 0)
	  {
	    push_temp_slots ();
	    args[i].value = expand_expr (args[i].tree_value, NULL_RTX,
					 VOIDmode, 0);
	    preserve_temp_slots (args[i].value);
	    pop_temp_slots ();
	  }

	/* If the value is a non-legitimate constant, force it into a
	   pseudo now.  TLS symbols sometimes need a call to resolve.  */
	if (CONSTANT_P (args[i].value)
	    && !LEGITIMATE_CONSTANT_P (args[i].value))
	  args[i].value = force_reg (args[i].mode, args[i].value);

	/* If we are to promote the function arg to a wider mode,
	   do it now.  */

	if (args[i].mode != TYPE_MODE (TREE_TYPE (args[i].tree_value)))
	  args[i].value
	    = convert_modes (args[i].mode,
			     TYPE_MODE (TREE_TYPE (args[i].tree_value)),
			     args[i].value, args[i].unsignedp);

	/* If the value is expensive, and we are inside an appropriately
	   short loop, put the value into a pseudo and then put the pseudo
	   into the hard reg.

	   For small register classes, also do this if this call uses
	   register parameters.  This is to avoid reload conflicts while
	   loading the parameters registers.  */

	if ((! (REG_P (args[i].value)
		|| (GET_CODE (args[i].value) == SUBREG
		    && REG_P (SUBREG_REG (args[i].value)))))
	    && args[i].mode != BLKmode
	    && rtx_cost (args[i].value, SET) > COSTS_N_INSNS (1)
	    && ((SMALL_REGISTER_CLASSES && *reg_parm_seen)
		|| optimize))
	  args[i].value = copy_to_mode_reg (args[i].mode, args[i].value);
      }
}

#ifdef REG_PARM_STACK_SPACE

/* The argument list is the property of the called routine and it
   may clobber it.  If the fixed area has been used for previous
   parameters, we must save and restore it.  */

static rtx
save_fixed_argument_area (int reg_parm_stack_space, rtx argblock,
			  int *low_to_save, int *high_to_save)
{
  int low;
  int high;

  /* Compute the boundary of the area that needs to be saved, if any.  */
  high = reg_parm_stack_space;
#ifdef ARGS_GROW_DOWNWARD
  high += 1;
#endif
  if (high > highest_outgoing_arg_in_use)
    high = highest_outgoing_arg_in_use;

  for (low = 0; low < high; low++)
    if (stack_usage_map[low] != 0)
      {
	int num_to_save;
	enum machine_mode save_mode;
	int delta;
	rtx stack_area;
	rtx save_area;

	while (stack_usage_map[--high] == 0)
	  ;

	*low_to_save = low;
	*high_to_save = high;

	num_to_save = high - low + 1;
	save_mode = mode_for_size (num_to_save * BITS_PER_UNIT, MODE_INT, 1);

	/* If we don't have the required alignment, must do this
	   in BLKmode.  */
	if ((low & (MIN (GET_MODE_SIZE (save_mode),
			 BIGGEST_ALIGNMENT / UNITS_PER_WORD) - 1)))
	  save_mode = BLKmode;

#ifdef ARGS_GROW_DOWNWARD
	delta = -high;
#else
	delta = low;
#endif
	stack_area = gen_rtx_MEM (save_mode,
				  memory_address (save_mode,
						  plus_constant (argblock,
								 delta)));

	set_mem_align (stack_area, PARM_BOUNDARY);
	if (save_mode == BLKmode)
	  {
	    save_area = assign_stack_temp (BLKmode, num_to_save, 0);
	    emit_block_move (validize_mem (save_area), stack_area,
			     GEN_INT (num_to_save), BLOCK_OP_CALL_PARM);
	  }
	else
	  {
	    save_area = gen_reg_rtx (save_mode);
	    emit_move_insn (save_area, stack_area);
	  }

	return save_area;
      }

  return NULL_RTX;
}

static void
restore_fixed_argument_area (rtx save_area, rtx argblock, int high_to_save,
			     int low_to_save)
{
  enum machine_mode save_mode = GET_MODE (save_area);
  int delta;
  rtx stack_area;

#ifdef ARGS_GROW_DOWNWARD
  delta = -high_to_save;
#else
  delta = low_to_save;
#endif
  stack_area = gen_rtx_MEM (save_mode,
			    memory_address (save_mode,
					    plus_constant (argblock, delta)));
  set_mem_align (stack_area, PARM_BOUNDARY);

  if (save_mode != BLKmode)
    emit_move_insn (stack_area, save_area);
  else
    emit_block_move (stack_area, validize_mem (save_area),
		     GEN_INT (high_to_save - low_to_save + 1),
		     BLOCK_OP_CALL_PARM);
}
#endif /* REG_PARM_STACK_SPACE */

/* If any elements in ARGS refer to parameters that are to be passed in
   registers, but not in memory, and whose alignment does not permit a
   direct copy into registers, copy the values into a group of pseudos
   which we will later copy into the appropriate hard registers.

   Pseudos for each unaligned argument will be stored into the array
   args[argnum].aligned_regs.  The caller is responsible for deallocating
   the aligned_regs array if it is nonzero.  */
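
/* For instance (illustrative numbers): a 3-byte struct argument on a
   32-bit BYTES_BIG_ENDIAN target is loaded below with bitsize == 24 and
   endian_correction == 32 - 24 == 8, which skips the one empty
   high-order byte when the bit field is stored into the word-sized
   pseudo.  */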

static void
store_unaligned_arguments_into_pseudos (struct arg_data *args, int num_actuals)
{
  int i, j;

  for (i = 0; i < num_actuals; i++)
    if (args[i].reg != 0 && ! args[i].pass_on_stack
	&& args[i].mode == BLKmode
	&& (TYPE_ALIGN (TREE_TYPE (args[i].tree_value))
	    < (unsigned int) MIN (BIGGEST_ALIGNMENT, BITS_PER_WORD)))
      {
	int bytes = int_size_in_bytes (TREE_TYPE (args[i].tree_value));
	int nregs = (bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
	int endian_correction = 0;

	args[i].n_aligned_regs = args[i].partial ? args[i].partial : nregs;
	args[i].aligned_regs = xmalloc (sizeof (rtx) * args[i].n_aligned_regs);

	/* Structures smaller than a word are normally aligned to the
	   least significant byte.  On a BYTES_BIG_ENDIAN machine,
	   this means we must skip the empty high order bytes when
	   calculating the bit offset.  */
	if (bytes < UNITS_PER_WORD
#ifdef BLOCK_REG_PADDING
	    && (BLOCK_REG_PADDING (args[i].mode,
				   TREE_TYPE (args[i].tree_value), 1)
		== downward)
#else
	    && BYTES_BIG_ENDIAN
#endif
	    )
	  endian_correction = BITS_PER_WORD - bytes * BITS_PER_UNIT;

	for (j = 0; j < args[i].n_aligned_regs; j++)
	  {
	    rtx reg = gen_reg_rtx (word_mode);
	    rtx word = operand_subword_force (args[i].value, j, BLKmode);
	    int bitsize = MIN (bytes * BITS_PER_UNIT, BITS_PER_WORD);

	    args[i].aligned_regs[j] = reg;
	    word = extract_bit_field (word, bitsize, 0, 1, NULL_RTX,
				      word_mode, word_mode);

	    /* There is no need to restrict this code to loading items
	       in TYPE_ALIGN sized hunks.  The bitfield instructions can
	       load up entire word sized registers efficiently.

	       ??? This may not be needed anymore.
	       We used to emit a clobber here but that doesn't let later
	       passes optimize the instructions we emit.  By storing 0 into
	       the register later passes know the first AND to zero out the
	       bitfield being set in the register is unnecessary.  The store
	       of 0 will be deleted as will at least the first AND.  */

	    emit_move_insn (reg, const0_rtx);

	    bytes -= bitsize / BITS_PER_UNIT;
	    store_bit_field (reg, bitsize, endian_correction, word_mode,
			     word);
	  }
      }
}

/* Fill in ARGS_SIZE and ARGS array based on the parameters found in
   ACTPARMS.

   NUM_ACTUALS is the total number of parameters.

   N_NAMED_ARGS is the total number of named arguments.

   FNDECL is the tree code for the target of this call (if known).

   ARGS_SO_FAR holds state needed by the target to know where to place
   the next argument.

   REG_PARM_STACK_SPACE is the number of bytes of stack space reserved
   for arguments which are passed in registers.

   OLD_STACK_LEVEL is a pointer to an rtx which holds the old stack level
   and may be modified by this routine.

   OLD_PENDING_ADJ, MUST_PREALLOCATE and FLAGS are pointers to integer
   flags which may be modified by this routine.

   MAY_TAILCALL is cleared if we encounter an invisible pass-by-reference
   argument that requires allocation of stack space.

   CALL_FROM_THUNK_P is true if this call is the jump from a thunk to
   the thunked-to function.  */

static void
initialize_argument_information (int num_actuals ATTRIBUTE_UNUSED,
				 struct arg_data *args,
				 struct args_size *args_size,
				 int n_named_args ATTRIBUTE_UNUSED,
				 tree actparms, tree fndecl,
				 CUMULATIVE_ARGS *args_so_far,
				 int reg_parm_stack_space,
				 rtx *old_stack_level, int *old_pending_adj,
				 int *must_preallocate, int *ecf_flags,
				 bool *may_tailcall, bool call_from_thunk_p)
{
  /* 1 if scanning parms front to back, -1 if scanning back to front.  */
  int inc;

  /* Count arg position in order args appear.  */
  int argpos;

  int i;
  tree p;

  args_size->constant = 0;
  args_size->var = 0;

  /* In this loop, we consider args in the order they are written.
     We fill up ARGS from the front or from the back if necessary
     so that in any case the first arg to be pushed ends up at the front.  */

  if (PUSH_ARGS_REVERSED)
    {
      i = num_actuals - 1, inc = -1;

      /* In this case, must reverse order of args
	 so that we compute and push the last arg first.  */
    }
  else
    {
      i = 0, inc = 1;
    }

  /* I counts args in order (to be) pushed; ARGPOS counts in order written.  */
  for (p = actparms, argpos = 0; p; p = TREE_CHAIN (p), i += inc, argpos++)
    {
      tree type = TREE_TYPE (TREE_VALUE (p));
      int unsignedp;
      enum machine_mode mode;

      args[i].tree_value = TREE_VALUE (p);

      /* Replace erroneous argument with constant zero.  */
      if (type == error_mark_node || !COMPLETE_TYPE_P (type))
	args[i].tree_value = integer_zero_node, type = integer_type_node;

      /* If TYPE is a transparent union, pass things the way we would
	 pass the first field of the union.  We have already verified that
	 the modes are the same.  */
      if (TREE_CODE (type) == UNION_TYPE && TYPE_TRANSPARENT_UNION (type))
	type = TREE_TYPE (TYPE_FIELDS (type));

      /* Decide where to pass this arg.

	 args[i].reg is nonzero if all or part is passed in registers.

	 args[i].partial is nonzero if part but not all is passed in registers,
	 and the exact value says how many words are passed in registers.

	 args[i].pass_on_stack is nonzero if the argument must at least be
	 computed on the stack.  It may then be loaded back into registers
	 if args[i].reg is nonzero.

	 These decisions are driven by the FUNCTION_... macros and must agree
	 with those made by function.c.  */

      /* See if this argument should be passed by invisible reference.  */
      if (pass_by_reference (args_so_far, TYPE_MODE (type),
			     type, argpos < n_named_args))
	{
	  bool callee_copies;
	  tree base;

	  callee_copies
	    = reference_callee_copied (args_so_far, TYPE_MODE (type),
				       type, argpos < n_named_args);

	  /* If we're compiling a thunk, pass through invisible references
	     instead of making a copy.  */
	  if (call_from_thunk_p
	      || (callee_copies
		  && !TREE_ADDRESSABLE (type)
		  && (base = get_base_address (args[i].tree_value))
		  && (!DECL_P (base) || MEM_P (DECL_RTL (base)))))
	    {
	      /* We can't use sibcalls if a callee-copied argument is
		 stored in the current function's frame.  */
	      if (!call_from_thunk_p && DECL_P (base) && !TREE_STATIC (base))
		*may_tailcall = false;

	      args[i].tree_value = build_fold_addr_expr (args[i].tree_value);
	      type = TREE_TYPE (args[i].tree_value);

	      *ecf_flags &= ~(ECF_CONST | ECF_LIBCALL_BLOCK);
	    }
	  else
	    {
	      /* We make a copy of the object and pass the address to the
		 function being called.  */
	      rtx copy;

	      if (!COMPLETE_TYPE_P (type)
		  || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST
		  || (flag_stack_check && ! STACK_CHECK_BUILTIN
		      && (0 < compare_tree_int (TYPE_SIZE_UNIT (type),
						STACK_CHECK_MAX_VAR_SIZE))))
		{
		  /* This is a variable-sized object.  Make space on the stack
		     for it.  */
		  rtx size_rtx = expr_size (TREE_VALUE (p));

		  if (*old_stack_level == 0)
		    {
		      emit_stack_save (SAVE_BLOCK, old_stack_level, NULL_RTX);
		      *old_pending_adj = pending_stack_adjust;
		      pending_stack_adjust = 0;
		    }

		  copy = gen_rtx_MEM (BLKmode,
				      allocate_dynamic_stack_space
				      (size_rtx, NULL_RTX, TYPE_ALIGN (type)));
		  set_mem_attributes (copy, type, 1);
		}
	      else
		copy = assign_temp (type, 0, 1, 0);

	      store_expr (args[i].tree_value, copy, 0);

	      if (callee_copies)
		*ecf_flags &= ~(ECF_CONST | ECF_LIBCALL_BLOCK);
	      else
		*ecf_flags &= ~(ECF_CONST | ECF_PURE | ECF_LIBCALL_BLOCK);

	      args[i].tree_value
		= build_fold_addr_expr (make_tree (type, copy));
	      type = TREE_TYPE (args[i].tree_value);
	      *may_tailcall = false;
	    }
	}

      mode = TYPE_MODE (type);
      unsignedp = TYPE_UNSIGNED (type);

      if (targetm.calls.promote_function_args (fndecl ? TREE_TYPE (fndecl) : 0))
	mode = promote_mode (type, mode, &unsignedp, 1);

      args[i].unsignedp = unsignedp;
      args[i].mode = mode;

      args[i].reg = FUNCTION_ARG (*args_so_far, mode, type,
				  argpos < n_named_args);
#ifdef FUNCTION_INCOMING_ARG
      /* If this is a sibling call and the machine has register windows, the
	 register window has to be unwound before calling the routine, so
	 arguments have to go into the incoming registers.  */
      args[i].tail_call_reg = FUNCTION_INCOMING_ARG (*args_so_far, mode, type,
						     argpos < n_named_args);
#else
      args[i].tail_call_reg = args[i].reg;
#endif

      if (args[i].reg)
	args[i].partial
	  = FUNCTION_ARG_PARTIAL_NREGS (*args_so_far, mode, type,
					argpos < n_named_args);

      args[i].pass_on_stack = targetm.calls.must_pass_in_stack (mode, type);

      /* If FUNCTION_ARG returned a (parallel [(expr_list (nil) ...) ...]),
	 it means that we are to pass this arg in the register(s) designated
	 by the PARALLEL, but also to pass it in the stack.  */
      if (args[i].reg && GET_CODE (args[i].reg) == PARALLEL
	  && XEXP (XVECEXP (args[i].reg, 0, 0), 0) == 0)
	args[i].pass_on_stack = 1;

      /* If this is an addressable type, we must preallocate the stack
	 since we must evaluate the object into its final location.

	 If this is to be passed in both registers and the stack, it is simpler
	 to preallocate.  */
      if (TREE_ADDRESSABLE (type)
	  || (args[i].pass_on_stack && args[i].reg != 0))
	*must_preallocate = 1;

      /* If this is an addressable type, we cannot pre-evaluate it.  Thus,
	 we cannot consider this function call constant.  */
      if (TREE_ADDRESSABLE (type))
	*ecf_flags &= ~ECF_LIBCALL_BLOCK;

      /* Compute the stack-size of this argument.  */
      if (args[i].reg == 0 || args[i].partial != 0
	  || reg_parm_stack_space > 0
	  || args[i].pass_on_stack)
	locate_and_pad_parm (mode, type,
#ifdef STACK_PARMS_IN_REG_PARM_AREA
			     1,
#else
			     args[i].reg != 0,
#endif
			     args[i].pass_on_stack ? 0 : args[i].partial,
			     fndecl, args_size, &args[i].locate);
#ifdef BLOCK_REG_PADDING
      else
	/* The argument is passed entirely in registers.  See at which
	   end it should be padded.  */
	args[i].locate.where_pad =
	  BLOCK_REG_PADDING (mode, type,
			     int_size_in_bytes (type) <= UNITS_PER_WORD);
#endif

      /* Update ARGS_SIZE, the total stack space for args so far.  */

      args_size->constant += args[i].locate.size.constant;
      if (args[i].locate.size.var)
	ADD_PARM_SIZE (*args_size, args[i].locate.size.var);

      /* Increment ARGS_SO_FAR, which has info about which arg-registers
	 have been used, etc.  */

      FUNCTION_ARG_ADVANCE (*args_so_far, TYPE_MODE (type), type,
			    argpos < n_named_args);
    }
}

/* Update ARGS_SIZE to contain the total size for the argument block.
   Return the original constant component of the argument block's size.

   REG_PARM_STACK_SPACE holds the number of bytes of stack space reserved
   for arguments passed in registers.  */
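
/* A worked example of the rounding done below (numbers hypothetical):
   with a preferred boundary of 16 bytes, args_size->constant == 20 and
   stack_pointer_delta == 8, the constant case computes
   ((20 + 8 + 15) / 16) * 16 - 8 == 24, so pushing 24 more bytes makes
   the total outgoing adjustment (8 + 24 == 32) a multiple of 16.  */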

static int
compute_argument_block_size (int reg_parm_stack_space,
			     struct args_size *args_size,
			     int preferred_stack_boundary ATTRIBUTE_UNUSED)
{
  int unadjusted_args_size = args_size->constant;

  /* For accumulate outgoing args mode we don't need to align, since the frame
     will be already aligned.  Align to STACK_BOUNDARY in order to prevent
     backends from generating misaligned frame sizes.  */
  if (ACCUMULATE_OUTGOING_ARGS && preferred_stack_boundary > STACK_BOUNDARY)
    preferred_stack_boundary = STACK_BOUNDARY;

  /* Compute the actual size of the argument block required.  The variable
     and constant sizes must be combined, the size may have to be rounded,
     and there may be a minimum required size.  */

  if (args_size->var)
    {
      args_size->var = ARGS_SIZE_TREE (*args_size);
      args_size->constant = 0;

      preferred_stack_boundary /= BITS_PER_UNIT;
      if (preferred_stack_boundary > 1)
	{
	  /* We don't handle this case yet.  To handle it correctly we have
	     to add the delta, round and subtract the delta.
	     Currently no machine description requires this support.  */
	  gcc_assert (!(stack_pointer_delta & (preferred_stack_boundary - 1)));
	  args_size->var = round_up (args_size->var, preferred_stack_boundary);
	}

      if (reg_parm_stack_space > 0)
	{
	  args_size->var
	    = size_binop (MAX_EXPR, args_size->var,
			  ssize_int (reg_parm_stack_space));

#ifndef OUTGOING_REG_PARM_STACK_SPACE
	  /* The area corresponding to register parameters is not to count in
	     the size of the block we need.  So make the adjustment.  */
	  args_size->var
	    = size_binop (MINUS_EXPR, args_size->var,
			  ssize_int (reg_parm_stack_space));
#endif
	}
    }
  else
    {
      preferred_stack_boundary /= BITS_PER_UNIT;
      if (preferred_stack_boundary < 1)
	preferred_stack_boundary = 1;
      args_size->constant = (((args_size->constant
			       + stack_pointer_delta
			       + preferred_stack_boundary - 1)
			      / preferred_stack_boundary
			      * preferred_stack_boundary)
			     - stack_pointer_delta);

      args_size->constant = MAX (args_size->constant,
				 reg_parm_stack_space);

#ifndef OUTGOING_REG_PARM_STACK_SPACE
      args_size->constant -= reg_parm_stack_space;
#endif
    }
  return unadjusted_args_size;
}

/* Precompute parameters as needed for a function call.

   FLAGS is mask of ECF_* constants.

   NUM_ACTUALS is the number of arguments.

   ARGS is an array containing information for each argument; this
   routine fills in the INITIAL_VALUE and VALUE fields for each
   precomputed argument.  */

static void
precompute_arguments (int flags, int num_actuals, struct arg_data *args)
{
  int i;

  /* If this is a libcall, then precompute all arguments so that we do not
     get extraneous instructions emitted as part of the libcall sequence.  */
  if ((flags & ECF_LIBCALL_BLOCK) == 0)
    return;

  for (i = 0; i < num_actuals; i++)
    {
      enum machine_mode mode;

      /* If this is an addressable type, we cannot pre-evaluate it.  */
      gcc_assert (!TREE_ADDRESSABLE (TREE_TYPE (args[i].tree_value)));

      args[i].initial_value = args[i].value
	= expand_expr (args[i].tree_value, NULL_RTX, VOIDmode, 0);

      mode = TYPE_MODE (TREE_TYPE (args[i].tree_value));
      if (mode != args[i].mode)
	{
	  args[i].value
	    = convert_modes (args[i].mode, mode,
			     args[i].value, args[i].unsignedp);
#if defined(PROMOTE_FUNCTION_MODE) && !defined(PROMOTE_MODE)
	  /* CSE will replace this only if it contains args[i].value
	     pseudo, so convert it down to the declared mode using
	     a SUBREG.  */
	  if (REG_P (args[i].value)
	      && GET_MODE_CLASS (args[i].mode) == MODE_INT)
	    {
	      args[i].initial_value
		= gen_lowpart_SUBREG (mode, args[i].value);
	      SUBREG_PROMOTED_VAR_P (args[i].initial_value) = 1;
	      SUBREG_PROMOTED_UNSIGNED_SET (args[i].initial_value,
					    args[i].unsignedp);
	    }
#endif
	}
    }
}

/* Given the current state of MUST_PREALLOCATE and information about
   arguments to a function call in NUM_ACTUALS, ARGS and ARGS_SIZE,
   compute and return the final value for MUST_PREALLOCATE.  */

static int
finalize_must_preallocate (int must_preallocate, int num_actuals,
			   struct arg_data *args, struct args_size *args_size)
{
  /* See if we have or want to preallocate stack space.

     If we would have to push a partially-in-regs parm
     before other stack parms, preallocate stack space instead.

     If the size of some parm is not a multiple of the required stack
     alignment, we must preallocate.

     If the total size of arguments that would otherwise create a copy in
     a temporary (such as a CALL) is more than half the total argument list
     size, preallocation is faster.

     Another reason to preallocate is if we have a machine (like the m88k)
     where stack alignment is required to be maintained between every
     pair of insns, not just when the call is made.  However, we assume here
     that such machines either do not have push insns (and hence preallocation
     would occur anyway) or the problem is taken care of with
     PUSH_ROUNDING.  */

  if (! must_preallocate)
    {
      int partial_seen = 0;
      int copy_to_evaluate_size = 0;
      int i;

      for (i = 0; i < num_actuals && ! must_preallocate; i++)
	{
	  if (args[i].partial > 0 && ! args[i].pass_on_stack)
	    partial_seen = 1;
	  else if (partial_seen && args[i].reg == 0)
	    must_preallocate = 1;

	  if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode
	      && (TREE_CODE (args[i].tree_value) == CALL_EXPR
		  || TREE_CODE (args[i].tree_value) == TARGET_EXPR
		  || TREE_CODE (args[i].tree_value) == COND_EXPR
		  || TREE_ADDRESSABLE (TREE_TYPE (args[i].tree_value))))
	    copy_to_evaluate_size
	      += int_size_in_bytes (TREE_TYPE (args[i].tree_value));
	}

      if (copy_to_evaluate_size * 2 >= args_size->constant
	  && args_size->constant > 0)
	must_preallocate = 1;
    }
  return must_preallocate;
}

/* If we preallocated stack space, compute the address of each argument
   and store it into the ARGS array.

   We need not ensure it is a valid memory address here; it will be
   validized when it is used.

   ARGBLOCK is an rtx for the address of the outgoing arguments.  */

static void
compute_argument_addresses (struct arg_data *args, rtx argblock,
			    int num_actuals)
{
  if (argblock)
    {
      rtx arg_reg = argblock;
      int i, arg_offset = 0;

      if (GET_CODE (argblock) == PLUS)
	arg_reg = XEXP (argblock, 0), arg_offset = INTVAL (XEXP (argblock, 1));

      for (i = 0; i < num_actuals; i++)
	{
	  rtx offset = ARGS_SIZE_RTX (args[i].locate.offset);
	  rtx slot_offset = ARGS_SIZE_RTX (args[i].locate.slot_offset);
	  rtx addr;

	  /* Skip this parm if it will not be passed on the stack.  */
	  if (! args[i].pass_on_stack && args[i].reg != 0)
	    continue;

	  if (GET_CODE (offset) == CONST_INT)
	    addr = plus_constant (arg_reg, INTVAL (offset));
	  else
	    addr = gen_rtx_PLUS (Pmode, arg_reg, offset);

	  addr = plus_constant (addr, arg_offset);
	  args[i].stack = gen_rtx_MEM (args[i].mode, addr);
	  set_mem_align (args[i].stack, PARM_BOUNDARY);
	  set_mem_attributes (args[i].stack,
			      TREE_TYPE (args[i].tree_value), 1);

	  if (GET_CODE (slot_offset) == CONST_INT)
	    addr = plus_constant (arg_reg, INTVAL (slot_offset));
	  else
	    addr = gen_rtx_PLUS (Pmode, arg_reg, slot_offset);

	  addr = plus_constant (addr, arg_offset);
	  args[i].stack_slot = gen_rtx_MEM (args[i].mode, addr);
	  set_mem_align (args[i].stack_slot, PARM_BOUNDARY);
	  set_mem_attributes (args[i].stack_slot,
			      TREE_TYPE (args[i].tree_value), 1);

	  /* Function incoming arguments may overlap with sibling call
	     outgoing arguments and we cannot allow reordering of reads
	     from function arguments with stores to outgoing arguments
	     of sibling calls.  */
	  set_mem_alias_set (args[i].stack, 0);
	  set_mem_alias_set (args[i].stack_slot, 0);
	}
    }
}

/* Given a FNDECL and EXP, return an rtx suitable for use as a target address
   in a call instruction.

   FNDECL is the tree node for the target function.  For an indirect call
   FNDECL will be NULL_TREE.

   ADDR is the operand 0 of CALL_EXPR for this call.  */

static rtx
rtx_for_function_call (tree fndecl, tree addr)
{
  rtx funexp;

  /* Get the function to call, in the form of RTL.  */
  if (fndecl)
    {
      /* If this is the first use of the function, see if we need to
	 make an external definition for it.  */
      if (! TREE_USED (fndecl))
	{
	  assemble_external (fndecl);
	  TREE_USED (fndecl) = 1;
	}

      /* Get a SYMBOL_REF rtx for the function address.  */
      funexp = XEXP (DECL_RTL (fndecl), 0);
    }
  else
    /* Generate an rtx (probably a pseudo-register) for the address.  */
    {
      push_temp_slots ();
      funexp = expand_expr (addr, NULL_RTX, VOIDmode, 0);
      pop_temp_slots ();	/* FUNEXP can't be BLKmode.  */
    }
  return funexp;
}

/* Do the register loads required for any wholly-register parms or any
   parms which are passed both on the stack and in a register.  Their
   expressions were already evaluated.

   Mark all register-parms as living through the call, putting these USE
   insns in the CALL_INSN_FUNCTION_USAGE field.

   When IS_SIBCALL, perform the check_sibcall_argument_overlap
   checking, setting *SIBCALL_FAILURE if appropriate.  */

static void
load_register_parameters (struct arg_data *args, int num_actuals,
			  rtx *call_fusage, int flags, int is_sibcall,
			  int *sibcall_failure)
{
  int i, j;

  for (i = 0; i < num_actuals; i++)
    {
      rtx reg = ((flags & ECF_SIBCALL)
		 ? args[i].tail_call_reg : args[i].reg);
      if (reg)
	{
	  int partial = args[i].partial;
	  int nregs;
	  int size = 0;
	  rtx before_arg = get_last_insn ();
	  /* Set to non-negative if must move a word at a time, even if just
	     one word (e.g., partial == 1 && mode == DFmode).  Set to -1 if
	     we just use a normal move insn.  This value can be zero if the
	     argument is a zero size structure with no fields.  */
	  nregs = -1;
	  if (partial)
	    nregs = partial;
	  else if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode)
	    {
	      size = int_size_in_bytes (TREE_TYPE (args[i].tree_value));
	      nregs = (size + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD;
	    }
	  else
	    size = GET_MODE_SIZE (args[i].mode);

	  /* Handle calls that pass values in multiple non-contiguous
	     locations.  The Irix 6 ABI has examples of this.  */

	  if (GET_CODE (reg) == PARALLEL)
	    {
	      tree type = TREE_TYPE (args[i].tree_value);
	      emit_group_load (reg, args[i].value, type,
			       int_size_in_bytes (type));
	    }

	  /* If simple case, just do move.  If normal partial, store_one_arg
	     has already loaded the register for us.  In all other cases,
	     load the register(s) from memory.  */

	  else if (nregs == -1)
	    {
	      emit_move_insn (reg, args[i].value);
#ifdef BLOCK_REG_PADDING
	      /* Handle case where we have a value that needs shifting
		 up to the msb.  E.g. a QImode value and we're padding
		 upward on a BYTES_BIG_ENDIAN machine.  */
	      if (size < UNITS_PER_WORD
		  && (args[i].locate.where_pad
		      == (BYTES_BIG_ENDIAN ? upward : downward)))
		{
		  rtx x;
		  int shift = (UNITS_PER_WORD - size) * BITS_PER_UNIT;

		  /* Assigning REG here rather than a temp makes CALL_FUSAGE
		     report the whole reg as used.  Strictly speaking, the
		     call only uses SIZE bytes at the msb end, but it doesn't
		     seem worth generating rtl to say that.  */
		  reg = gen_rtx_REG (word_mode, REGNO (reg));
		  x = expand_shift (LSHIFT_EXPR, word_mode, reg,
				    build_int_cst (NULL_TREE, shift),
				    reg, 1);
		  if (x != reg)
		    emit_move_insn (reg, x);
		}
#endif
	    }

	  /* If we have pre-computed the values to put in the registers in
	     the case of non-aligned structures, copy them in now.  */

	  else if (args[i].n_aligned_regs != 0)
	    for (j = 0; j < args[i].n_aligned_regs; j++)
	      emit_move_insn (gen_rtx_REG (word_mode, REGNO (reg) + j),
			      args[i].aligned_regs[j]);

	  else if (partial == 0 || args[i].pass_on_stack)
	    {
	      rtx mem = validize_mem (args[i].value);

	      /* Handle a BLKmode that needs shifting.  */
	      if (nregs == 1 && size < UNITS_PER_WORD
#ifdef BLOCK_REG_PADDING
		  && args[i].locate.where_pad == downward
#else
		  && BYTES_BIG_ENDIAN
#endif
		  )
		{
		  rtx tem = operand_subword_force (mem, 0, args[i].mode);
		  rtx ri = gen_rtx_REG (word_mode, REGNO (reg));
		  rtx x = gen_reg_rtx (word_mode);
		  int shift = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
		  enum tree_code dir = BYTES_BIG_ENDIAN ? RSHIFT_EXPR
							: LSHIFT_EXPR;

		  emit_move_insn (x, tem);
		  x = expand_shift (dir, word_mode, x,
				    build_int_cst (NULL_TREE, shift),
				    ri, 1);
		  if (x != ri)
		    emit_move_insn (ri, x);
		}
	      else
		move_block_to_reg (REGNO (reg), mem, nregs, args[i].mode);
	    }

	  /* When a parameter is a block, and perhaps in other cases, it is
	     possible that it did a load from an argument slot that was
	     already clobbered.  */
	  if (is_sibcall
	      && check_sibcall_argument_overlap (before_arg, &args[i], 0))
	    *sibcall_failure = 1;

	  /* Handle calls that pass values in multiple non-contiguous
	     locations.  The Irix 6 ABI has examples of this.  */
	  if (GET_CODE (reg) == PARALLEL)
	    use_group_regs (call_fusage, reg);
	  else if (nregs == -1)
	    use_reg (call_fusage, reg);
	  else
	    use_regs (call_fusage, REGNO (reg), nregs == 0 ? 1 : nregs);
	}
    }
}

/* We need to pop PENDING_STACK_ADJUST bytes.  But, if the arguments
   wouldn't fill up an even multiple of PREFERRED_UNIT_STACK_BOUNDARY
   bytes, then we would need to push some additional bytes to pad the
   arguments.  So, we compute an adjustment to the stack pointer for an
   amount that will leave the stack under-aligned by UNADJUSTED_ARGS_SIZE
   bytes.  Then, when the arguments are pushed the stack will be perfectly
   aligned.  ARGS_SIZE->CONSTANT is set to the number of bytes that should
   be popped after the call.  Returns the adjustment.  */
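
/* A worked example (numbers hypothetical): with a preferred unit
   boundary of 16, stack_pointer_delta == 0, unadjusted_args_size == 4
   and pending_stack_adjust == 20, UNADJUSTED_ALIGNMENT starts as
   (0 + 4) % 16 == 4; popping the 20 pending bytes cancels it
   (4 - 20 % 16 == 0), so ADJUSTMENT stays 20 and ARGS_SIZE->CONSTANT
   becomes 20 - 20 + 4 == 4.  */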

static int
combine_pending_stack_adjustment_and_call (int unadjusted_args_size,
					   struct args_size *args_size,
					   unsigned int preferred_unit_stack_boundary)
{
  /* The number of bytes to pop so that the stack will be
     under-aligned by UNADJUSTED_ARGS_SIZE bytes.  */
  HOST_WIDE_INT adjustment;
  /* The alignment of the stack after the arguments are pushed, if we
     just pushed the arguments without adjusting the stack here.  */
  unsigned HOST_WIDE_INT unadjusted_alignment;

  unadjusted_alignment
    = ((stack_pointer_delta + unadjusted_args_size)
       % preferred_unit_stack_boundary);

  /* We want to get rid of as many of the PENDING_STACK_ADJUST bytes
     as possible -- leaving just enough left to cancel out the
     UNADJUSTED_ALIGNMENT.  In other words, we want to ensure that the
     PENDING_STACK_ADJUST is non-negative, and congruent to
     -UNADJUSTED_ALIGNMENT modulo the PREFERRED_UNIT_STACK_BOUNDARY.  */

  /* Begin by trying to pop all the bytes.  */
  unadjusted_alignment
    = (unadjusted_alignment
       - (pending_stack_adjust % preferred_unit_stack_boundary));
  adjustment = pending_stack_adjust;
  /* Push enough additional bytes that the stack will be aligned
     after the arguments are pushed.  */
  if (preferred_unit_stack_boundary > 1)
    {
      if (unadjusted_alignment > 0)
	adjustment -= preferred_unit_stack_boundary - unadjusted_alignment;
      else
	adjustment += unadjusted_alignment;
    }

  /* Now, set ARGS_SIZE->CONSTANT so that we pop the right number of
     bytes after the call.  The right number is the entire
     PENDING_STACK_ADJUST less our ADJUSTMENT plus the amount required
     by the arguments in the first place.  */
  args_size->constant
    = pending_stack_adjust - adjustment + unadjusted_args_size;

  return adjustment;
}

/* Scan expression X to check whether it dereferences any argument slots
   we already clobbered with tail call arguments (as noted in the
   stored_args_map bitmap).  Return nonzero if X dereferences such an
   argument slot, zero otherwise.  */
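
/* For instance (hypothetical layout): if a tail call argument was stored
   at offsets 4..7, those bits are set in stored_args_map, and a 4-byte
   MEM at (plus internal_arg_pointer 6) overlaps bytes 6..9, so the walk
   below returns 1.  */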

static int
check_sibcall_argument_overlap_1 (rtx x)
{
  RTX_CODE code;
  int i, j;
  unsigned int k;
  const char *fmt;

  if (x == NULL_RTX)
    return 0;

  code = GET_CODE (x);

  if (code == MEM)
    {
      if (XEXP (x, 0) == current_function_internal_arg_pointer)
	i = 0;
      else if (GET_CODE (XEXP (x, 0)) == PLUS
	       && XEXP (XEXP (x, 0), 0) ==
		  current_function_internal_arg_pointer
	       && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)
	i = INTVAL (XEXP (XEXP (x, 0), 1));
      else
	return 1;

#ifdef ARGS_GROW_DOWNWARD
      i = -i - GET_MODE_SIZE (GET_MODE (x));
#endif

      for (k = 0; k < GET_MODE_SIZE (GET_MODE (x)); k++)
	if (i + k < stored_args_map->n_bits
	    && TEST_BIT (stored_args_map, i + k))
	  return 1;

      return 0;
    }

  /* Scan all subexpressions.  */
  fmt = GET_RTX_FORMAT (code);
  for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
    {
      if (*fmt == 'e')
	{
	  if (check_sibcall_argument_overlap_1 (XEXP (x, i)))
	    return 1;
	}
      else if (*fmt == 'E')
	{
	  for (j = 0; j < XVECLEN (x, i); j++)
	    if (check_sibcall_argument_overlap_1 (XVECEXP (x, i, j)))
	      return 1;
	}
    }
  return 0;
}

/* Scan the sequence after INSN to check whether it dereferences any
   argument slots we already clobbered with tail call arguments (as noted
   in the stored_args_map bitmap).  If MARK_STORED_ARGS_MAP, add stack
   slots for ARG to the stored_args_map bitmap afterwards (when ARG is a
   register MARK_STORED_ARGS_MAP should be 0).  Return nonzero if the
   sequence after INSN dereferences such argument slots, zero
   otherwise.  */

static int
check_sibcall_argument_overlap (rtx insn, struct arg_data *arg,
				int mark_stored_args_map)
{
  int low, high;

  if (insn == NULL_RTX)
    insn = get_insns ();
  else
    insn = NEXT_INSN (insn);

  for (; insn; insn = NEXT_INSN (insn))
    if (INSN_P (insn)
	&& check_sibcall_argument_overlap_1 (PATTERN (insn)))
      break;

  if (mark_stored_args_map)
    {
#ifdef ARGS_GROW_DOWNWARD
      low = -arg->locate.slot_offset.constant - arg->locate.size.constant;
#else
      low = arg->locate.slot_offset.constant;
#endif

      for (high = low + arg->locate.size.constant; low < high; low++)
	SET_BIT (stored_args_map, low);
    }
  return insn != NULL_RTX;
}

/* If function value *VALUE was returned at the most significant end of a
   register, shift it towards the least significant end and convert it to
   TYPE's mode.  Return true and update *VALUE if some action was needed.

   TYPE is the type of the function's return value, which is known not
   to have mode BLKmode.  */
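
/* E.g. (assuming a 64-bit return register and a 32-bit TYPE returned in
   its most significant half): shift == 64 - 32 == 32, so the value is
   logically shifted right 32 bits and then truncated to the 32-bit
   mode.  */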
1714 static bool
1715 shift_returned_value (tree type, rtx *value)
1717 if (targetm.calls.return_in_msb (type))
1719 HOST_WIDE_INT shift;
1721 shift = (GET_MODE_BITSIZE (GET_MODE (*value))
1722 - BITS_PER_UNIT * int_size_in_bytes (type));
1723 if (shift > 0)
1725 /* Shift the value into the low part of the register. */
1726 *value = expand_binop (GET_MODE (*value), lshr_optab, *value,
1727 GEN_INT (shift), 0, 1, OPTAB_WIDEN);
1729 /* Truncate it to the type's mode, or its integer equivalent.
1730 This is subject to TRULY_NOOP_TRUNCATION. */
1731 *value = convert_to_mode (int_mode_for_mode (TYPE_MODE (type)),
1732 *value, 0);
1734 /* Now convert it to the final form. */
1735 *value = gen_lowpart (TYPE_MODE (type), *value);
1736 return true;
1739 return false;
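/* Worked example of the shift above, assuming a 32-bit return register
   and BITS_PER_UNIT == 8: a QImode (1-byte) value returned in the most
   significant end needs shift = 32 - 8 * 1 = 24, i.e. a logical right
   shift by 24 bits before the low part is extracted.  Standalone sketch
   with hypothetical names:  */
#if 0
static int
example_msb_shift (int reg_bits, int type_size_bytes)
{
  int shift = reg_bits - 8 * type_size_bytes;
  return shift > 0 ? shift : 0;  /* no shift needed if value fills reg */
}
#endif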
1742 /* Remove all REG_EQUIV notes found in the insn chain. */
1744 static void
1745 purge_reg_equiv_notes (void)
1747 rtx insn;
1749 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
1751 while (1)
1753 rtx note = find_reg_note (insn, REG_EQUIV, 0);
1754 if (note)
1756 /* Remove the note and keep looking at the notes for
1757 this insn. */
1758 remove_note (insn, note);
1759 continue;
1761 break;
1766 /* Generate all the code for a function call
1767 and return an rtx for its value.
1768 Store the value in TARGET (specified as an rtx) if convenient.
1769 If the value is stored in TARGET then TARGET is returned.
1770 If IGNORE is nonzero, then we ignore the value of the function call. */
1772 rtx
1773 expand_call (tree exp, rtx target, int ignore)
1775 /* Nonzero if we are currently expanding a call. */
1776 static int currently_expanding_call = 0;
1778 /* List of actual parameters. */
1779 tree actparms = TREE_OPERAND (exp, 1);
1780 /* RTX for the function to be called. */
1781 rtx funexp;
1782 /* Sequence of insns to perform a normal "call". */
1783 rtx normal_call_insns = NULL_RTX;
1784 /* Sequence of insns to perform a tail "call". */
1785 rtx tail_call_insns = NULL_RTX;
1786 /* Data type of the function. */
1787 tree funtype;
1788 tree type_arg_types;
1789 /* Declaration of the function being called,
1790 or 0 if the function is computed (not known by name). */
1791 tree fndecl = 0;
1792 /* The type of the function being called. */
1793 tree fntype;
1794 bool try_tail_call = CALL_EXPR_TAILCALL (exp);
1795 int pass;
1797 /* Register in which non-BLKmode value will be returned,
1798 or 0 if no value or if value is BLKmode. */
1799 rtx valreg;
1800 /* Address where we should return a BLKmode value;
1801 0 if value not BLKmode. */
1802 rtx structure_value_addr = 0;
1803 /* Nonzero if that address is being passed by treating it as
1804 an extra, implicit first parameter. Otherwise,
1805 it is passed by being copied directly into struct_value_rtx. */
1806 int structure_value_addr_parm = 0;
1807 /* Size of aggregate value wanted, or zero if none wanted
1808 or if we are using the non-reentrant PCC calling convention
1809 or expecting the value in registers. */
1810 HOST_WIDE_INT struct_value_size = 0;
1811 /* Nonzero if called function returns an aggregate in memory PCC style,
1812 by returning the address of where to find it. */
1813 int pcc_struct_value = 0;
1814 rtx struct_value = 0;
1816 /* Number of actual parameters in this call, including struct value addr. */
1817 int num_actuals;
1818 /* Number of named args. Args after this are anonymous ones
1819 and they must all go on the stack. */
1820 int n_named_args;
1822 /* Vector of information about each argument.
1823 Arguments are numbered in the order they will be pushed,
1824 not the order they are written. */
1825 struct arg_data *args;
1827 /* Total size in bytes of all the stack-parms scanned so far. */
1828 struct args_size args_size;
1829 struct args_size adjusted_args_size;
1830 /* Size of arguments before any adjustments (such as rounding). */
1831 int unadjusted_args_size;
1832 /* Data on reg parms scanned so far. */
1833 CUMULATIVE_ARGS args_so_far;
1834 /* Nonzero if a reg parm has been scanned. */
1835 int reg_parm_seen;
1838 /* Nonzero if we must avoid push-insns in the args for this call.
1839 If stack space is allocated for register parameters, but not by the
1840 caller, then it is preallocated in the fixed part of the stack frame.
1841 So the entire argument block must then be preallocated (i.e., we
1842 ignore PUSH_ROUNDING in that case). */
1844 int must_preallocate = !PUSH_ARGS;
1846 /* Size of the stack reserved for parameter registers. */
1847 int reg_parm_stack_space = 0;
1849 /* Address of space preallocated for stack parms
1850 (on machines that lack push insns), or 0 if space not preallocated. */
1851 rtx argblock = 0;
1853 /* Mask of ECF_ flags. */
1854 int flags = 0;
1855 #ifdef REG_PARM_STACK_SPACE
1856 /* Define the boundary of the register parm stack space that needs to be
1857 saved, if any. */
1858 int low_to_save, high_to_save;
1859 rtx save_area = 0; /* Place that it is saved */
1860 #endif
1862 int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
1863 char *initial_stack_usage_map = stack_usage_map;
1865 int old_stack_allocated;
1867 /* State variables to track stack modifications. */
1868 rtx old_stack_level = 0;
1869 int old_stack_arg_under_construction = 0;
1870 int old_pending_adj = 0;
1871 int old_inhibit_defer_pop = inhibit_defer_pop;
1873 /* Some stack pointer alterations we make are performed via
1874 allocate_dynamic_stack_space. This modifies the stack_pointer_delta,
1875 which we then also need to save/restore along the way. */
1876 int old_stack_pointer_delta = 0;
1878 rtx call_fusage;
1879 tree p = TREE_OPERAND (exp, 0);
1880 tree addr = TREE_OPERAND (exp, 0);
1881 int i;
1882 /* The alignment of the stack, in bits. */
1883 unsigned HOST_WIDE_INT preferred_stack_boundary;
1884 /* The alignment of the stack, in bytes. */
1885 unsigned HOST_WIDE_INT preferred_unit_stack_boundary;
1886 /* The static chain value to use for this call. */
1887 rtx static_chain_value;
1888 /* See if this is a "nothrow" function call. */
1889 if (TREE_NOTHROW (exp))
1890 flags |= ECF_NOTHROW;
1892 /* See if we can find a DECL-node for the actual function, and get the
1893 function attributes (flags) from the function decl or type node. */
1894 fndecl = get_callee_fndecl (exp);
1895 if (fndecl)
1897 fntype = TREE_TYPE (fndecl);
1898 flags |= flags_from_decl_or_type (fndecl);
1900 else
1902 fntype = TREE_TYPE (TREE_TYPE (p));
1903 flags |= flags_from_decl_or_type (fntype);
1906 struct_value = targetm.calls.struct_value_rtx (fntype, 0);
1908 /* Warn if this value is an aggregate type,
1909 regardless of which calling convention we are using for it. */
1910 if (warn_aggregate_return && AGGREGATE_TYPE_P (TREE_TYPE (exp)))
1911 warning ("function call has aggregate value");
1913 /* If the result of a pure or const function call is ignored (or void),
1914 and none of its arguments are volatile, we can avoid expanding the
1915 call and just evaluate the arguments for side-effects. */
1916 if ((flags & (ECF_CONST | ECF_PURE))
1917 && (ignore || target == const0_rtx
1918 || TYPE_MODE (TREE_TYPE (exp)) == VOIDmode))
1920 bool volatilep = false;
1921 tree arg;
1923 for (arg = actparms; arg; arg = TREE_CHAIN (arg))
1924 if (TREE_THIS_VOLATILE (TREE_VALUE (arg)))
1926 volatilep = true;
1927 break;
1930 if (! volatilep)
1932 for (arg = actparms; arg; arg = TREE_CHAIN (arg))
1933 expand_expr (TREE_VALUE (arg), const0_rtx,
1934 VOIDmode, EXPAND_NORMAL);
1935 return const0_rtx;
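/* Example of the elision above (illustrative user source, not part of
   this file): the call below produces no call insn at all; its argument
   is expanded only for side effects and the call expression evaluates
   to const0_rtx.  */
#if 0
extern int f (int) __attribute__ ((const));

void
g (int x)
{
  f (x + 1);  /* result ignored, f is const: the call is dropped */
}
#endif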
1939 #ifdef REG_PARM_STACK_SPACE
1940 reg_parm_stack_space = REG_PARM_STACK_SPACE (fndecl);
1941 #endif
1943 #ifndef OUTGOING_REG_PARM_STACK_SPACE
1944 if (reg_parm_stack_space > 0 && PUSH_ARGS)
1945 must_preallocate = 1;
1946 #endif
1948 /* Set up a place to return a structure. */
1950 /* Cater to broken compilers. */
1951 if (aggregate_value_p (exp, fndecl))
1953 /* This call returns a big structure. */
1954 flags &= ~(ECF_CONST | ECF_PURE | ECF_LIBCALL_BLOCK);
1956 #ifdef PCC_STATIC_STRUCT_RETURN
1958 pcc_struct_value = 1;
1960 #else /* not PCC_STATIC_STRUCT_RETURN */
1962 struct_value_size = int_size_in_bytes (TREE_TYPE (exp));
1964 if (CALL_EXPR_HAS_RETURN_SLOT_ADDR (exp))
1966 /* The structure value address arg is already in actparms.
1967 Pull it out. It might be nice to just leave it there, but
1968 we need to set structure_value_addr. */
1969 tree return_arg = TREE_VALUE (actparms);
1970 actparms = TREE_CHAIN (actparms);
1971 structure_value_addr = expand_expr (return_arg, NULL_RTX,
1972 VOIDmode, EXPAND_NORMAL);
1974 else if (target && MEM_P (target))
1975 structure_value_addr = XEXP (target, 0);
1976 else
1978 /* For variable-sized objects, we must be called with a target
1979 specified. If we were to allocate space on the stack here,
1980 we would have no way of knowing when to free it. */
1981 rtx d = assign_temp (TREE_TYPE (exp), 1, 1, 1);
1983 mark_temp_addr_taken (d);
1984 structure_value_addr = XEXP (d, 0);
1985 target = 0;
1988 #endif /* not PCC_STATIC_STRUCT_RETURN */
1991 /* Figure out the amount to which the stack should be aligned. */
1992 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
1993 if (fndecl)
1995 struct cgraph_rtl_info *i = cgraph_rtl_info (fndecl);
1996 if (i && i->preferred_incoming_stack_boundary)
1997 preferred_stack_boundary = i->preferred_incoming_stack_boundary;
2000 /* Operand 0 is a pointer-to-function; get the type of the function. */
2001 funtype = TREE_TYPE (addr);
2002 gcc_assert (POINTER_TYPE_P (funtype));
2003 funtype = TREE_TYPE (funtype);
2005 /* Munge the tree to split complex arguments into their imaginary
2006 and real parts. */
2007 if (targetm.calls.split_complex_arg)
2009 type_arg_types = split_complex_types (TYPE_ARG_TYPES (funtype));
2010 actparms = split_complex_values (actparms);
2012 else
2013 type_arg_types = TYPE_ARG_TYPES (funtype);
2015 if (flags & ECF_MAY_BE_ALLOCA)
2016 current_function_calls_alloca = 1;
2018 /* If struct_value_rtx is 0, it means pass the address
2019 as if it were an extra parameter. */
2020 if (structure_value_addr && struct_value == 0)
2022 /* If structure_value_addr is a REG other than
2023 virtual_outgoing_args_rtx, we can always use it. If it
2024 is not a REG, we must always copy it into a register.
2025 If it is virtual_outgoing_args_rtx, we must copy it to another
2026 register in some cases. */
2027 rtx temp = (!REG_P (structure_value_addr)
2028 || (ACCUMULATE_OUTGOING_ARGS
2029 && stack_arg_under_construction
2030 && structure_value_addr == virtual_outgoing_args_rtx)
2031 ? copy_addr_to_reg (convert_memory_address
2032 (Pmode, structure_value_addr))
2033 : structure_value_addr);
2035 actparms
2036 = tree_cons (error_mark_node,
2037 make_tree (build_pointer_type (TREE_TYPE (funtype)),
2038 temp),
2039 actparms);
2040 structure_value_addr_parm = 1;
2043 /* Count the arguments and set NUM_ACTUALS. */
2044 for (p = actparms, num_actuals = 0; p; p = TREE_CHAIN (p))
2045 num_actuals++;
2047 /* Compute number of named args.
2048 First, do a raw count of the args for INIT_CUMULATIVE_ARGS. */
2050 if (type_arg_types != 0)
2051 n_named_args
2052 = (list_length (type_arg_types)
2053 /* Count the struct value address, if it is passed as a parm. */
2054 + structure_value_addr_parm);
2055 else
2056 /* If we know nothing, treat all args as named. */
2057 n_named_args = num_actuals;
2059 /* Start updating where the next arg would go.
2061 On some machines (such as the PA) indirect calls have a different
2062 calling convention than normal calls. The fourth argument in
2063 INIT_CUMULATIVE_ARGS tells the backend if this is an indirect call
2064 or not. */
2065 INIT_CUMULATIVE_ARGS (args_so_far, funtype, NULL_RTX, fndecl, n_named_args);
2067 /* Now possibly adjust the number of named args.
2068 Normally, don't include the last named arg if anonymous args follow.
2069 We do include the last named arg if
2070 targetm.calls.strict_argument_naming() returns nonzero.
2071 (If no anonymous args follow, the result of list_length is actually
2072 one too large. This is harmless.)
2074 If targetm.calls.pretend_outgoing_varargs_named() returns
2075 nonzero, and targetm.calls.strict_argument_naming() returns zero,
2076 this machine will be able to place unnamed args that were passed
2077 in registers into the stack. So treat all args as named. This
2078 allows the insns emitting for a specific argument list to be
2079 independent of the function declaration.
2081 If targetm.calls.pretend_outgoing_varargs_named() returns zero,
2082 we do not have any reliable way to pass unnamed args in
2083 registers, so we must force them into memory. */
2085 if (type_arg_types != 0
2086 && targetm.calls.strict_argument_naming (&args_so_far))
2087 ;
2088 else if (type_arg_types != 0
2089 && ! targetm.calls.pretend_outgoing_varargs_named (&args_so_far))
2090 /* Don't include the last named arg. */
2091 --n_named_args;
2092 else
2093 /* Treat all args as named. */
2094 n_named_args = num_actuals;
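/* Worked example of the count above, assuming a target where neither
   strict_argument_naming nor pretend_outgoing_varargs_named holds:

     int f (int a, int b);          TYPE_ARG_TYPES = int, int, void
     int g (const char *fmt, ...);  TYPE_ARG_TYPES = const char *

   list_length gives 3 for f (one too large because of the trailing
   void node) and 1 for g.  The --n_named_args branch then leaves f
   with 2 named args (the over-count cancels out) and g with 0, so
   fmt is deliberately treated like the anonymous args that follow.  */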
2096 /* Make a vector to hold all the information about each arg. */
2097 args = alloca (num_actuals * sizeof (struct arg_data));
2098 memset (args, 0, num_actuals * sizeof (struct arg_data));
2100 /* Build up entries in the ARGS array, compute the size of the
2101 arguments into ARGS_SIZE, etc. */
2102 initialize_argument_information (num_actuals, args, &args_size,
2103 n_named_args, actparms, fndecl,
2104 &args_so_far, reg_parm_stack_space,
2105 &old_stack_level, &old_pending_adj,
2106 &must_preallocate, &flags,
2107 &try_tail_call, CALL_FROM_THUNK_P (exp));
2109 if (args_size.var)
2111 /* If this function requires a variable-sized argument list, don't
2112 try to make a cse'able block for this call. We may be able to
2113 do this eventually, but it is too complicated to keep track of
2114 what insns go in the cse'able block and which don't. */
2116 flags &= ~ECF_LIBCALL_BLOCK;
2117 must_preallocate = 1;
2120 /* Now make final decision about preallocating stack space. */
2121 must_preallocate = finalize_must_preallocate (must_preallocate,
2122 num_actuals, args,
2123 &args_size);
2125 /* If the structure value address will reference the stack pointer, we
2126 must stabilize it. We don't need to do this if we know that we are
2127 not going to adjust the stack pointer in processing this call. */
2129 if (structure_value_addr
2130 && (reg_mentioned_p (virtual_stack_dynamic_rtx, structure_value_addr)
2131 || reg_mentioned_p (virtual_outgoing_args_rtx,
2132 structure_value_addr))
2133 && (args_size.var
2134 || (!ACCUMULATE_OUTGOING_ARGS && args_size.constant)))
2135 structure_value_addr = copy_to_reg (structure_value_addr);
2137 /* Tail calls can make things harder to debug, and we've traditionally
2138 pushed these optimizations into -O2. Don't try if we're already
2139 expanding a call, as that means we're an argument. Don't try if
2140 there are cleanups, as we know there's code to follow the call. */
2142 if (currently_expanding_call++ != 0
2143 || !flag_optimize_sibling_calls
2144 || args_size.var
2145 || lookup_stmt_eh_region (exp) >= 0)
2146 try_tail_call = 0;
2148 /* Other reasons for tail call optimization to fail. */
2149 if (
2150 #ifdef HAVE_sibcall_epilogue
2151 !HAVE_sibcall_epilogue
2152 #else
2153 1
2154 #endif
2155 || !try_tail_call
2156 /* Doing sibling call optimization needs some work, since
2157 structure_value_addr can be allocated on the stack.
2158 It does not seem worth the effort since few optimizable
2159 sibling calls will return a structure. */
2160 || structure_value_addr != NULL_RTX
2161 /* Check whether the target is able to optimize the call
2162 into a sibcall. */
2163 || !targetm.function_ok_for_sibcall (fndecl, exp)
2164 /* Functions that do not return exactly once may not be sibcall
2165 optimized. */
2166 || (flags & (ECF_RETURNS_TWICE | ECF_LONGJMP | ECF_NORETURN))
2167 || TYPE_VOLATILE (TREE_TYPE (TREE_TYPE (addr)))
2168 /* If the called function is nested in the current one, it might access
2169 some of the caller's arguments, but could clobber them beforehand if
2170 the argument areas are shared. */
2171 || (fndecl && decl_function_context (fndecl) == current_function_decl)
2172 /* If this function requires more stack slots than the current
2173 function, we cannot change it into a sibling call. */
2174 || args_size.constant > current_function_args_size
2175 /* If the callee pops its own arguments, then it must pop exactly
2176 the same number of arguments as the current function. */
2177 || (RETURN_POPS_ARGS (fndecl, funtype, args_size.constant)
2178 != RETURN_POPS_ARGS (current_function_decl,
2179 TREE_TYPE (current_function_decl),
2180 current_function_args_size))
2181 || !lang_hooks.decls.ok_for_sibcall (fndecl))
2182 try_tail_call = 0;
2184 /* Ensure current function's preferred stack boundary is at least
2185 what we need. We don't have to increase alignment for recursive
2186 functions. */
2187 if (cfun->preferred_stack_boundary < preferred_stack_boundary
2188 && fndecl != current_function_decl)
2189 cfun->preferred_stack_boundary = preferred_stack_boundary;
2190 if (fndecl == current_function_decl)
2191 cfun->recursive_call_emit = true;
2193 preferred_unit_stack_boundary = preferred_stack_boundary / BITS_PER_UNIT;
2195 /* We want to make two insn chains; one for a sibling call, the other
2196 for a normal call. We will select one of the two chains after
2197 initial RTL generation is complete. */
2198 for (pass = try_tail_call ? 0 : 1; pass < 2; pass++)
2200 int sibcall_failure = 0;
2201 /* We want to emit any pending stack adjustments before the tail
2202 recursion "call". That way we know any adjustment after the tail
2203 recursion call can be ignored if we indeed use the tail
2204 call expansion. */
2205 int save_pending_stack_adjust = 0;
2206 int save_stack_pointer_delta = 0;
2207 rtx insns;
2208 rtx before_call, next_arg_reg;
2210 if (pass == 0)
2212 /* State variables we need to save and restore between
2213 iterations. */
2214 save_pending_stack_adjust = pending_stack_adjust;
2215 save_stack_pointer_delta = stack_pointer_delta;
2217 if (pass)
2218 flags &= ~ECF_SIBCALL;
2219 else
2220 flags |= ECF_SIBCALL;
2222 /* Other state variables that we must reinitialize each time
2223 through the loop (that are not initialized by the loop itself). */
2224 argblock = 0;
2225 call_fusage = 0;
2227 /* Start a new sequence for the normal call case.
2229 From this point on, if the sibling call fails, we want to set
2230 sibcall_failure instead of continuing the loop. */
2231 start_sequence ();
2233 /* Don't let pending stack adjusts add up to too much.
2234 Also, do all pending adjustments now if there is any chance
2235 this might be a call to alloca or if we are expanding a sibling
2236 call sequence or if we are calling a function that is to return
2237 with stack pointer depressed. */
2238 if (pending_stack_adjust >= 32
2239 || (pending_stack_adjust > 0
2240 && (flags & (ECF_MAY_BE_ALLOCA | ECF_SP_DEPRESSED)))
2241 || pass == 0)
2242 do_pending_stack_adjust ();
2244 /* When calling a const function, we must pop the stack args right away,
2245 so that the pop is deleted or moved with the call. */
2246 if (pass && (flags & ECF_LIBCALL_BLOCK))
2247 NO_DEFER_POP;
2249 /* Precompute any arguments as needed. */
2250 if (pass)
2251 precompute_arguments (flags, num_actuals, args);
2253 /* Now we are about to start emitting insns that can be deleted
2254 if a libcall is deleted. */
2255 if (pass && (flags & (ECF_LIBCALL_BLOCK | ECF_MALLOC)))
2256 start_sequence ();
2258 adjusted_args_size = args_size;
2259 /* Compute the actual size of the argument block required. The variable
2260 and constant sizes must be combined, the size may have to be rounded,
2261 and there may be a minimum required size. When generating a sibcall
2262 pattern, do not round up, since we'll be re-using whatever space our
2263 caller provided. */
2264 unadjusted_args_size
2265 = compute_argument_block_size (reg_parm_stack_space,
2266 &adjusted_args_size,
2267 (pass == 0 ? 0
2268 : preferred_stack_boundary));
2270 old_stack_allocated = stack_pointer_delta - pending_stack_adjust;
2272 /* The argument block when performing a sibling call is the
2273 incoming argument block. */
2274 if (pass == 0)
2276 argblock = virtual_incoming_args_rtx;
2277 argblock
2278 #ifdef STACK_GROWS_DOWNWARD
2279 = plus_constant (argblock, current_function_pretend_args_size);
2280 #else
2281 = plus_constant (argblock, -current_function_pretend_args_size);
2282 #endif
2283 stored_args_map = sbitmap_alloc (args_size.constant);
2284 sbitmap_zero (stored_args_map);
2287 /* If we have no actual push instructions, or shouldn't use them,
2288 make space for all args right now. */
2289 else if (adjusted_args_size.var != 0)
2291 if (old_stack_level == 0)
2293 emit_stack_save (SAVE_BLOCK, &old_stack_level, NULL_RTX);
2294 old_stack_pointer_delta = stack_pointer_delta;
2295 old_pending_adj = pending_stack_adjust;
2296 pending_stack_adjust = 0;
2297 /* stack_arg_under_construction says whether a stack arg is
2298 being constructed at the old stack level. Pushing the stack
2299 gets a clean outgoing argument block. */
2300 old_stack_arg_under_construction = stack_arg_under_construction;
2301 stack_arg_under_construction = 0;
2303 argblock = push_block (ARGS_SIZE_RTX (adjusted_args_size), 0, 0);
2305 else
2307 /* Note that we must go through the motions of allocating an argument
2308 block even if the size is zero because we may be storing args
2309 in the area reserved for register arguments, which may be part of
2310 the stack frame. */
2312 int needed = adjusted_args_size.constant;
2314 /* Store the maximum argument space used. It will be pushed by
2315 the prologue (if ACCUMULATE_OUTGOING_ARGS, or stack overflow
2316 checking). */
2318 if (needed > current_function_outgoing_args_size)
2319 current_function_outgoing_args_size = needed;
2321 if (must_preallocate)
2323 if (ACCUMULATE_OUTGOING_ARGS)
2325 /* Since the stack pointer will never be pushed, it is
2326 possible for the evaluation of a parm to clobber
2327 something we have already written to the stack.
2328 Since most function calls on RISC machines do not use
2329 the stack, this is uncommon, but must work correctly.
2331 Therefore, we save any area of the stack that was already
2332 written and that we are using. Here we set up to do this
2333 by making a new stack usage map from the old one. The
2334 actual save will be done by store_one_arg.
2336 Another approach might be to try to reorder the argument
2337 evaluations to avoid this conflicting stack usage. */
2339 #ifndef OUTGOING_REG_PARM_STACK_SPACE
2340 /* Since we will be writing into the entire argument area,
2341 the map must be allocated for its entire size, not just
2342 the part that is the responsibility of the caller. */
2343 needed += reg_parm_stack_space;
2344 #endif
2346 #ifdef ARGS_GROW_DOWNWARD
2347 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
2348 needed + 1);
2349 #else
2350 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
2351 needed);
2352 #endif
2353 stack_usage_map = alloca (highest_outgoing_arg_in_use);
2355 if (initial_highest_arg_in_use)
2356 memcpy (stack_usage_map, initial_stack_usage_map,
2357 initial_highest_arg_in_use);
2359 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
2360 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
2361 (highest_outgoing_arg_in_use
2362 - initial_highest_arg_in_use));
2363 needed = 0;
2365 /* The address of the outgoing argument list must not be
2366 copied to a register here, because argblock would be left
2367 pointing to the wrong place after the call to
2368 allocate_dynamic_stack_space below. */
2370 argblock = virtual_outgoing_args_rtx;
2372 else
2374 if (inhibit_defer_pop == 0)
2376 /* Try to reuse some or all of the pending_stack_adjust
2377 to get this space. */
2378 needed
2379 = (combine_pending_stack_adjustment_and_call
2380 (unadjusted_args_size,
2381 &adjusted_args_size,
2382 preferred_unit_stack_boundary));
2384 /* combine_pending_stack_adjustment_and_call computes
2385 an adjustment before the arguments are allocated.
2386 Account for them and see whether or not the stack
2387 needs to go up or down. */
2388 needed = unadjusted_args_size - needed;
2390 if (needed < 0)
2392 /* We're releasing stack space. */
2393 /* ??? We can avoid any adjustment at all if we're
2394 already aligned. FIXME. */
2395 pending_stack_adjust = -needed;
2396 do_pending_stack_adjust ();
2397 needed = 0;
2399 else
2400 /* We need to allocate space. We'll do that in
2401 push_block below. */
2402 pending_stack_adjust = 0;
2405 /* Special case this because overhead of `push_block' in
2406 this case is non-trivial. */
2407 if (needed == 0)
2408 argblock = virtual_outgoing_args_rtx;
2409 else
2411 argblock = push_block (GEN_INT (needed), 0, 0);
2412 #ifdef ARGS_GROW_DOWNWARD
2413 argblock = plus_constant (argblock, needed);
2414 #endif
2417 /* We only really need to call `copy_to_reg' in the case
2418 where push insns are going to be used to pass ARGBLOCK
2419 to a function call in ARGS. In that case, the stack
2420 pointer changes value from the allocation point to the
2421 call point, and hence the value of
2422 VIRTUAL_OUTGOING_ARGS_RTX changes as well. But might
2423 as well always do it. */
2424 argblock = copy_to_reg (argblock);
2429 if (ACCUMULATE_OUTGOING_ARGS)
2431 /* The save/restore code in store_one_arg handles all
2432 cases except one: a constructor call (including a C
2433 function returning a BLKmode struct) to initialize
2434 an argument. */
2435 if (stack_arg_under_construction)
2437 #ifndef OUTGOING_REG_PARM_STACK_SPACE
2438 rtx push_size = GEN_INT (reg_parm_stack_space
2439 + adjusted_args_size.constant);
2440 #else
2441 rtx push_size = GEN_INT (adjusted_args_size.constant);
2442 #endif
2443 if (old_stack_level == 0)
2445 emit_stack_save (SAVE_BLOCK, &old_stack_level,
2446 NULL_RTX);
2447 old_stack_pointer_delta = stack_pointer_delta;
2448 old_pending_adj = pending_stack_adjust;
2449 pending_stack_adjust = 0;
2450 /* stack_arg_under_construction says whether a stack
2451 arg is being constructed at the old stack level.
2452 Pushing the stack gets a clean outgoing argument
2453 block. */
2454 old_stack_arg_under_construction
2455 = stack_arg_under_construction;
2456 stack_arg_under_construction = 0;
2457 /* Make a new map for the new argument list. */
2458 stack_usage_map = alloca (highest_outgoing_arg_in_use);
2459 memset (stack_usage_map, 0, highest_outgoing_arg_in_use);
2460 highest_outgoing_arg_in_use = 0;
2462 allocate_dynamic_stack_space (push_size, NULL_RTX,
2463 BITS_PER_UNIT);
2466 /* If argument evaluation might modify the stack pointer,
2467 copy the address of the argument list to a register. */
2468 for (i = 0; i < num_actuals; i++)
2469 if (args[i].pass_on_stack)
2471 argblock = copy_addr_to_reg (argblock);
2472 break;
2476 compute_argument_addresses (args, argblock, num_actuals);
2478 /* If we push args individually in reverse order, perform stack alignment
2479 before the first push (the last arg). */
2480 if (PUSH_ARGS_REVERSED && argblock == 0
2481 && adjusted_args_size.constant != unadjusted_args_size)
2483 /* When the stack adjustment is pending, we get better code
2484 by combining the adjustments. */
2485 if (pending_stack_adjust
2486 && ! (flags & ECF_LIBCALL_BLOCK)
2487 && ! inhibit_defer_pop)
2489 pending_stack_adjust
2490 = (combine_pending_stack_adjustment_and_call
2491 (unadjusted_args_size,
2492 &adjusted_args_size,
2493 preferred_unit_stack_boundary));
2494 do_pending_stack_adjust ();
2496 else if (argblock == 0)
2497 anti_adjust_stack (GEN_INT (adjusted_args_size.constant
2498 - unadjusted_args_size));
2500 /* Now that the stack is properly aligned, pops can't safely
2501 be deferred during the evaluation of the arguments. */
2502 NO_DEFER_POP;
2504 funexp = rtx_for_function_call (fndecl, addr);
2506 /* Figure out the register where the value, if any, will come back. */
2507 valreg = 0;
2508 if (TYPE_MODE (TREE_TYPE (exp)) != VOIDmode
2509 && ! structure_value_addr)
2511 if (pcc_struct_value)
2512 valreg = hard_function_value (build_pointer_type (TREE_TYPE (exp)),
2513 fndecl, (pass == 0));
2514 else
2515 valreg = hard_function_value (TREE_TYPE (exp), fndecl, (pass == 0));
2518 /* Precompute all register parameters. It isn't safe to compute anything
2519 once we have started filling any specific hard regs. */
2520 precompute_register_parameters (num_actuals, args, &reg_parm_seen);
2522 if (TREE_OPERAND (exp, 2))
2523 static_chain_value = expand_expr (TREE_OPERAND (exp, 2),
2524 NULL_RTX, VOIDmode, 0);
2525 else
2526 static_chain_value = 0;
2528 #ifdef REG_PARM_STACK_SPACE
2529 /* Save the fixed argument area if it's part of the caller's frame and
2530 is clobbered by argument setup for this call. */
2531 if (ACCUMULATE_OUTGOING_ARGS && pass)
2532 save_area = save_fixed_argument_area (reg_parm_stack_space, argblock,
2533 &low_to_save, &high_to_save);
2534 #endif
2536 /* Now store (and compute if necessary) all non-register parms.
2537 These come before register parms, since they can require block-moves,
2538 which could clobber the registers used for register parms.
2539 Parms which have partial registers are not stored here,
2540 but we do preallocate space here if they want that. */
2542 for (i = 0; i < num_actuals; i++)
2543 if (args[i].reg == 0 || args[i].pass_on_stack)
2545 rtx before_arg = get_last_insn ();
2547 if (store_one_arg (&args[i], argblock, flags,
2548 adjusted_args_size.var != 0,
2549 reg_parm_stack_space)
2550 || (pass == 0
2551 && check_sibcall_argument_overlap (before_arg,
2552 &args[i], 1)))
2553 sibcall_failure = 1;
2555 if (flags & ECF_CONST
2556 && args[i].stack
2557 && args[i].value == args[i].stack)
2558 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
2559 gen_rtx_USE (VOIDmode,
2560 args[i].value),
2561 call_fusage);
2564 /* If we have a parm that is passed in registers but not in memory
2565 and whose alignment does not permit a direct copy into registers,
2566 make a group of pseudos that correspond to each register that we
2567 will later fill. */
2568 if (STRICT_ALIGNMENT)
2569 store_unaligned_arguments_into_pseudos (args, num_actuals);
2571 /* Now store any partially-in-registers parm.
2572 This is the last place a block-move can happen. */
2573 if (reg_parm_seen)
2574 for (i = 0; i < num_actuals; i++)
2575 if (args[i].partial != 0 && ! args[i].pass_on_stack)
2577 rtx before_arg = get_last_insn ();
2579 if (store_one_arg (&args[i], argblock, flags,
2580 adjusted_args_size.var != 0,
2581 reg_parm_stack_space)
2582 || (pass == 0
2583 && check_sibcall_argument_overlap (before_arg,
2584 &args[i], 1)))
2585 sibcall_failure = 1;
2588 /* If we pushed args in forward order, perform stack alignment
2589 after pushing the last arg. */
2590 if (!PUSH_ARGS_REVERSED && argblock == 0)
2591 anti_adjust_stack (GEN_INT (adjusted_args_size.constant
2592 - unadjusted_args_size));
2594 /* If register arguments require space on the stack and stack space
2595 was not preallocated, allocate stack space here for arguments
2596 passed in registers. */
2597 #ifdef OUTGOING_REG_PARM_STACK_SPACE
2598 if (!ACCUMULATE_OUTGOING_ARGS
2599 && must_preallocate == 0 && reg_parm_stack_space > 0)
2600 anti_adjust_stack (GEN_INT (reg_parm_stack_space));
2601 #endif
2603 /* Pass the function the address in which to return a
2604 structure value. */
2605 if (pass != 0 && structure_value_addr && ! structure_value_addr_parm)
2607 structure_value_addr
2608 = convert_memory_address (Pmode, structure_value_addr);
2609 emit_move_insn (struct_value,
2610 force_reg (Pmode,
2611 force_operand (structure_value_addr,
2612 NULL_RTX)));
2614 if (REG_P (struct_value))
2615 use_reg (&call_fusage, struct_value);
2618 funexp = prepare_call_address (funexp, static_chain_value,
2619 &call_fusage, reg_parm_seen, pass == 0);
2621 load_register_parameters (args, num_actuals, &call_fusage, flags,
2622 pass == 0, &sibcall_failure);
2624 /* Save a pointer to the last insn before the call, so that we can
2625 later safely search backwards to find the CALL_INSN. */
2626 before_call = get_last_insn ();
2628 /* Set up next argument register. For sibling calls on machines
2629 with register windows this should be the incoming register. */
2630 #ifdef FUNCTION_INCOMING_ARG
2631 if (pass == 0)
2632 next_arg_reg = FUNCTION_INCOMING_ARG (args_so_far, VOIDmode,
2633 void_type_node, 1);
2634 else
2635 #endif
2636 next_arg_reg = FUNCTION_ARG (args_so_far, VOIDmode,
2637 void_type_node, 1);
2639 /* All arguments and registers used for the call must be set up by
2640 now! */
2642 /* Stack must be properly aligned now. */
2643 gcc_assert (!pass
2644 || !(stack_pointer_delta % preferred_unit_stack_boundary));
2646 /* Generate the actual call instruction. */
2647 emit_call_1 (funexp, exp, fndecl, funtype, unadjusted_args_size,
2648 adjusted_args_size.constant, struct_value_size,
2649 next_arg_reg, valreg, old_inhibit_defer_pop, call_fusage,
2650 flags, & args_so_far);
2652 /* If call is cse'able, make appropriate pair of reg-notes around it.
2653 Test valreg so we don't crash; may safely ignore `const'
2654 if return type is void. Disable for PARALLEL return values, because
2655 we have no way to move such values into a pseudo register. */
2656 if (pass && (flags & ECF_LIBCALL_BLOCK))
2658 rtx insns;
2659 rtx insn;
2660 bool failed = valreg == 0 || GET_CODE (valreg) == PARALLEL;
2662 insns = get_insns ();
2664 /* Expansion of block moves may have introduced a loop, which is
2665 not allowed to appear inside a libcall block. */
2666 for (insn = insns; insn; insn = NEXT_INSN (insn))
2667 if (JUMP_P (insn))
2668 failed = true;
2670 if (failed)
2672 end_sequence ();
2673 emit_insn (insns);
2675 else
2677 rtx note = 0;
2678 rtx temp = gen_reg_rtx (GET_MODE (valreg));
2680 /* Mark the return value as a pointer if needed. */
2681 if (TREE_CODE (TREE_TYPE (exp)) == POINTER_TYPE)
2682 mark_reg_pointer (temp,
2683 TYPE_ALIGN (TREE_TYPE (TREE_TYPE (exp))));
2685 end_sequence ();
2686 if (flag_unsafe_math_optimizations
2687 && fndecl
2688 && DECL_BUILT_IN (fndecl)
2689 && (DECL_FUNCTION_CODE (fndecl) == BUILT_IN_SQRT
2690 || DECL_FUNCTION_CODE (fndecl) == BUILT_IN_SQRTF
2691 || DECL_FUNCTION_CODE (fndecl) == BUILT_IN_SQRTL))
2692 note = gen_rtx_fmt_e (SQRT,
2693 GET_MODE (temp),
2694 args[0].initial_value);
2695 else
2697 /* Construct an "equal form" for the value which
2698 mentions all the arguments in order as well as
2699 the function name. */
2700 for (i = 0; i < num_actuals; i++)
2701 note = gen_rtx_EXPR_LIST (VOIDmode,
2702 args[i].initial_value, note);
2703 note = gen_rtx_EXPR_LIST (VOIDmode, funexp, note);
2705 if (flags & ECF_PURE)
2706 note = gen_rtx_EXPR_LIST (VOIDmode,
2707 gen_rtx_USE (VOIDmode,
2708 gen_rtx_MEM (BLKmode,
2709 gen_rtx_SCRATCH (VOIDmode))),
2710 note);
2712 emit_libcall_block (insns, temp, valreg, note);
2714 valreg = temp;
2717 else if (pass && (flags & ECF_MALLOC))
2719 rtx temp = gen_reg_rtx (GET_MODE (valreg));
2720 rtx last, insns;
2722 /* The return value from a malloc-like function is a pointer. */
2723 if (TREE_CODE (TREE_TYPE (exp)) == POINTER_TYPE)
2724 mark_reg_pointer (temp, BIGGEST_ALIGNMENT);
2726 emit_move_insn (temp, valreg);
2728 /* The return value from a malloc-like function can not alias
2729 anything else. */
2730 last = get_last_insn ();
2731 REG_NOTES (last) =
2732 gen_rtx_EXPR_LIST (REG_NOALIAS, temp, REG_NOTES (last));
2734 /* Write out the sequence. */
2735 insns = get_insns ();
2736 end_sequence ();
2737 emit_insn (insns);
2738 valreg = temp;
2741 /* For calls to `setjmp', etc., inform flow.c it should complain
2742 if nonvolatile values are live. For functions that cannot return,
2743 inform flow that control does not fall through. */
2745 if ((flags & (ECF_NORETURN | ECF_LONGJMP)) || pass == 0)
2747 /* The barrier must be emitted
2748 immediately after the CALL_INSN. Some ports emit more
2749 than just a CALL_INSN above, so we must search for it here. */
2751 rtx last = get_last_insn ();
2752 while (!CALL_P (last))
2754 last = PREV_INSN (last);
2755 /* There was no CALL_INSN? */
2756 gcc_assert (last != before_call);
2759 emit_barrier_after (last);
2761 /* Stack adjustments after a noreturn call are dead code.
2762 However when NO_DEFER_POP is in effect, we must preserve
2763 stack_pointer_delta. */
2764 if (inhibit_defer_pop == 0)
2766 stack_pointer_delta = old_stack_allocated;
2767 pending_stack_adjust = 0;
2771 if (flags & ECF_LONGJMP)
2772 current_function_calls_longjmp = 1;
2774 /* If value type not void, return an rtx for the value. */
2776 if (TYPE_MODE (TREE_TYPE (exp)) == VOIDmode
2777 || ignore)
2778 target = const0_rtx;
2779 else if (structure_value_addr)
2781 if (target == 0 || !MEM_P (target))
2783 target
2784 = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (exp)),
2785 memory_address (TYPE_MODE (TREE_TYPE (exp)),
2786 structure_value_addr));
2787 set_mem_attributes (target, exp, 1);
2790 else if (pcc_struct_value)
2792 /* This is the special C++ case where we need to
2793 know what the true target was. We take care to
2794 never use this value more than once in one expression. */
2795 target = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (exp)),
2796 copy_to_reg (valreg));
2797 set_mem_attributes (target, exp, 1);
2799 /* Handle calls that return values in multiple non-contiguous locations.
2800 The Irix 6 ABI has examples of this. */
2801 else if (GET_CODE (valreg) == PARALLEL)
2803 if (target == 0)
2805 /* This will only be assigned once, so it can be readonly. */
2806 tree nt = build_qualified_type (TREE_TYPE (exp),
2807 (TYPE_QUALS (TREE_TYPE (exp))
2808 | TYPE_QUAL_CONST));
2810 target = assign_temp (nt, 0, 1, 1);
2811 preserve_temp_slots (target);
2814 if (! rtx_equal_p (target, valreg))
2815 emit_group_store (target, valreg, TREE_TYPE (exp),
2816 int_size_in_bytes (TREE_TYPE (exp)));
2818 /* We can not support sibling calls for this case. */
2819 sibcall_failure = 1;
2821 else if (target
2822 && GET_MODE (target) == TYPE_MODE (TREE_TYPE (exp))
2823 && GET_MODE (target) == GET_MODE (valreg))
2825 /* TARGET and VALREG cannot be equal at this point because the
2826 latter would not have REG_FUNCTION_VALUE_P true, while the
2827 former would if it were referring to the same register.
2829 If they refer to the same register, this move will be a no-op,
2830 except when function inlining is being done. */
2831 emit_move_insn (target, valreg);
2833 /* If we are setting a MEM, this code must be executed. Since it is
2834 emitted after the call insn, sibcall optimization cannot be
2835 performed in that case. */
2836 if (MEM_P (target))
2837 sibcall_failure = 1;
2839 else if (TYPE_MODE (TREE_TYPE (exp)) == BLKmode)
2841 target = copy_blkmode_from_reg (target, valreg, TREE_TYPE (exp));
2843 /* We can not support sibling calls for this case. */
2844 sibcall_failure = 1;
2846 else
2848 if (shift_returned_value (TREE_TYPE (exp), &valreg))
2849 sibcall_failure = 1;
2851 target = copy_to_reg (valreg);
2854 if (targetm.calls.promote_function_return(funtype))
2856 /* If we promoted this return value, make the proper SUBREG.
2857 TARGET might be const0_rtx here, so be careful. */
2858 if (REG_P (target)
2859 && TYPE_MODE (TREE_TYPE (exp)) != BLKmode
2860 && GET_MODE (target) != TYPE_MODE (TREE_TYPE (exp)))
2862 tree type = TREE_TYPE (exp);
2863 int unsignedp = TYPE_UNSIGNED (type);
2864 int offset = 0;
2865 enum machine_mode pmode;
2867 pmode = promote_mode (type, TYPE_MODE (type), &unsignedp, 1);
2868 /* If we don't promote as expected, something is wrong. */
2869 gcc_assert (GET_MODE (target) == pmode);
2871 if ((WORDS_BIG_ENDIAN || BYTES_BIG_ENDIAN)
2872 && (GET_MODE_SIZE (GET_MODE (target))
2873 > GET_MODE_SIZE (TYPE_MODE (type))))
2875 offset = GET_MODE_SIZE (GET_MODE (target))
2876 - GET_MODE_SIZE (TYPE_MODE (type));
2877 if (! BYTES_BIG_ENDIAN)
2878 offset = (offset / UNITS_PER_WORD) * UNITS_PER_WORD;
2879 else if (! WORDS_BIG_ENDIAN)
2880 offset %= UNITS_PER_WORD;
2882 target = gen_rtx_SUBREG (TYPE_MODE (type), target, offset);
2883 SUBREG_PROMOTED_VAR_P (target) = 1;
2884 SUBREG_PROMOTED_UNSIGNED_SET (target, unsignedp);
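/* Worked example of the offset above: on a target where both
   WORDS_BIG_ENDIAN and BYTES_BIG_ENDIAN hold and UNITS_PER_WORD == 8,
   an SImode value promoted to a DImode register gives
   offset = 8 - 4 = 4; neither endianness correction applies, so the
   SUBREG selects bytes 4..7, where the meaningful 32 bits of the
   promoted value live on a big-endian machine.  */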
2888 /* If size of args is variable or this was a constructor call for a stack
2889 argument, restore saved stack-pointer value. */
2891 if (old_stack_level && ! (flags & ECF_SP_DEPRESSED))
2893 emit_stack_restore (SAVE_BLOCK, old_stack_level, NULL_RTX);
2894 stack_pointer_delta = old_stack_pointer_delta;
2895 pending_stack_adjust = old_pending_adj;
2896 old_stack_allocated = stack_pointer_delta - pending_stack_adjust;
2897 stack_arg_under_construction = old_stack_arg_under_construction;
2898 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
2899 stack_usage_map = initial_stack_usage_map;
2900 sibcall_failure = 1;
2902 else if (ACCUMULATE_OUTGOING_ARGS && pass)
2904 #ifdef REG_PARM_STACK_SPACE
2905 if (save_area)
2906 restore_fixed_argument_area (save_area, argblock,
2907 high_to_save, low_to_save);
2908 #endif
2910 /* If we saved any argument areas, restore them. */
2911 for (i = 0; i < num_actuals; i++)
2912 if (args[i].save_area)
2914 enum machine_mode save_mode = GET_MODE (args[i].save_area);
2915 rtx stack_area
2916 = gen_rtx_MEM (save_mode,
2917 memory_address (save_mode,
2918 XEXP (args[i].stack_slot, 0)));
2920 if (save_mode != BLKmode)
2921 emit_move_insn (stack_area, args[i].save_area);
2922 else
2923 emit_block_move (stack_area, args[i].save_area,
2924 GEN_INT (args[i].locate.size.constant),
2925 BLOCK_OP_CALL_PARM);
2928 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
2929 stack_usage_map = initial_stack_usage_map;
2932 /* If this was alloca, record the new stack level for nonlocal gotos.
2933 Check for the handler slots since we might not have a save area
2934 for non-local gotos. */
2936 if ((flags & ECF_MAY_BE_ALLOCA) && cfun->nonlocal_goto_save_area != 0)
2937 update_nonlocal_goto_save_area ();
2939 /* Free up storage we no longer need. */
2940 for (i = 0; i < num_actuals; ++i)
2941 if (args[i].aligned_regs)
2942 free (args[i].aligned_regs);
2944 insns = get_insns ();
2945 end_sequence ();
2947 if (pass == 0)
2949 tail_call_insns = insns;
2951 /* Restore the pending stack adjustment now that we have
2952 finished generating the sibling call sequence. */
2954 pending_stack_adjust = save_pending_stack_adjust;
2955 stack_pointer_delta = save_stack_pointer_delta;
2957 /* Prepare arg structure for next iteration. */
2958 for (i = 0; i < num_actuals; i++)
2960 args[i].value = 0;
2961 args[i].aligned_regs = 0;
2962 args[i].stack = 0;
2965 sbitmap_free (stored_args_map);
2967 else
2969 normal_call_insns = insns;
2971 /* Verify that we've deallocated all the stack we used. */
2972 gcc_assert ((flags & (ECF_NORETURN | ECF_LONGJMP))
2973 || (old_stack_allocated
2974 == stack_pointer_delta - pending_stack_adjust));
2977 /* If something prevents making this a sibling call,
2978 zero out the sequence. */
2979 if (sibcall_failure)
2980 tail_call_insns = NULL_RTX;
2981 else
2982 break;
2985 /* If tail call production succeeded, we need to remove REG_EQUIV notes on
2986 arguments too, as the argument area is now clobbered by the call. */
2987 if (tail_call_insns)
2989 emit_insn (tail_call_insns);
2990 cfun->tail_call_emit = true;
2992 else
2993 emit_insn (normal_call_insns);
2995 currently_expanding_call--;
2997 /* If this function returns with the stack pointer depressed, ensure
2998 this block saves and restores the stack pointer, show it was
2999 changed, and adjust for any outgoing arg space. */
3000 if (flags & ECF_SP_DEPRESSED)
3002 clear_pending_stack_adjust ();
3003 emit_insn (gen_rtx_CLOBBER (VOIDmode, stack_pointer_rtx));
3004 emit_move_insn (virtual_stack_dynamic_rtx, stack_pointer_rtx);
3007 return target;
3010 /* A sibling call sequence invalidates any REG_EQUIV notes made for
3011 this function's incoming arguments.
3013 At the start of RTL generation we know the only REG_EQUIV notes
3014 in the rtl chain are those for incoming arguments, so we can safely
3015 flush any REG_EQUIV note.
3017 This is (slight) overkill. We could keep track of the highest
3018 argument we clobber and be more selective in removing notes, but it
3019 does not seem to be worth the effort. */
3020 void
3021 fixup_tail_calls (void)
3023 purge_reg_equiv_notes ();
3026 /* Traverse an argument list in VALUES and expand all complex
3027 arguments into their components. */
3028 static tree
3029 split_complex_values (tree values)
3031 tree p;
3033 /* Before allocating memory, check for the common case of no complex. */
3034 for (p = values; p; p = TREE_CHAIN (p))
3036 tree type = TREE_TYPE (TREE_VALUE (p));
3037 if (type && TREE_CODE (type) == COMPLEX_TYPE
3038 && targetm.calls.split_complex_arg (type))
3039 goto found;
3041 return values;
3043 found:
3044 values = copy_list (values);
3046 for (p = values; p; p = TREE_CHAIN (p))
3048 tree complex_value = TREE_VALUE (p);
3049 tree complex_type;
3051 complex_type = TREE_TYPE (complex_value);
3052 if (!complex_type)
3053 continue;
3055 if (TREE_CODE (complex_type) == COMPLEX_TYPE
3056 && targetm.calls.split_complex_arg (complex_type))
3058 tree subtype;
3059 tree real, imag, next;
3061 subtype = TREE_TYPE (complex_type);
3062 complex_value = save_expr (complex_value);
3063 real = build1 (REALPART_EXPR, subtype, complex_value);
3064 imag = build1 (IMAGPART_EXPR, subtype, complex_value);
3066 TREE_VALUE (p) = real;
3067 next = TREE_CHAIN (p);
3068 imag = build_tree_list (NULL_TREE, imag);
3069 TREE_CHAIN (p) = imag;
3070 TREE_CHAIN (imag) = next;
3072 /* Skip the newly created node. */
3073 p = TREE_CHAIN (p);
3077 return values;
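/* Example of the rewrite above: an argument list holding one value C of
   type _Complex double becomes

     (REALPART_EXPR <C'>, IMAGPART_EXPR <C'>)   with C' = save_expr (C)

   so the complex operand is evaluated once and then passed as two
   DFmode scalars in consecutive argument positions.  */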
3080 /* Traverse a list of TYPES and expand all complex types into their
3081 components. */
3082 static tree
3083 split_complex_types (tree types)
3085 tree p;
3087 /* Before allocating memory, check for the common case of no complex. */
3088 for (p = types; p; p = TREE_CHAIN (p))
3090 tree type = TREE_VALUE (p);
3091 if (TREE_CODE (type) == COMPLEX_TYPE
3092 && targetm.calls.split_complex_arg (type))
3093 goto found;
3095 return types;
3097 found:
3098 types = copy_list (types);
3100 for (p = types; p; p = TREE_CHAIN (p))
3102 tree complex_type = TREE_VALUE (p);
3104 if (TREE_CODE (complex_type) == COMPLEX_TYPE
3105 && targetm.calls.split_complex_arg (complex_type))
3107 tree next, imag;
3109 /* Rewrite complex type with component type. */
3110 TREE_VALUE (p) = TREE_TYPE (complex_type);
3111 next = TREE_CHAIN (p);
3113 /* Add another component type for the imaginary part. */
3114 imag = build_tree_list (NULL_TREE, TREE_VALUE (p));
3115 TREE_CHAIN (p) = imag;
3116 TREE_CHAIN (imag) = next;
3118 /* Skip the newly created node. */
3119 p = TREE_CHAIN (p);
3123 return types;
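/* Example of the rewrite above: the type list
   (_Complex float, void) becomes (float, float, void); each complex
   entry is replaced in place by its component type, and one extra node
   for the imaginary part is spliced in after it.  */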
3126 /* Output a library call to function FUN (a SYMBOL_REF rtx).
3127 The RETVAL parameter specifies whether the return value needs to be saved;
3128 the other parameters are documented in the emit_library_call function below. */
3130 static rtx
3131 emit_library_call_value_1 (int retval, rtx orgfun, rtx value,
3132 enum libcall_type fn_type,
3133 enum machine_mode outmode, int nargs, va_list p)
3135 /* Total size in bytes of all the stack-parms scanned so far. */
3136 struct args_size args_size;
3137 /* Size of arguments before any adjustments (such as rounding). */
3138 struct args_size original_args_size;
3139 int argnum;
3140 rtx fun;
3141 int inc;
3142 int count;
3143 rtx argblock = 0;
3144 CUMULATIVE_ARGS args_so_far;
3145 struct arg
3147 rtx value;
3148 enum machine_mode mode;
3149 rtx reg;
3150 int partial;
3151 struct locate_and_pad_arg_data locate;
3152 rtx save_area;
3154 struct arg *argvec;
3155 int old_inhibit_defer_pop = inhibit_defer_pop;
3156 rtx call_fusage = 0;
3157 rtx mem_value = 0;
3158 rtx valreg;
3159 int pcc_struct_value = 0;
3160 int struct_value_size = 0;
3161 int flags;
3162 int reg_parm_stack_space = 0;
3163 int needed;
3164 rtx before_call;
3165 tree tfom; /* type_for_mode (outmode, 0) */
3167 #ifdef REG_PARM_STACK_SPACE
3168 /* Define the boundary of the register parm stack space that needs to be
3169 saved, if any. */
3170 int low_to_save, high_to_save;
3171 rtx save_area = 0; /* Place that it is saved. */
3172 #endif
3174 /* Record the initial extent of the stack usage map, so it can be restored. */
3175 int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
3176 char *initial_stack_usage_map = stack_usage_map;
3178 rtx struct_value = targetm.calls.struct_value_rtx (0, 0);
3180 #ifdef REG_PARM_STACK_SPACE
3181 reg_parm_stack_space = REG_PARM_STACK_SPACE ((tree) 0);
3182 #endif
3184 /* By default, library functions can not throw. */
3185 flags = ECF_NOTHROW;
3187 switch (fn_type)
3189 case LCT_NORMAL:
3190 break;
3191 case LCT_CONST:
3192 flags |= ECF_CONST;
3193 break;
3194 case LCT_PURE:
3195 flags |= ECF_PURE;
3196 break;
3197 case LCT_CONST_MAKE_BLOCK:
3198 flags |= ECF_CONST | ECF_LIBCALL_BLOCK;
3199 break;
3200 case LCT_PURE_MAKE_BLOCK:
3201 flags |= ECF_PURE | ECF_LIBCALL_BLOCK;
3202 break;
3203 case LCT_NORETURN:
3204 flags |= ECF_NORETURN;
3205 break;
3206 case LCT_THROW:
3207 flags = ECF_NORETURN;
3208 break;
3209 case LCT_ALWAYS_RETURN:
3210 flags = ECF_ALWAYS_RETURN;
3211 break;
3212 case LCT_RETURNS_TWICE:
3213 flags = ECF_RETURNS_TWICE;
3214 break;
3216 fun = orgfun;
3218 /* Ensure current function's preferred stack boundary is at least
3219 what we need. */
3220 if (cfun->preferred_stack_boundary < PREFERRED_STACK_BOUNDARY)
3221 cfun->preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
3223 /* If this kind of value comes back in memory,
3224 decide where in memory it should come back. */
3225 if (outmode != VOIDmode)
3227 tfom = lang_hooks.types.type_for_mode (outmode, 0);
3228 if (aggregate_value_p (tfom, 0))
3230 #ifdef PCC_STATIC_STRUCT_RETURN
3231 rtx pointer_reg
3232 = hard_function_value (build_pointer_type (tfom), 0, 0);
3233 mem_value = gen_rtx_MEM (outmode, pointer_reg);
3234 pcc_struct_value = 1;
3235 if (value == 0)
3236 value = gen_reg_rtx (outmode);
3237 #else /* not PCC_STATIC_STRUCT_RETURN */
3238 struct_value_size = GET_MODE_SIZE (outmode);
3239 if (value != 0 && MEM_P (value))
3240 mem_value = value;
3241 else
3242 mem_value = assign_temp (tfom, 0, 1, 1);
3243 #endif
3244 /* This call returns a big structure. */
3245 flags &= ~(ECF_CONST | ECF_PURE | ECF_LIBCALL_BLOCK);
3248 else
3249 tfom = void_type_node;
3251 /* ??? Unfinished: must pass the memory address as an argument. */
3253 /* Copy all the libcall-arguments out of the varargs data
3254 and into a vector ARGVEC.
3256 Compute how to pass each argument. We only support a very small subset
3257 of the full argument passing conventions to limit complexity here since
3258 library functions shouldn't have many args. */
3260 argvec = alloca ((nargs + 1) * sizeof (struct arg));
3261 memset (argvec, 0, (nargs + 1) * sizeof (struct arg));
3263 #ifdef INIT_CUMULATIVE_LIBCALL_ARGS
3264 INIT_CUMULATIVE_LIBCALL_ARGS (args_so_far, outmode, fun);
3265 #else
3266 INIT_CUMULATIVE_ARGS (args_so_far, NULL_TREE, fun, 0, nargs);
3267 #endif
3269 args_size.constant = 0;
3270 args_size.var = 0;
3272 count = 0;
3274 /* Now we are about to start emitting insns that can be deleted
3275 if a libcall is deleted. */
3276 if (flags & ECF_LIBCALL_BLOCK)
3277 start_sequence ();
3279 push_temp_slots ();
3281 /* If there's a structure value address to be passed,
3282 either pass it in the special place, or pass it as an extra argument. */
3283 if (mem_value && struct_value == 0 && ! pcc_struct_value)
3285 rtx addr = XEXP (mem_value, 0);
3286 int partial;
3288 nargs++;
3290 /* Make sure it is a reasonable operand for a move or push insn. */
3291 if (!REG_P (addr) && !MEM_P (addr)
3292 && ! (CONSTANT_P (addr) && LEGITIMATE_CONSTANT_P (addr)))
3293 addr = force_operand (addr, NULL_RTX);
3295 argvec[count].value = addr;
3296 argvec[count].mode = Pmode;
3297 argvec[count].partial = 0;
3299 argvec[count].reg = FUNCTION_ARG (args_so_far, Pmode, NULL_TREE, 1);
3300 partial = FUNCTION_ARG_PARTIAL_NREGS (args_so_far, Pmode, NULL_TREE, 1);
3301 gcc_assert (!partial);
3303 locate_and_pad_parm (Pmode, NULL_TREE,
3304 #ifdef STACK_PARMS_IN_REG_PARM_AREA
3305 1,
3306 #else
3307 argvec[count].reg != 0,
3308 #endif
3309 0, NULL_TREE, &args_size, &argvec[count].locate);
3311 if (argvec[count].reg == 0 || argvec[count].partial != 0
3312 || reg_parm_stack_space > 0)
3313 args_size.constant += argvec[count].locate.size.constant;
3315 FUNCTION_ARG_ADVANCE (args_so_far, Pmode, (tree) 0, 1);
3317 count++;
3320 for (; count < nargs; count++)
3322 rtx val = va_arg (p, rtx);
3323 enum machine_mode mode = va_arg (p, enum machine_mode);
3325 /* We cannot convert the arg value to the mode the library wants here;
3326 must do it earlier where we know the signedness of the arg. */
3327 gcc_assert (mode != BLKmode
3328 && (GET_MODE (val) == mode || GET_MODE (val) == VOIDmode));
3330 /* Make sure it is a reasonable operand for a move or push insn. */
3331 if (!REG_P (val) && !MEM_P (val)
3332 && ! (CONSTANT_P (val) && LEGITIMATE_CONSTANT_P (val)))
3333 val = force_operand (val, NULL_RTX);
3335 if (pass_by_reference (&args_so_far, mode, NULL_TREE, 1))
3337 rtx slot;
3338 int must_copy
3339 = !reference_callee_copied (&args_so_far, mode, NULL_TREE, 1);
3341 /* loop.c won't look at CALL_INSN_FUNCTION_USAGE of const/pure
3342 functions, so we have to pretend this isn't such a function. */
3343 if (flags & ECF_LIBCALL_BLOCK)
3345 rtx insns = get_insns ();
3346 end_sequence ();
3347 emit_insn (insns);
3349 flags &= ~(ECF_CONST | ECF_PURE | ECF_LIBCALL_BLOCK);
3351 /* If this was a CONST function, it is now PURE since
3352 it now reads memory. */
3353 if (flags & ECF_CONST)
3355 flags &= ~ECF_CONST;
3356 flags |= ECF_PURE;
3359 if (MEM_P (val) && !must_copy)
3360 slot = val;
3361 else
3363 slot = assign_temp (lang_hooks.types.type_for_mode (mode, 0),
3364 0, 1, 1);
3365 emit_move_insn (slot, val);
3368 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
3369 gen_rtx_USE (VOIDmode, slot),
3370 call_fusage);
3371 if (must_copy)
3372 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
3373 gen_rtx_CLOBBER (VOIDmode,
3374 slot),
3375 call_fusage);
3377 mode = Pmode;
3378 val = force_operand (XEXP (slot, 0), NULL_RTX);
3381 argvec[count].value = val;
3382 argvec[count].mode = mode;
3384 argvec[count].reg = FUNCTION_ARG (args_so_far, mode, NULL_TREE, 1);
3386 argvec[count].partial
3387 = FUNCTION_ARG_PARTIAL_NREGS (args_so_far, mode, NULL_TREE, 1);
3389 locate_and_pad_parm (mode, NULL_TREE,
3390 #ifdef STACK_PARMS_IN_REG_PARM_AREA
3391 1,
3392 #else
3393 argvec[count].reg != 0,
3394 #endif
3395 argvec[count].partial,
3396 NULL_TREE, &args_size, &argvec[count].locate);
3398 gcc_assert (!argvec[count].locate.size.var);
3400 if (argvec[count].reg == 0 || argvec[count].partial != 0
3401 || reg_parm_stack_space > 0)
3402 args_size.constant += argvec[count].locate.size.constant;
3404 FUNCTION_ARG_ADVANCE (args_so_far, mode, (tree) 0, 1);
3407 /* If this machine requires an external definition for library
3408 functions, write one out. */
3409 assemble_external_libcall (fun);
3411 original_args_size = args_size;
3412 args_size.constant = (((args_size.constant
3413 + stack_pointer_delta
3414 + STACK_BYTES - 1)
3415 / STACK_BYTES
3416 * STACK_BYTES)
3417 - stack_pointer_delta);
3419 args_size.constant = MAX (args_size.constant,
3420 reg_parm_stack_space);
3422 #ifndef OUTGOING_REG_PARM_STACK_SPACE
3423 args_size.constant -= reg_parm_stack_space;
3424 #endif
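/* Worked example of the rounding above, assuming STACK_BYTES == 16,
   reg_parm_stack_space == 0 (so the MAX and the subtraction leave the
   value unchanged), stack_pointer_delta == 4 and 10 bytes of argument
   data: ((10 + 4 + 16 - 1) / 16) * 16 - 4 = 12, so two bytes of
   padding are added and the stack pointer is 16-byte aligned at the
   call itself.  */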
3426 if (args_size.constant > current_function_outgoing_args_size)
3427 current_function_outgoing_args_size = args_size.constant;
3429 if (ACCUMULATE_OUTGOING_ARGS)
3431 /* Since the stack pointer will never be pushed, it is possible for
3432 the evaluation of a parm to clobber something we have already
3433 written to the stack. Since most function calls on RISC machines
3434 do not use the stack, this is uncommon, but must work correctly.
3436 Therefore, we save any area of the stack that was already written
3437 and that we are using. Here we set up to do this by making a new
3438 stack usage map from the old one.
3440 Another approach might be to try to reorder the argument
3441 evaluations to avoid this conflicting stack usage. */
3443 needed = args_size.constant;
3445 #ifndef OUTGOING_REG_PARM_STACK_SPACE
3446 /* Since we will be writing into the entire argument area, the
3447 map must be allocated for its entire size, not just the part that
3448 is the responsibility of the caller. */
3449 needed += reg_parm_stack_space;
3450 #endif
3452 #ifdef ARGS_GROW_DOWNWARD
3453 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
3454 needed + 1);
3455 #else
3456 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
3457 needed);
3458 #endif
3459 stack_usage_map = alloca (highest_outgoing_arg_in_use);
3461 if (initial_highest_arg_in_use)
3462 memcpy (stack_usage_map, initial_stack_usage_map,
3463 initial_highest_arg_in_use);
3465 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
3466 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
3467 highest_outgoing_arg_in_use - initial_highest_arg_in_use);
3468 needed = 0;
3470 /* We must be careful to use virtual regs before they're instantiated,
3471 and real regs afterwards. Loop optimization, for example, can create
3472 new libcalls after we've instantiated the virtual regs, and if we
3473 use virtuals anyway, they won't match the rtl patterns. */
3475 if (virtuals_instantiated)
3476 argblock = plus_constant (stack_pointer_rtx, STACK_POINTER_OFFSET);
3477 else
3478 argblock = virtual_outgoing_args_rtx;
3480 else
3482 if (!PUSH_ARGS)
3483 argblock = push_block (GEN_INT (args_size.constant), 0, 0);
3486 /* If we push args individually in reverse order, perform stack alignment
3487 before the first push (the last arg). */
3488 if (argblock == 0 && PUSH_ARGS_REVERSED)
3489 anti_adjust_stack (GEN_INT (args_size.constant
3490 - original_args_size.constant));
3492 if (PUSH_ARGS_REVERSED)
3494 inc = -1;
3495 argnum = nargs - 1;
3497 else
3499 inc = 1;
3500 argnum = 0;
3503 #ifdef REG_PARM_STACK_SPACE
3504 if (ACCUMULATE_OUTGOING_ARGS)
3506 /* The argument list is the property of the called routine and it
3507 may clobber it. If the fixed area has been used for previous
3508 parameters, we must save and restore it. */
3509 save_area = save_fixed_argument_area (reg_parm_stack_space, argblock,
3510 &low_to_save, &high_to_save);
3512 #endif
3514 /* Push the args that need to be pushed. */
3516 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
3517 are to be pushed. */
3518 for (count = 0; count < nargs; count++, argnum += inc)
3520 enum machine_mode mode = argvec[argnum].mode;
3521 rtx val = argvec[argnum].value;
3522 rtx reg = argvec[argnum].reg;
3523 int partial = argvec[argnum].partial;
3524 int lower_bound = 0, upper_bound = 0, i;
3526 if (! (reg != 0 && partial == 0))
3528 if (ACCUMULATE_OUTGOING_ARGS)
3530 /* If this is being stored into a pre-allocated, fixed-size,
3531 stack area, save any previous data at that location. */
3533 #ifdef ARGS_GROW_DOWNWARD
3534 /* stack_slot is negative, but we want to index stack_usage_map
3535 with positive values. */
3536 upper_bound = -argvec[argnum].locate.offset.constant + 1;
3537 lower_bound = upper_bound - argvec[argnum].locate.size.constant;
3538 #else
3539 lower_bound = argvec[argnum].locate.offset.constant;
3540 upper_bound = lower_bound + argvec[argnum].locate.size.constant;
3541 #endif
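/* Illustrative values for the ARGS_GROW_DOWNWARD case: an argument
   with locate.offset.constant == -8 and locate.size.constant == 4
   occupies addresses -8 through -5, giving upper_bound == 9 and
   lower_bound == 5, i.e. stack_usage_map[5..8].  */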
3543 i = lower_bound;
3544 /* Don't worry about things in the fixed argument area;
3545 it has already been saved. */
3546 if (i < reg_parm_stack_space)
3547 i = reg_parm_stack_space;
3548 while (i < upper_bound && stack_usage_map[i] == 0)
3549 i++;
3551 if (i < upper_bound)
3553 /* We need to make a save area. */
3554 unsigned int size
3555 = argvec[argnum].locate.size.constant * BITS_PER_UNIT;
3556 enum machine_mode save_mode
3557 = mode_for_size (size, MODE_INT, 1);
3558 rtx adr
3559 = plus_constant (argblock,
3560 argvec[argnum].locate.offset.constant);
3561 rtx stack_area
3562 = gen_rtx_MEM (save_mode, memory_address (save_mode, adr));
3564 if (save_mode == BLKmode)
3566 argvec[argnum].save_area
3567 = assign_stack_temp (BLKmode,
3568 argvec[argnum].locate.size.constant,
3569 0);
3571 emit_block_move (validize_mem (argvec[argnum].save_area),
3572 stack_area,
3573 GEN_INT (argvec[argnum].locate.size.constant),
3574 BLOCK_OP_CALL_PARM);
3576 else
3578 argvec[argnum].save_area = gen_reg_rtx (save_mode);
3580 emit_move_insn (argvec[argnum].save_area, stack_area);
3585 emit_push_insn (val, mode, NULL_TREE, NULL_RTX, PARM_BOUNDARY,
3586 partial, reg, 0, argblock,
3587 GEN_INT (argvec[argnum].locate.offset.constant),
3588 reg_parm_stack_space,
3589 ARGS_SIZE_RTX (argvec[argnum].locate.alignment_pad));
3591 /* Now mark the segment we just used. */
3592 if (ACCUMULATE_OUTGOING_ARGS)
3593 for (i = lower_bound; i < upper_bound; i++)
3594 stack_usage_map[i] = 1;
3596 NO_DEFER_POP;
3600 /* If we pushed args in forward order, perform stack alignment
3601 after pushing the last arg. */
3602 if (argblock == 0 && !PUSH_ARGS_REVERSED)
3603 anti_adjust_stack (GEN_INT (args_size.constant
3604 - original_args_size.constant));
3606 if (PUSH_ARGS_REVERSED)
3607 argnum = nargs - 1;
3608 else
3609 argnum = 0;
3611 fun = prepare_call_address (fun, NULL, &call_fusage, 0, 0);
3613 /* Now load any reg parms into their regs. */
3615 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
3616 are to be pushed. */
3617 for (count = 0; count < nargs; count++, argnum += inc)
3619 enum machine_mode mode = argvec[argnum].mode;
3620 rtx val = argvec[argnum].value;
3621 rtx reg = argvec[argnum].reg;
3622 int partial = argvec[argnum].partial;
3624 /* Handle calls that pass values in multiple non-contiguous
3625 locations. The PA64 has examples of this for library calls. */
3626 if (reg != 0 && GET_CODE (reg) == PARALLEL)
3627 emit_group_load (reg, val, NULL_TREE, GET_MODE_SIZE (mode));
3628 else if (reg != 0 && partial == 0)
3629 emit_move_insn (reg, val);
3631 NO_DEFER_POP;
3634 /* Any regs containing parms remain in use through the call. */
3635 for (count = 0; count < nargs; count++)
3637 rtx reg = argvec[count].reg;
3638 if (reg != 0 && GET_CODE (reg) == PARALLEL)
3639 use_group_regs (&call_fusage, reg);
3640 else if (reg != 0)
3641 use_reg (&call_fusage, reg);
3644 /* Pass the function the address in which to return a structure value. */
3645 if (mem_value != 0 && struct_value != 0 && ! pcc_struct_value)
3647 emit_move_insn (struct_value,
3648 force_reg (Pmode,
3649 force_operand (XEXP (mem_value, 0),
3650 NULL_RTX)));
3651 if (REG_P (struct_value))
3652 use_reg (&call_fusage, struct_value);
3655 /* Don't allow popping to be deferred, since then
3656 cse'ing of library calls could delete a call and leave the pop. */
3657 NO_DEFER_POP;
3658 valreg = (mem_value == 0 && outmode != VOIDmode
3659 ? hard_libcall_value (outmode) : NULL_RTX);
3661 /* Stack must be properly aligned now. */
3662 gcc_assert (!(stack_pointer_delta
3663 & (PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT - 1)));
3665 before_call = get_last_insn ();
3667 /* We pass the old value of inhibit_defer_pop + 1 to emit_call_1, which
3668 will set inhibit_defer_pop to that value. */
3669 /* The return type is needed to decide how many bytes the function pops.
3670 Signedness plays no role in that, so for simplicity, we pretend it's
3671 always signed. We also assume that the list of arguments passed has
3672 no impact, so we pretend it is unknown. */
3674 emit_call_1 (fun, NULL,
3675 get_identifier (XSTR (orgfun, 0)),
3676 build_function_type (tfom, NULL_TREE),
3677 original_args_size.constant, args_size.constant,
3678 struct_value_size,
3679 FUNCTION_ARG (args_so_far, VOIDmode, void_type_node, 1),
3680 valreg,
3681 old_inhibit_defer_pop + 1, call_fusage, flags, & args_so_far);
3683 /* For calls to `setjmp', etc., inform flow.c it should complain
3684 if nonvolatile values are live. For functions that cannot return,
3685 inform flow that control does not fall through. */
3687 if (flags & (ECF_NORETURN | ECF_LONGJMP))
3689 /* The barrier must be emitted
3690 immediately after the CALL_INSN. Some ports emit more than
3691 just a CALL_INSN above, so we must search for it here. */
3693 rtx last = get_last_insn ();
3694 while (!CALL_P (last))
3696 last = PREV_INSN (last);
3697 /* There was no CALL_INSN? */
3698 gcc_assert (last != before_call);
3701 emit_barrier_after (last);
3704 /* Now restore inhibit_defer_pop to its actual original value. */
3705 OK_DEFER_POP;
3707 /* If call is cse'able, make appropriate pair of reg-notes around it.
3708 Test valreg so we don't crash; may safely ignore `const'
3709 if return type is void. Disable for PARALLEL return values, because
3710 we have no way to move such values into a pseudo register. */
3711 if (flags & ECF_LIBCALL_BLOCK)
3713 rtx insns;
3715 if (valreg == 0)
3717 insns = get_insns ();
3718 end_sequence ();
3719 emit_insn (insns);
3721 else
3723 rtx note = 0;
3724 rtx temp;
3725 int i;
3727 if (GET_CODE (valreg) == PARALLEL)
3729 temp = gen_reg_rtx (outmode);
3730 emit_group_store (temp, valreg, NULL_TREE,
3731 GET_MODE_SIZE (outmode));
3732 valreg = temp;
3735 temp = gen_reg_rtx (GET_MODE (valreg));
3737 /* Construct an "equal form" for the value which mentions all the
3738 arguments in order as well as the function name. */
3739 for (i = 0; i < nargs; i++)
3740 note = gen_rtx_EXPR_LIST (VOIDmode, argvec[i].value, note);
3741 note = gen_rtx_EXPR_LIST (VOIDmode, fun, note);
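/* For two arguments this builds, illustratively,
   (expr_list FUN (expr_list ARG1 (expr_list ARG0 nil))), which
   emit_libcall_block attaches as a REG_EQUAL note so that CSE can
   recognize repeated libcalls with the same operands.  */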
3743 insns = get_insns ();
3744 end_sequence ();
3746 if (flags & ECF_PURE)
3747 note = gen_rtx_EXPR_LIST (VOIDmode,
3748 gen_rtx_USE (VOIDmode,
3749 gen_rtx_MEM (BLKmode,
3750 gen_rtx_SCRATCH (VOIDmode))),
3751 note);
3753 emit_libcall_block (insns, temp, valreg, note);
3755 valreg = temp;
3758 pop_temp_slots ();
3760 /* Copy the value to the right place. */
3761 if (outmode != VOIDmode && retval)
3763 if (mem_value)
3765 if (value == 0)
3766 value = mem_value;
3767 if (value != mem_value)
3768 emit_move_insn (value, mem_value);
3770 else if (GET_CODE (valreg) == PARALLEL)
3772 if (value == 0)
3773 value = gen_reg_rtx (outmode);
3774 emit_group_store (value, valreg, NULL_TREE, GET_MODE_SIZE (outmode));
3776 else if (value != 0)
3777 emit_move_insn (value, valreg);
3778 else
3779 value = valreg;
3782 if (ACCUMULATE_OUTGOING_ARGS)
3784 #ifdef REG_PARM_STACK_SPACE
3785 if (save_area)
3786 restore_fixed_argument_area (save_area, argblock,
3787 high_to_save, low_to_save);
3788 #endif
3790 /* If we saved any argument areas, restore them. */
3791 for (count = 0; count < nargs; count++)
3792 if (argvec[count].save_area)
3794 enum machine_mode save_mode = GET_MODE (argvec[count].save_area);
3795 rtx adr = plus_constant (argblock,
3796 argvec[count].locate.offset.constant);
3797 rtx stack_area = gen_rtx_MEM (save_mode,
3798 memory_address (save_mode, adr));
3800 if (save_mode == BLKmode)
3801 emit_block_move (stack_area,
3802 validize_mem (argvec[count].save_area),
3803 GEN_INT (argvec[count].locate.size.constant),
3804 BLOCK_OP_CALL_PARM);
3805 else
3806 emit_move_insn (stack_area, argvec[count].save_area);
3809 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
3810 stack_usage_map = initial_stack_usage_map;
3813 return value;
3817 /* Output a library call to function FUN (a SYMBOL_REF rtx)
3819 for a value of mode OUTMODE,
3820 with NARGS different arguments, passed as alternating rtx values
3821 and machine_modes to convert them to.
3823 FN_TYPE should be LCT_NORMAL for `normal' calls, LCT_CONST for `const'
3824 calls, LCT_PURE for `pure' calls, LCT_CONST_MAKE_BLOCK for `const' calls
3825 which should be enclosed in REG_LIBCALL/REG_RETVAL notes,
3826 LCT_PURE_MAKE_BLOCK for `pure' calls which should be enclosed in
3827 REG_LIBCALL/REG_RETVAL notes with an extra (use (memory (scratch))),
3828 or other LCT_ value for other types of library calls. */
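/* A typical call, with hypothetical operands OP0 and OP1 (the
   libfunc rtx would normally come from the optab tables):

     emit_library_call (libfunc, LCT_NORMAL, VOIDmode,
                        2, op0, SImode, op1, SImode);

   that is, NARGS pairs, each an rtx value followed by the mode to
   convert it to.  */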
3830 void
3831 emit_library_call (rtx orgfun, enum libcall_type fn_type,
3832 enum machine_mode outmode, int nargs, ...)
3834 va_list p;
3836 va_start (p, nargs);
3837 emit_library_call_value_1 (0, orgfun, NULL_RTX, fn_type, outmode, nargs, p);
3838 va_end (p);
3841 /* Like emit_library_call except that an extra argument, VALUE,
3842 comes second and says where to store the result.
3843 (If VALUE is zero, this function chooses a convenient way
3844 to return the value.)
3846 This function returns an rtx for where the value is to be found.
3847 If VALUE is nonzero, VALUE is returned. */
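/* A sketch with hypothetical operands; passing NULL_RTX for VALUE
   lets this function choose where the result lives:

     result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
                                       SImode, 2,
                                       op0, SImode, op1, SImode);  */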
3849 rtx
3850 emit_library_call_value (rtx orgfun, rtx value,
3851 enum libcall_type fn_type,
3852 enum machine_mode outmode, int nargs, ...)
3854 rtx result;
3855 va_list p;
3857 va_start (p, nargs);
3858 result = emit_library_call_value_1 (1, orgfun, value, fn_type, outmode,
3859 nargs, p);
3860 va_end (p);
3862 return result;
3865 /* Store a single argument for a function call
3866 into the register or memory area where it must be passed.
3867 *ARG describes the argument value and where to pass it.
3869 ARGBLOCK is the address of the stack-block for all the arguments,
3870 or 0 on a machine where arguments are pushed individually.
3872 ECF_MAY_BE_ALLOCA in FLAGS says this could be a call to `alloca',
3873 so we must be careful about how the stack is used.
3875 VARIABLE_SIZE nonzero says that this was a variable-sized outgoing
3876 argument stack. When ACCUMULATE_OUTGOING_ARGS, this indicates
3877 that we need not worry about saving and restoring the stack.
3881 Return nonzero if this arg should cause sibcall failure,
3882 zero otherwise. */
3884 static int
3885 store_one_arg (struct arg_data *arg, rtx argblock, int flags,
3886 int variable_size ATTRIBUTE_UNUSED, int reg_parm_stack_space)
3888 tree pval = arg->tree_value;
3889 rtx reg = 0;
3890 int partial = 0;
3891 int used = 0;
3892 int i, lower_bound = 0, upper_bound = 0;
3893 int sibcall_failure = 0;
3895 if (TREE_CODE (pval) == ERROR_MARK)
3896 return 1;
3898 /* Push a new temporary level for any temporaries we make for
3899 this argument. */
3900 push_temp_slots ();
3902 if (ACCUMULATE_OUTGOING_ARGS && !(flags & ECF_SIBCALL))
3904 /* If this is being stored into a pre-allocated, fixed-size, stack area,
3905 save any previous data at that location. */
3906 if (argblock && ! variable_size && arg->stack)
3908 #ifdef ARGS_GROW_DOWNWARD
3909 /* stack_slot is negative, but we want to index stack_usage_map
3910 with positive values. */
3911 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
3912 upper_bound = -INTVAL (XEXP (XEXP (arg->stack_slot, 0), 1)) + 1;
3913 else
3914 upper_bound = 0;
3916 lower_bound = upper_bound - arg->locate.size.constant;
3917 #else
3918 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
3919 lower_bound = INTVAL (XEXP (XEXP (arg->stack_slot, 0), 1));
3920 else
3921 lower_bound = 0;
3923 upper_bound = lower_bound + arg->locate.size.constant;
3924 #endif
3926 i = lower_bound;
3927 /* Don't worry about things in the fixed argument area;
3928 it has already been saved. */
3929 if (i < reg_parm_stack_space)
3930 i = reg_parm_stack_space;
3931 while (i < upper_bound && stack_usage_map[i] == 0)
3932 i++;
3934 if (i < upper_bound)
3936 /* We need to make a save area. */
3937 unsigned int size = arg->locate.size.constant * BITS_PER_UNIT;
3938 enum machine_mode save_mode = mode_for_size (size, MODE_INT, 1);
3939 rtx adr = memory_address (save_mode, XEXP (arg->stack_slot, 0));
3940 rtx stack_area = gen_rtx_MEM (save_mode, adr);
3942 if (save_mode == BLKmode)
3944 tree ot = TREE_TYPE (arg->tree_value);
3945 tree nt = build_qualified_type (ot, (TYPE_QUALS (ot)
3946 | TYPE_QUAL_CONST));
3948 arg->save_area = assign_temp (nt, 0, 1, 1);
3949 preserve_temp_slots (arg->save_area);
3950 emit_block_move (validize_mem (arg->save_area), stack_area,
3951 expr_size (arg->tree_value),
3952 BLOCK_OP_CALL_PARM);
3954 else
3956 arg->save_area = gen_reg_rtx (save_mode);
3957 emit_move_insn (arg->save_area, stack_area);
3963 /* If this isn't going to be placed on both the stack and in registers,
3964 set up the register and number of words. */
3965 if (! arg->pass_on_stack)
3967 if (flags & ECF_SIBCALL)
3968 reg = arg->tail_call_reg;
3969 else
3970 reg = arg->reg;
3971 partial = arg->partial;
3974 /* An argument passed entirely in a register should never reach
3975 this function. */
3976 gcc_assert (reg == 0 || partial != 0);
3978 /* If this arg needs special alignment, don't load the registers
3979 here. */
3980 if (arg->n_aligned_regs != 0)
3981 reg = 0;
3983 /* If this is being passed partially in a register, we can't evaluate
3984 it directly into its stack slot. Otherwise, we can. */
3985 if (arg->value == 0)
3987 /* stack_arg_under_construction is nonzero if a function argument is
3988 being evaluated directly into the outgoing argument list and
3989 expand_call must take special action to preserve the argument list
3990 if it is called recursively.
3992 For scalar function arguments stack_usage_map is sufficient to
3993 determine which stack slots must be saved and restored. Scalar
3994 arguments in general have pass_on_stack == 0.
3996 If this argument is initialized by a function which takes the
3997 address of the argument (a C++ constructor or a C function
3998 returning a BLKmode structure), then stack_usage_map is
3999 insufficient and expand_call must push the stack around the
4000 function call. Such arguments have pass_on_stack == 1.
4002 Note that it is always safe to set stack_arg_under_construction,
4003 but this generates suboptimal code if set when not needed. */
4005 if (arg->pass_on_stack)
4006 stack_arg_under_construction++;
4008 arg->value = expand_expr (pval,
4009 (partial
4010 || TYPE_MODE (TREE_TYPE (pval)) != arg->mode)
4011 ? NULL_RTX : arg->stack,
4012 VOIDmode, EXPAND_STACK_PARM);
4014 /* If the mode doesn't agree (because we are promoting the object,
4015 or for any other reason), convert it now. */
4017 if (arg->mode != TYPE_MODE (TREE_TYPE (pval)))
4018 arg->value = convert_modes (arg->mode, TYPE_MODE (TREE_TYPE (pval)),
4019 arg->value, arg->unsignedp);
4021 if (arg->pass_on_stack)
4022 stack_arg_under_construction--;
4025 /* Don't allow anything left on stack from computation
4026 of argument to alloca. */
4027 if (flags & ECF_MAY_BE_ALLOCA)
4028 do_pending_stack_adjust ();
4030 if (arg->value == arg->stack)
4031 /* If the value is already in the stack slot, we are done. */
4032 ;
4033 else if (arg->mode != BLKmode)
4035 int size;
4037 /* Argument is a scalar, not entirely passed in registers.
4038 (If part is passed in registers, arg->partial says how much
4039 and emit_push_insn will take care of putting it there.)
4041 Push it, and if its size is less than the
4042 amount of space allocated to it,
4043 also bump stack pointer by the additional space.
4044 Note that in C the default argument promotions
4045 will prevent such mismatches. */
4047 size = GET_MODE_SIZE (arg->mode);
4048 /* Compute how much space the push instruction will push.
4049 On many machines, pushing a byte will advance the stack
4050 pointer by a halfword. */
4051 #ifdef PUSH_ROUNDING
4052 size = PUSH_ROUNDING (size);
4053 #endif
4054 used = size;
4056 /* Compute how much space the argument should get:
4057 round up to a multiple of the alignment for arguments. */
4058 if (none != FUNCTION_ARG_PADDING (arg->mode, TREE_TYPE (pval)))
4059 used = (((size + PARM_BOUNDARY / BITS_PER_UNIT - 1)
4060 / (PARM_BOUNDARY / BITS_PER_UNIT))
4061 * (PARM_BOUNDARY / BITS_PER_UNIT));
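/* Illustrative numbers: with PARM_BOUNDARY == 32 (4 bytes) and a
   2-byte scalar, size == 2 rounds up to used == 4, and emit_push_insn
   below is told to skip used - size == 2 bytes of padding.  */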
4063 /* This isn't already where we want it on the stack, so put it there.
4064 This can either be done with push or copy insns. */
4065 emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval), NULL_RTX,
4066 PARM_BOUNDARY, partial, reg, used - size, argblock,
4067 ARGS_SIZE_RTX (arg->locate.offset), reg_parm_stack_space,
4068 ARGS_SIZE_RTX (arg->locate.alignment_pad));
4070 /* Unless this is a partially-in-register argument, the argument is now
4071 in the stack. */
4072 if (partial == 0)
4073 arg->value = arg->stack;
4075 else
4077 /* BLKmode, at least partly to be pushed. */
4079 unsigned int parm_align;
4080 int excess;
4081 rtx size_rtx;
4083 /* Pushing a nonscalar.
4084 If part is passed in registers, PARTIAL says how much
4085 and emit_push_insn will take care of putting it there. */
4087 /* Round its size up to a multiple
4088 of the allocation unit for arguments. */
4090 if (arg->locate.size.var != 0)
4092 excess = 0;
4093 size_rtx = ARGS_SIZE_RTX (arg->locate.size);
4095 else
4097 /* PUSH_ROUNDING has no effect on us, because
4098 emit_push_insn for BLKmode is careful to avoid it. */
4099 if (reg && GET_CODE (reg) == PARALLEL)
4101 /* Use the size of the elt to compute excess. */
4102 rtx elt = XEXP (XVECEXP (reg, 0, 0), 0);
4103 excess = (arg->locate.size.constant
4104 - int_size_in_bytes (TREE_TYPE (pval))
4105 + partial * GET_MODE_SIZE (GET_MODE (elt)));
4107 else
4108 excess = (arg->locate.size.constant
4109 - int_size_in_bytes (TREE_TYPE (pval))
4110 + partial * UNITS_PER_WORD);
4111 size_rtx = expand_expr (size_in_bytes (TREE_TYPE (pval)),
4112 NULL_RTX, TYPE_MODE (sizetype), 0);
4115 /* Some types will require stricter alignment, which will be
4116 provided for elsewhere in argument layout. */
4117 parm_align = MAX (PARM_BOUNDARY, TYPE_ALIGN (TREE_TYPE (pval)));
4119 /* When an argument is padded down, the block is aligned to
4120 PARM_BOUNDARY, but the actual argument isn't. */
4121 if (FUNCTION_ARG_PADDING (arg->mode, TREE_TYPE (pval)) == downward)
4123 if (arg->locate.size.var)
4124 parm_align = BITS_PER_UNIT;
4125 else if (excess)
4127 unsigned int excess_align = (excess & -excess) * BITS_PER_UNIT;
4128 parm_align = MIN (parm_align, excess_align);
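/* (excess & -excess) isolates the lowest set bit, i.e. the largest
   power of two dividing EXCESS; e.g. excess == 12 gives 4 bytes,
   so a 32-bit bound on the padded-down argument's alignment.  */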
4132 if ((flags & ECF_SIBCALL) && MEM_P (arg->value))
4134 /* emit_push_insn might not work properly if arg->value and
4135 argblock + arg->locate.offset areas overlap. */
4136 rtx x = arg->value;
4137 int i = 0;
4139 if (XEXP (x, 0) == current_function_internal_arg_pointer
4140 || (GET_CODE (XEXP (x, 0)) == PLUS
4141 && XEXP (XEXP (x, 0), 0) ==
4142 current_function_internal_arg_pointer
4143 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT))
4145 if (XEXP (x, 0) != current_function_internal_arg_pointer)
4146 i = INTVAL (XEXP (XEXP (x, 0), 1));
4148 /* expand_call should ensure this. */
4149 gcc_assert (!arg->locate.offset.var
4150 && GET_CODE (size_rtx) == CONST_INT);
4152 if (arg->locate.offset.constant > i)
4154 if (arg->locate.offset.constant < i + INTVAL (size_rtx))
4155 sibcall_failure = 1;
4157 else if (arg->locate.offset.constant < i)
4159 if (i < arg->locate.offset.constant + INTVAL (size_rtx))
4160 sibcall_failure = 1;
4165 emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval), size_rtx,
4166 parm_align, partial, reg, excess, argblock,
4167 ARGS_SIZE_RTX (arg->locate.offset), reg_parm_stack_space,
4168 ARGS_SIZE_RTX (arg->locate.alignment_pad));
4170 /* Unless this is a partially-in-register argument, the argument is now
4171 in the stack.
4173 ??? Unlike the case above, in which we want the actual
4174 address of the data, so that we can load it directly into a
4175 register, here we want the address of the stack slot, so that
4176 it's properly aligned for word-by-word copying or something
4177 like that. It's not clear that this is always correct. */
4178 if (partial == 0)
4179 arg->value = arg->stack_slot;
4182 /* Mark all slots this store used. */
4183 if (ACCUMULATE_OUTGOING_ARGS && !(flags & ECF_SIBCALL)
4184 && argblock && ! variable_size && arg->stack)
4185 for (i = lower_bound; i < upper_bound; i++)
4186 stack_usage_map[i] = 1;
4188 /* Once we have pushed something, pops can't safely
4189 be deferred during the rest of the arguments. */
4190 NO_DEFER_POP;
4192 /* Free any temporary slots made in processing this argument. Show
4193 that we might have taken the address of something and pushed that
4194 as an operand. */
4195 preserve_temp_slots (NULL_RTX);
4196 free_temp_slots ();
4197 pop_temp_slots ();
4199 return sibcall_failure;
4202 /* Nonzero if we do not know how to pass TYPE solely in registers. */
4204 bool
4205 must_pass_in_stack_var_size (enum machine_mode mode ATTRIBUTE_UNUSED,
4206 tree type)
4208 if (!type)
4209 return false;
4211 /* If the type has variable size... */
4212 if (TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
4213 return true;
4215 /* If the type is marked as addressable (it is required
4216 to be constructed into the stack)... */
4217 if (TREE_ADDRESSABLE (type))
4218 return true;
4220 return false;
4223 /* Another version of the TARGET_MUST_PASS_IN_STACK hook. This one
4224 takes trailing padding of a structure into account. */
4225 /* ??? Should be able to merge these two by examining BLOCK_REG_PADDING. */
4227 bool
4228 must_pass_in_stack_var_size_or_pad (enum machine_mode mode, tree type)
4230 if (!type)
4231 return false;
4233 /* If the type has variable size... */
4234 if (TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
4235 return true;
4237 /* If the type is marked as addressable (it is required
4238 to be constructed into the stack)... */
4239 if (TREE_ADDRESSABLE (type))
4240 return true;
4242 /* If the padding and mode of the type are such that a copy into
4243 a register would put it into the wrong part of the register. */
4244 if (mode == BLKmode
4245 && int_size_in_bytes (type) % (PARM_BOUNDARY / BITS_PER_UNIT)
4246 && (FUNCTION_ARG_PADDING (mode, type)
4247 == (BYTES_BIG_ENDIAN ? upward : downward)))
4248 return true;
4250 return false;
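/* Illustrative case for the padding test above: a 6-byte BLKmode
   aggregate with PARM_BOUNDARY == 32 leaves a 2-byte remainder; if a
   big-endian target pads it upward, a register copy would place the
   data in the wrong part of the last register, so it must go on the
   stack.  */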