/* Convert function calls to rtl insns, for GNU C compiler.
   Copyright (C) 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998,
   1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007
   Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */

#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "tm.h"
#include "rtl.h"
#include "tree.h"
#include "flags.h"
#include "expr.h"
#include "optabs.h"
#include "libfuncs.h"
#include "function.h"
#include "regs.h"
#include "toplev.h"
#include "output.h"
#include "tm_p.h"
#include "timevar.h"
#include "sbitmap.h"
#include "langhooks.h"
#include "target.h"
#include "cgraph.h"
#include "except.h"
#include "dbgcnt.h"

/* Like PREFERRED_STACK_BOUNDARY but in units of bytes, not bits.  */
#define STACK_BYTES (PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT)
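
/* Worked example (illustrative, not from this file): on a target where
   PREFERRED_STACK_BOUNDARY is 128 bits and BITS_PER_UNIT is 8,
   STACK_BYTES evaluates to 128 / 8 == 16, i.e. outgoing argument
   blocks are rounded to 16-byte multiples.  */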

/* Data structure and subroutines used within expand_call.  */

struct arg_data
{
  /* Tree node for this argument.  */
  tree tree_value;
  /* Mode for value; TYPE_MODE unless promoted.  */
  enum machine_mode mode;
  /* Current RTL value for argument, or 0 if it isn't precomputed.  */
  rtx value;
  /* Initially-computed RTL value for argument; only for const functions.  */
  rtx initial_value;
  /* Register to pass this argument in, 0 if passed on stack, or a
     PARALLEL if the arg is to be copied into multiple non-contiguous
     registers.  */
  rtx reg;
  /* Register to pass this argument in when generating tail call sequence.
     This is not the same register as for normal calls on machines with
     register windows.  */
  rtx tail_call_reg;
  /* If REG is a PARALLEL, this is a copy of VALUE pulled into the correct
     form for emit_group_move.  */
  rtx parallel_value;
  /* If REG was promoted from the actual mode of the argument expression,
     indicates whether the promotion is sign- or zero-extended.  */
  int unsignedp;
  /* Number of bytes to put in registers.  0 means put the whole arg
     in registers.  Also 0 if not passed in registers.  */
  int partial;
  /* Nonzero if argument must be passed on stack.
     Note that some arguments may be passed on the stack
     even though pass_on_stack is zero, just because FUNCTION_ARG says so.
     pass_on_stack identifies arguments that *cannot* go in registers.  */
  int pass_on_stack;
  /* Some fields packaged up for locate_and_pad_parm.  */
  struct locate_and_pad_arg_data locate;
  /* Location on the stack at which parameter should be stored.  The store
     has already been done if STACK == VALUE.  */
  rtx stack;
  /* Location on the stack of the start of this argument slot.  This can
     differ from STACK if this arg pads downward.  This location is known
     to be aligned to FUNCTION_ARG_BOUNDARY.  */
  rtx stack_slot;
  /* Place that this stack area has been saved, if needed.  */
  rtx save_area;
  /* If an argument's alignment does not permit direct copying into registers,
     copy in smaller-sized pieces into pseudos.  These are stored in a
     block pointed to by this field.  The next field says how many
     word-sized pseudos we made.  */
  rtx *aligned_regs;
  int n_aligned_regs;
};

/* A vector of one char per byte of stack space.  A byte is nonzero if
   the corresponding stack location has been used.
   This vector is used to prevent a function call within an argument from
   clobbering any stack already set up.  */
static char *stack_usage_map;

/* Size of STACK_USAGE_MAP.  */
static int highest_outgoing_arg_in_use;

/* A bitmap of virtual-incoming stack space.  A bit is set if the
   corresponding stack location's tail call argument has already been
   stored into the stack.  This bitmap is used to prevent sibling call
   optimization if the function tries to use its parent's incoming
   argument slots when they have already been overwritten with tail call
   arguments.  */
static sbitmap stored_args_map;

/* stack_arg_under_construction is nonzero when an argument may be
   initialized with a constructor call (including a C function that
   returns a BLKmode struct) and expand_call must take special action
   to make sure the object being constructed does not overlap the
   argument list for the constructor call.  */
static int stack_arg_under_construction;

static void emit_call_1 (rtx, tree, tree, tree, HOST_WIDE_INT, HOST_WIDE_INT,
			 HOST_WIDE_INT, rtx, rtx, int, rtx, int,
			 CUMULATIVE_ARGS *);
static void precompute_register_parameters (int, struct arg_data *, int *);
static int store_one_arg (struct arg_data *, rtx, int, int, int);
static void store_unaligned_arguments_into_pseudos (struct arg_data *, int);
static int finalize_must_preallocate (int, int, struct arg_data *,
				      struct args_size *);
static void precompute_arguments (int, int, struct arg_data *);
static int compute_argument_block_size (int, struct args_size *, tree, int);
static void initialize_argument_information (int, struct arg_data *,
					     struct args_size *, int,
					     tree, tree,
					     tree, CUMULATIVE_ARGS *, int,
					     rtx *, int *, int *, int *,
					     bool *, bool);
static void compute_argument_addresses (struct arg_data *, rtx, int);
static rtx rtx_for_function_call (tree, tree);
static void load_register_parameters (struct arg_data *, int, rtx *, int,
				      int, int *);
static rtx emit_library_call_value_1 (int, rtx, rtx, enum libcall_type,
				      enum machine_mode, int, va_list);
static int special_function_p (const_tree, int);
static int check_sibcall_argument_overlap_1 (rtx);
static int check_sibcall_argument_overlap (rtx, struct arg_data *, int);

static int combine_pending_stack_adjustment_and_call (int, struct args_size *,
						      unsigned int);
static tree split_complex_types (tree);

#ifdef REG_PARM_STACK_SPACE
static rtx save_fixed_argument_area (int, rtx, int *, int *);
static void restore_fixed_argument_area (rtx, rtx, int, int);
#endif

/* Force FUNEXP into a form suitable for the address of a CALL,
   and return that as an rtx.  Also load the static chain register
   if FNDECL is a nested function.

   CALL_FUSAGE points to a variable holding the prospective
   CALL_INSN_FUNCTION_USAGE information.  */

rtx
prepare_call_address (rtx funexp, rtx static_chain_value,
		      rtx *call_fusage, int reg_parm_seen, int sibcallp)
{
  /* Make a valid memory address and copy constants through pseudo-regs,
     but not for a constant address if -fno-function-cse.  */
  if (GET_CODE (funexp) != SYMBOL_REF)
    /* If we are using registers for parameters, force the
       function address into a register now.  */
    funexp = ((SMALL_REGISTER_CLASSES && reg_parm_seen)
	      ? force_not_mem (memory_address (FUNCTION_MODE, funexp))
	      : memory_address (FUNCTION_MODE, funexp));
  else if (! sibcallp)
    {
#ifndef NO_FUNCTION_CSE
      if (optimize && ! flag_no_function_cse)
	funexp = force_reg (Pmode, funexp);
#endif
    }

  if (static_chain_value != 0)
    {
      static_chain_value = convert_memory_address (Pmode, static_chain_value);
      emit_move_insn (static_chain_rtx, static_chain_value);

      if (REG_P (static_chain_rtx))
	use_reg (call_fusage, static_chain_rtx);
    }

  return funexp;
}
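
/* Illustrative use (a sketch, not code from this file): a caller that
   has computed the callee address FUNEXP and a possible static chain
   does roughly

     funexp = prepare_call_address (funexp, static_chain_value,
				    &call_fusage, reg_parm_seen, 0);

   and then hands FUNEXP to emit_call_1 below; expand_call uses it in
   essentially this way.  */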

/* Generate instructions to call function FUNEXP,
   and optionally pop the results.
   The CALL_INSN is the first insn generated.

   FNDECL is the declaration node of the function.  This is given to the
   macro RETURN_POPS_ARGS to determine whether this function pops its own args.

   FUNTYPE is the data type of the function.  This is given to the macro
   RETURN_POPS_ARGS to determine whether this function pops its own args.
   We used to allow an identifier for library functions, but that doesn't
   work when the return type is an aggregate type and the calling convention
   says that the pointer to this aggregate is to be popped by the callee.

   STACK_SIZE is the number of bytes of arguments on the stack,
   ROUNDED_STACK_SIZE is that number rounded up to
   PREFERRED_STACK_BOUNDARY; zero if the size is variable.  This is
   both to put into the call insn and to generate explicit popping
   code if necessary.

   STRUCT_VALUE_SIZE is the number of bytes wanted in a structure value.
   It is zero if this call doesn't want a structure value.

   NEXT_ARG_REG is the rtx that results from executing
     FUNCTION_ARG (args_so_far, VOIDmode, void_type_node, 1)
   just after all the args have had their registers assigned.
   This could be whatever you like, but normally it is the first
   arg-register beyond those used for args in this call,
   or 0 if all the arg-registers are used in this call.
   It is passed on to `gen_call' so you can put this info in the call insn.

   VALREG is a hard register in which a value is returned,
   or 0 if the call does not return a value.

   OLD_INHIBIT_DEFER_POP is the value that `inhibit_defer_pop' had before
   the args to this call were processed.
   We restore `inhibit_defer_pop' to that value.

   CALL_FUSAGE is either empty or an EXPR_LIST of USE expressions that
   denote registers used by the called function.  */

static void
emit_call_1 (rtx funexp, tree fntree, tree fndecl ATTRIBUTE_UNUSED,
	     tree funtype ATTRIBUTE_UNUSED,
	     HOST_WIDE_INT stack_size ATTRIBUTE_UNUSED,
	     HOST_WIDE_INT rounded_stack_size,
	     HOST_WIDE_INT struct_value_size ATTRIBUTE_UNUSED,
	     rtx next_arg_reg ATTRIBUTE_UNUSED, rtx valreg,
	     int old_inhibit_defer_pop, rtx call_fusage, int ecf_flags,
	     CUMULATIVE_ARGS *args_so_far ATTRIBUTE_UNUSED)
{
  rtx rounded_stack_size_rtx = GEN_INT (rounded_stack_size);
  rtx call_insn;
  int already_popped = 0;
  HOST_WIDE_INT n_popped = RETURN_POPS_ARGS (fndecl, funtype, stack_size);
#if defined (HAVE_call) && defined (HAVE_call_value)
  rtx struct_value_size_rtx;
  struct_value_size_rtx = GEN_INT (struct_value_size);
#endif

#ifdef CALL_POPS_ARGS
  n_popped += CALL_POPS_ARGS (* args_so_far);
#endif

  /* Ensure address is valid.  SYMBOL_REF is already valid, so no need,
     and we don't want to load it into a register as an optimization,
     because prepare_call_address already did it if it should be done.  */
  if (GET_CODE (funexp) != SYMBOL_REF)
    funexp = memory_address (FUNCTION_MODE, funexp);

#if defined (HAVE_sibcall_pop) && defined (HAVE_sibcall_value_pop)
  if ((ecf_flags & ECF_SIBCALL)
      && HAVE_sibcall_pop && HAVE_sibcall_value_pop
      && (n_popped > 0 || stack_size == 0))
    {
      rtx n_pop = GEN_INT (n_popped);
      rtx pat;

      /* If this subroutine pops its own args, record that in the call insn
	 if possible, for the sake of frame pointer elimination.  */

      if (valreg)
	pat = GEN_SIBCALL_VALUE_POP (valreg,
				     gen_rtx_MEM (FUNCTION_MODE, funexp),
				     rounded_stack_size_rtx, next_arg_reg,
				     n_pop);
      else
	pat = GEN_SIBCALL_POP (gen_rtx_MEM (FUNCTION_MODE, funexp),
			       rounded_stack_size_rtx, next_arg_reg, n_pop);

      emit_call_insn (pat);
      already_popped = 1;
    }
  else
#endif

#if defined (HAVE_call_pop) && defined (HAVE_call_value_pop)
  /* If the target has "call" or "call_value" insns, then prefer them
     if no arguments are actually popped.  If the target does not have
     "call" or "call_value" insns, then we must use the popping versions
     even if the call has no arguments to pop.  */
#if defined (HAVE_call) && defined (HAVE_call_value)
  if (HAVE_call && HAVE_call_value && HAVE_call_pop && HAVE_call_value_pop
      && n_popped > 0)
#else
  if (HAVE_call_pop && HAVE_call_value_pop)
#endif
    {
      rtx n_pop = GEN_INT (n_popped);
      rtx pat;

      /* If this subroutine pops its own args, record that in the call insn
	 if possible, for the sake of frame pointer elimination.  */

      if (valreg)
	pat = GEN_CALL_VALUE_POP (valreg,
				  gen_rtx_MEM (FUNCTION_MODE, funexp),
				  rounded_stack_size_rtx, next_arg_reg, n_pop);
      else
	pat = GEN_CALL_POP (gen_rtx_MEM (FUNCTION_MODE, funexp),
			    rounded_stack_size_rtx, next_arg_reg, n_pop);

      emit_call_insn (pat);
      already_popped = 1;
    }
  else
#endif

#if defined (HAVE_sibcall) && defined (HAVE_sibcall_value)
  if ((ecf_flags & ECF_SIBCALL)
      && HAVE_sibcall && HAVE_sibcall_value)
    {
      if (valreg)
	emit_call_insn (GEN_SIBCALL_VALUE (valreg,
					   gen_rtx_MEM (FUNCTION_MODE, funexp),
					   rounded_stack_size_rtx,
					   next_arg_reg, NULL_RTX));
      else
	emit_call_insn (GEN_SIBCALL (gen_rtx_MEM (FUNCTION_MODE, funexp),
				     rounded_stack_size_rtx, next_arg_reg,
				     struct_value_size_rtx));
    }
  else
#endif

#if defined (HAVE_call) && defined (HAVE_call_value)
  if (HAVE_call && HAVE_call_value)
    {
      if (valreg)
	emit_call_insn (GEN_CALL_VALUE (valreg,
					gen_rtx_MEM (FUNCTION_MODE, funexp),
					rounded_stack_size_rtx, next_arg_reg,
					NULL_RTX));
      else
	emit_call_insn (GEN_CALL (gen_rtx_MEM (FUNCTION_MODE, funexp),
				  rounded_stack_size_rtx, next_arg_reg,
				  struct_value_size_rtx));
    }
  else
#endif
    gcc_unreachable ();

  /* Find the call we just emitted.  */
  call_insn = last_call_insn ();

  /* Put the register usage information there.  */
  add_function_usage_to (call_insn, call_fusage);

  /* If this is a const call, then set the insn's unchanging bit.  */
  if (ecf_flags & ECF_CONST)
    RTL_CONST_CALL_P (call_insn) = 1;

  /* If this is a pure call, then set the insn's unchanging bit.  */
  if (ecf_flags & ECF_PURE)
    RTL_PURE_CALL_P (call_insn) = 1;

  /* If this is a looping const or pure call, then set the insn's
     corresponding bit.  */
  if (ecf_flags & ECF_LOOPING_CONST_OR_PURE)
    RTL_LOOPING_CONST_OR_PURE_CALL_P (call_insn) = 1;

  /* If this call can't throw, attach a REG_EH_REGION reg note to that
     effect.  */
  if (ecf_flags & ECF_NOTHROW)
    REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_EH_REGION, const0_rtx,
					       REG_NOTES (call_insn));
  else
    {
      int rn = lookup_stmt_eh_region (fntree);

      /* If rn < 0, then either (1) tree-ssa not used or (2) doesn't
	 throw, which we already took care of.  */
      if (rn > 0)
	REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_EH_REGION, GEN_INT (rn),
						   REG_NOTES (call_insn));
    }

  if (ecf_flags & ECF_NORETURN)
    REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_NORETURN, const0_rtx,
					       REG_NOTES (call_insn));

  if (ecf_flags & ECF_RETURNS_TWICE)
    {
      REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_SETJMP, const0_rtx,
						 REG_NOTES (call_insn));
      cfun->calls_setjmp = 1;
    }

  SIBLING_CALL_P (call_insn) = ((ecf_flags & ECF_SIBCALL) != 0);

  /* Restore this now, so that we do defer pops for this call's args
     if the context of the call as a whole permits.  */
  inhibit_defer_pop = old_inhibit_defer_pop;

  if (n_popped > 0)
    {
      if (!already_popped)
	CALL_INSN_FUNCTION_USAGE (call_insn)
	  = gen_rtx_EXPR_LIST (VOIDmode,
			       gen_rtx_CLOBBER (VOIDmode, stack_pointer_rtx),
			       CALL_INSN_FUNCTION_USAGE (call_insn));
      rounded_stack_size -= n_popped;
      rounded_stack_size_rtx = GEN_INT (rounded_stack_size);
      stack_pointer_delta -= n_popped;
    }

  if (!ACCUMULATE_OUTGOING_ARGS)
    {
      /* If returning from the subroutine does not automatically pop the args,
	 we need an instruction to pop them sooner or later.
	 Perhaps do it now; perhaps just record how much space to pop later.

	 If returning from the subroutine does pop the args, indicate that the
	 stack pointer will be changed.  */

      if (rounded_stack_size != 0)
	{
	  if (ecf_flags & ECF_NORETURN)
	    /* Just pretend we did the pop.  */
	    stack_pointer_delta -= rounded_stack_size;
	  else if (flag_defer_pop && inhibit_defer_pop == 0
		   && ! (ecf_flags & (ECF_CONST | ECF_PURE)))
	    pending_stack_adjust += rounded_stack_size;
	  else
	    adjust_stack (rounded_stack_size_rtx);
	}
    }
  /* When we accumulate outgoing args, we must avoid any stack manipulations.
     Restore the stack pointer to its original value now.  Usually
     ACCUMULATE_OUTGOING_ARGS targets don't get here, but there are exceptions.
     On i386 ACCUMULATE_OUTGOING_ARGS can be enabled on demand, and
     popping variants of functions exist as well.

     ??? We may optimize similar to defer_pop above, but it is
     probably not worthwhile.

     ??? It will be worthwhile to enable combine_stack_adjustments even for
     such machines.  */
  else if (n_popped)
    anti_adjust_stack (GEN_INT (n_popped));
}
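
/* Worked example of the popping logic above (illustrative): for a
   callee that pops its own 12 bytes of arguments (n_popped == 12,
   e.g. an x86 stdcall function) with ROUNDED_STACK_SIZE == 12, the
   call is emitted through a *_pop pattern where available,
   ROUNDED_STACK_SIZE drops to 0 and STACK_POINTER_DELTA is reduced
   by 12, so no explicit adjust_stack call is needed afterwards.  */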

/* Determine if the function identified by NAME and FNDECL is one with
   special properties we wish to know about.

   For example, if the function might return more than one time (setjmp), then
   set RETURNS_TWICE to a nonzero value.

   Similarly set NORETURN if the function is in the longjmp family.

   Set MAY_BE_ALLOCA for any memory allocation function that might allocate
   space from the stack such as alloca.  */

static int
special_function_p (const_tree fndecl, int flags)
{
  if (fndecl && DECL_NAME (fndecl)
      && IDENTIFIER_LENGTH (DECL_NAME (fndecl)) <= 17
      /* Exclude functions not at the file scope, or not `extern',
	 since they are not the magic functions we would otherwise
	 think they are.
	 FIXME: this should be handled with attributes, not with this
	 hacky imitation of DECL_ASSEMBLER_NAME.  It's (also) wrong
	 because you can declare fork() inside a function if you
	 wish.  */
      && (DECL_CONTEXT (fndecl) == NULL_TREE
	  || TREE_CODE (DECL_CONTEXT (fndecl)) == TRANSLATION_UNIT_DECL)
      && TREE_PUBLIC (fndecl))
    {
      const char *name = IDENTIFIER_POINTER (DECL_NAME (fndecl));
      const char *tname = name;

      /* We assume that alloca will always be called by name.  It
	 makes no sense to pass it as a pointer-to-function to
	 anything that does not understand its behavior.  */
      if (((IDENTIFIER_LENGTH (DECL_NAME (fndecl)) == 6
	    && name[0] == 'a'
	    && ! strcmp (name, "alloca"))
	   || (IDENTIFIER_LENGTH (DECL_NAME (fndecl)) == 16
	       && name[0] == '_'
	       && ! strcmp (name, "__builtin_alloca"))))
	flags |= ECF_MAY_BE_ALLOCA;

      /* Disregard prefix _, __ or __x.  */
      if (name[0] == '_')
	{
	  if (name[1] == '_' && name[2] == 'x')
	    tname += 3;
	  else if (name[1] == '_')
	    tname += 2;
	  else
	    tname += 1;
	}

      if (tname[0] == 's')
	{
	  if ((tname[1] == 'e'
	       && (! strcmp (tname, "setjmp")
		   || ! strcmp (tname, "setjmp_syscall")))
	      || (tname[1] == 'i'
		  && ! strcmp (tname, "sigsetjmp"))
	      || (tname[1] == 'a'
		  && ! strcmp (tname, "savectx")))
	    flags |= ECF_RETURNS_TWICE;

	  if (tname[1] == 'i'
	      && ! strcmp (tname, "siglongjmp"))
	    flags |= ECF_NORETURN;
	}
      else if ((tname[0] == 'q' && tname[1] == 's'
		&& ! strcmp (tname, "qsetjmp"))
	       || (tname[0] == 'v' && tname[1] == 'f'
		   && ! strcmp (tname, "vfork"))
	       || (tname[0] == 'g' && tname[1] == 'e'
		   && !strcmp (tname, "getcontext")))
	flags |= ECF_RETURNS_TWICE;

      else if (tname[0] == 'l' && tname[1] == 'o'
	       && ! strcmp (tname, "longjmp"))
	flags |= ECF_NORETURN;
    }

  return flags;
}
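
/* Example behavior (illustrative): a file-scope extern declaration of
   "setjmp" or "__setjmp" (the prefix stripping above reduces both to
   "setjmp") gets ECF_RETURNS_TWICE added to FLAGS, "longjmp" and
   "siglongjmp" get ECF_NORETURN, and "alloca" gets ECF_MAY_BE_ALLOCA.
   A block-scope or non-extern declaration of the same names is
   deliberately not treated specially.  */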

/* Return nonzero when FNDECL represents a call to setjmp.  */

int
setjmp_call_p (const_tree fndecl)
{
  return special_function_p (fndecl, 0) & ECF_RETURNS_TWICE;
}

/* Return true when EXP contains an alloca call.  */

bool
alloca_call_p (const_tree exp)
{
  if (TREE_CODE (exp) == CALL_EXPR
      && TREE_CODE (CALL_EXPR_FN (exp)) == ADDR_EXPR
      && (TREE_CODE (TREE_OPERAND (CALL_EXPR_FN (exp), 0)) == FUNCTION_DECL)
      && (special_function_p (TREE_OPERAND (CALL_EXPR_FN (exp), 0), 0)
	  & ECF_MAY_BE_ALLOCA))
    return true;
  return false;
}

/* Detect flags (function attributes) from the function decl or type node.  */

int
flags_from_decl_or_type (const_tree exp)
{
  int flags = 0;
  const_tree type = exp;

  if (DECL_P (exp))
    {
      type = TREE_TYPE (exp);

      /* The function exp may have the `malloc' attribute.  */
      if (DECL_IS_MALLOC (exp))
	flags |= ECF_MALLOC;

      /* The function exp may have the `returns_twice' attribute.  */
      if (DECL_IS_RETURNS_TWICE (exp))
	flags |= ECF_RETURNS_TWICE;

      /* Process the pure and const attributes.  */
      if (TREE_READONLY (exp) && ! TREE_THIS_VOLATILE (exp))
	flags |= ECF_CONST;
      if (DECL_PURE_P (exp))
	flags |= ECF_PURE;
      if (DECL_LOOPING_CONST_OR_PURE_P (exp))
	flags |= ECF_LOOPING_CONST_OR_PURE;

      if (DECL_IS_NOVOPS (exp))
	flags |= ECF_NOVOPS;

      if (TREE_NOTHROW (exp))
	flags |= ECF_NOTHROW;

      flags = special_function_p (exp, flags);
    }
  else if (TYPE_P (exp) && TYPE_READONLY (exp) && ! TREE_THIS_VOLATILE (exp))
    flags |= ECF_CONST;

  if (TREE_THIS_VOLATILE (exp))
    flags |= ECF_NORETURN;

  return flags;
}

/* Detect flags from a CALL_EXPR.  */

int
call_expr_flags (const_tree t)
{
  int flags;
  tree decl = get_callee_fndecl (t);

  if (decl)
    flags = flags_from_decl_or_type (decl);
  else
    {
      t = TREE_TYPE (CALL_EXPR_FN (t));
      if (t && TREE_CODE (t) == POINTER_TYPE)
	flags = flags_from_decl_or_type (TREE_TYPE (t));
      else
	flags = 0;
    }

  return flags;
}
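
/* Example (illustrative): for a direct call to a declaration marked
   __attribute__ ((const)) and not volatile, the decl path above yields
   a mask containing ECF_CONST; for an indirect call through a plain
   function pointer only the pointed-to type is available, so at most
   ECF_CONST and ECF_NORETURN can be deduced from the type's
   qualifiers.  */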

/* Precompute all register parameters as described by ARGS, storing values
   into fields within the ARGS array.

   NUM_ACTUALS indicates the total number of elements in the ARGS array.

   Set REG_PARM_SEEN if we encounter a register parameter.  */

static void
precompute_register_parameters (int num_actuals, struct arg_data *args,
				int *reg_parm_seen)
{
  int i;

  *reg_parm_seen = 0;

  for (i = 0; i < num_actuals; i++)
    if (args[i].reg != 0 && ! args[i].pass_on_stack)
      {
	*reg_parm_seen = 1;

	if (args[i].value == 0)
	  {
	    push_temp_slots ();
	    args[i].value = expand_normal (args[i].tree_value);
	    preserve_temp_slots (args[i].value);
	    pop_temp_slots ();
	  }

	/* If the value is a non-legitimate constant, force it into a
	   pseudo now.  TLS symbols sometimes need a call to resolve.  */
	if (CONSTANT_P (args[i].value)
	    && !LEGITIMATE_CONSTANT_P (args[i].value))
	  args[i].value = force_reg (args[i].mode, args[i].value);

	/* If we are to promote the function arg to a wider mode,
	   do it now.  */

	if (args[i].mode != TYPE_MODE (TREE_TYPE (args[i].tree_value)))
	  args[i].value
	    = convert_modes (args[i].mode,
			     TYPE_MODE (TREE_TYPE (args[i].tree_value)),
			     args[i].value, args[i].unsignedp);

	/* If we're going to have to load the value by parts, pull the
	   parts into pseudos.  The part extraction process can involve
	   non-trivial computation.  */
	if (GET_CODE (args[i].reg) == PARALLEL)
	  {
	    tree type = TREE_TYPE (args[i].tree_value);
	    args[i].parallel_value
	      = emit_group_load_into_temps (args[i].reg, args[i].value,
					    type, int_size_in_bytes (type));
	  }

	/* If the value is expensive, and we are inside an appropriately
	   short loop, put the value into a pseudo and then put the pseudo
	   into the hard reg.

	   For small register classes, also do this if this call uses
	   register parameters.  This is to avoid reload conflicts while
	   loading the parameter registers.  */

	else if ((! (REG_P (args[i].value)
		     || (GET_CODE (args[i].value) == SUBREG
			 && REG_P (SUBREG_REG (args[i].value)))))
		 && args[i].mode != BLKmode
		 && rtx_cost (args[i].value, SET) > COSTS_N_INSNS (1)
		 && ((SMALL_REGISTER_CLASSES && *reg_parm_seen)
		     || optimize))
	  args[i].value = copy_to_mode_reg (args[i].mode, args[i].value);
      }
}

#ifdef REG_PARM_STACK_SPACE

/* The argument list is the property of the called routine and it
   may clobber it.  If the fixed area has been used for previous
   parameters, we must save and restore it.  */

static rtx
save_fixed_argument_area (int reg_parm_stack_space, rtx argblock, int *low_to_save, int *high_to_save)
{
  int low;
  int high;

  /* Compute the boundary of the area that needs to be saved, if any.  */
  high = reg_parm_stack_space;
#ifdef ARGS_GROW_DOWNWARD
  high += 1;
#endif
  if (high > highest_outgoing_arg_in_use)
    high = highest_outgoing_arg_in_use;

  for (low = 0; low < high; low++)
    if (stack_usage_map[low] != 0)
      {
	int num_to_save;
	enum machine_mode save_mode;
	int delta;
	rtx stack_area;
	rtx save_area;

	while (stack_usage_map[--high] == 0)
	  ;

	*low_to_save = low;
	*high_to_save = high;

	num_to_save = high - low + 1;
	save_mode = mode_for_size (num_to_save * BITS_PER_UNIT, MODE_INT, 1);

	/* If we don't have the required alignment, must do this
	   in BLKmode.  */
	if ((low & (MIN (GET_MODE_SIZE (save_mode),
			 BIGGEST_ALIGNMENT / UNITS_PER_WORD) - 1)))
	  save_mode = BLKmode;

#ifdef ARGS_GROW_DOWNWARD
	delta = -high;
#else
	delta = low;
#endif
	stack_area = gen_rtx_MEM (save_mode,
				  memory_address (save_mode,
						  plus_constant (argblock,
								 delta)));

	set_mem_align (stack_area, PARM_BOUNDARY);
	if (save_mode == BLKmode)
	  {
	    save_area = assign_stack_temp (BLKmode, num_to_save, 0);
	    emit_block_move (validize_mem (save_area), stack_area,
			     GEN_INT (num_to_save), BLOCK_OP_CALL_PARM);
	  }
	else
	  {
	    save_area = gen_reg_rtx (save_mode);
	    emit_move_insn (save_area, stack_area);
	  }

	return save_area;
      }

  return NULL_RTX;
}
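
/* Worked example (illustrative): with reg_parm_stack_space == 16, args
   not growing downward, and stack_usage_map marking bytes 4..11 as
   used, the loop above finds low == 4 and high == 11, so 8 bytes are
   saved: in a 64-bit integer mode if LOW happens to be suitably
   aligned for it, otherwise through the BLKmode block-move fallback.  */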

static void
restore_fixed_argument_area (rtx save_area, rtx argblock, int high_to_save, int low_to_save)
{
  enum machine_mode save_mode = GET_MODE (save_area);
  int delta;
  rtx stack_area;

#ifdef ARGS_GROW_DOWNWARD
  delta = -high_to_save;
#else
  delta = low_to_save;
#endif
  stack_area = gen_rtx_MEM (save_mode,
			    memory_address (save_mode,
					    plus_constant (argblock, delta)));
  set_mem_align (stack_area, PARM_BOUNDARY);

  if (save_mode != BLKmode)
    emit_move_insn (stack_area, save_area);
  else
    emit_block_move (stack_area, validize_mem (save_area),
		     GEN_INT (high_to_save - low_to_save + 1),
		     BLOCK_OP_CALL_PARM);
}
#endif /* REG_PARM_STACK_SPACE */

/* If any elements in ARGS refer to parameters that are to be passed in
   registers, but not in memory, and whose alignment does not permit a
   direct copy into registers, copy the values into a group of pseudos
   which we will later copy into the appropriate hard registers.

   Pseudos for each unaligned argument will be stored into the array
   args[argnum].aligned_regs.  The caller is responsible for deallocating
   the aligned_regs array if it is nonzero.  */

static void
store_unaligned_arguments_into_pseudos (struct arg_data *args, int num_actuals)
{
  int i, j;

  for (i = 0; i < num_actuals; i++)
    if (args[i].reg != 0 && ! args[i].pass_on_stack
	&& args[i].mode == BLKmode
	&& (TYPE_ALIGN (TREE_TYPE (args[i].tree_value))
	    < (unsigned int) MIN (BIGGEST_ALIGNMENT, BITS_PER_WORD)))
      {
	int bytes = int_size_in_bytes (TREE_TYPE (args[i].tree_value));
	int endian_correction = 0;

	if (args[i].partial)
	  {
	    gcc_assert (args[i].partial % UNITS_PER_WORD == 0);
	    args[i].n_aligned_regs = args[i].partial / UNITS_PER_WORD;
	  }
	else
	  {
	    args[i].n_aligned_regs
	      = (bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
	  }

	args[i].aligned_regs = XNEWVEC (rtx, args[i].n_aligned_regs);

	/* Structures smaller than a word are normally aligned to the
	   least significant byte.  On a BYTES_BIG_ENDIAN machine,
	   this means we must skip the empty high order bytes when
	   calculating the bit offset.  */
	if (bytes < UNITS_PER_WORD
#ifdef BLOCK_REG_PADDING
	    && (BLOCK_REG_PADDING (args[i].mode,
				   TREE_TYPE (args[i].tree_value), 1)
		== downward)
#else
	    && BYTES_BIG_ENDIAN
#endif
	    )
	  endian_correction = BITS_PER_WORD - bytes * BITS_PER_UNIT;

	for (j = 0; j < args[i].n_aligned_regs; j++)
	  {
	    rtx reg = gen_reg_rtx (word_mode);
	    rtx word = operand_subword_force (args[i].value, j, BLKmode);
	    int bitsize = MIN (bytes * BITS_PER_UNIT, BITS_PER_WORD);

	    args[i].aligned_regs[j] = reg;
	    word = extract_bit_field (word, bitsize, 0, 1, NULL_RTX,
				      word_mode, word_mode);

	    /* There is no need to restrict this code to loading items
	       in TYPE_ALIGN sized hunks.  The bitfield instructions can
	       load up entire word sized registers efficiently.

	       ??? This may not be needed anymore.
	       We used to emit a clobber here but that doesn't let later
	       passes optimize the instructions we emit.  By storing 0 into
	       the register later passes know the first AND to zero out the
	       bitfield being set in the register is unnecessary.  The store
	       of 0 will be deleted as will at least the first AND.  */

	    emit_move_insn (reg, const0_rtx);

	    bytes -= bitsize / BITS_PER_UNIT;
	    store_bit_field (reg, bitsize, endian_correction, word_mode,
			     word);
	  }
      }
}
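
/* Worked example of ENDIAN_CORRECTION (illustrative): for a 3-byte
   BLKmode argument padded downward on a 32-bit target (BITS_PER_WORD
   == 32), endian_correction is 32 - 3 * 8 == 8, so the 24 significant
   bits are stored at bit position 8 of the word-mode pseudo rather
   than 0, skipping the byte of padding.  */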

/* Fill in ARGS_SIZE and ARGS array based on the parameters found in
   CALL_EXPR EXP.

   NUM_ACTUALS is the total number of parameters.

   N_NAMED_ARGS is the total number of named arguments.

   STRUCT_VALUE_ADDR_VALUE is the implicit argument for a struct return
   value, or null.

   FNDECL is the tree node for the target of this call (if known).

   ARGS_SO_FAR holds state needed by the target to know where to place
   the next argument.

   REG_PARM_STACK_SPACE is the number of bytes of stack space reserved
   for arguments which are passed in registers.

   OLD_STACK_LEVEL is a pointer to an rtx which holds the old stack level
   and may be modified by this routine.

   OLD_PENDING_ADJ, MUST_PREALLOCATE and FLAGS are pointers to integer
   flags which may be modified by this routine.

   MAY_TAILCALL is cleared if we encounter an invisible pass-by-reference
   that requires allocation of stack space.

   CALL_FROM_THUNK_P is true if this call is the jump from a thunk to
   the thunked-to function.  */

static void
initialize_argument_information (int num_actuals ATTRIBUTE_UNUSED,
				 struct arg_data *args,
				 struct args_size *args_size,
				 int n_named_args ATTRIBUTE_UNUSED,
				 tree exp, tree struct_value_addr_value,
				 tree fndecl,
				 CUMULATIVE_ARGS *args_so_far,
				 int reg_parm_stack_space,
				 rtx *old_stack_level, int *old_pending_adj,
				 int *must_preallocate, int *ecf_flags,
				 bool *may_tailcall, bool call_from_thunk_p)
{
  /* 1 if scanning parms front to back, -1 if scanning back to front.  */
  int inc;

  /* Count arg position in order args appear.  */
  int argpos;

  int i;

  args_size->constant = 0;
  args_size->var = 0;

  /* In this loop, we consider args in the order they are written.
     We fill up ARGS from the front or from the back if necessary
     so that in any case the first arg to be pushed ends up at the front.  */

  if (PUSH_ARGS_REVERSED)
    {
      i = num_actuals - 1, inc = -1;
      /* In this case, must reverse order of args
	 so that we compute and push the last arg first.  */
    }
  else
    {
      i = 0, inc = 1;
    }

  /* First fill in the actual arguments in the ARGS array, splitting
     complex arguments if necessary.  */
  {
    int j = i;
    call_expr_arg_iterator iter;
    tree arg;

    if (struct_value_addr_value)
      {
	args[j].tree_value = struct_value_addr_value;
	j += inc;
      }
    FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
      {
	tree argtype = TREE_TYPE (arg);
	if (targetm.calls.split_complex_arg
	    && argtype
	    && TREE_CODE (argtype) == COMPLEX_TYPE
	    && targetm.calls.split_complex_arg (argtype))
	  {
	    tree subtype = TREE_TYPE (argtype);
	    arg = save_expr (arg);
	    args[j].tree_value = build1 (REALPART_EXPR, subtype, arg);
	    j += inc;
	    args[j].tree_value = build1 (IMAGPART_EXPR, subtype, arg);
	  }
	else
	  args[j].tree_value = arg;
	j += inc;
      }
  }

  /* I counts args in order (to be) pushed; ARGPOS counts in order written.  */
  for (argpos = 0; argpos < num_actuals; i += inc, argpos++)
    {
      tree type = TREE_TYPE (args[i].tree_value);
      int unsignedp;
      enum machine_mode mode;

      /* Replace erroneous argument with constant zero.  */
      if (type == error_mark_node || !COMPLETE_TYPE_P (type))
	args[i].tree_value = integer_zero_node, type = integer_type_node;

      /* If TYPE is a transparent union, pass things the way we would
	 pass the first field of the union.  We have already verified that
	 the modes are the same.  */
      if (TREE_CODE (type) == UNION_TYPE && TYPE_TRANSPARENT_UNION (type))
	type = TREE_TYPE (TYPE_FIELDS (type));

      /* Decide where to pass this arg.

	 args[i].reg is nonzero if all or part is passed in registers.

	 args[i].partial is nonzero if part but not all is passed in registers,
	 and the exact value says how many bytes are passed in registers.

	 args[i].pass_on_stack is nonzero if the argument must at least be
	 computed on the stack.  It may then be loaded back into registers
	 if args[i].reg is nonzero.

	 These decisions are driven by the FUNCTION_... macros and must agree
	 with those made by function.c.  */

      /* See if this argument should be passed by invisible reference.  */
      if (pass_by_reference (args_so_far, TYPE_MODE (type),
			     type, argpos < n_named_args))
	{
	  bool callee_copies;
	  tree base;

	  callee_copies
	    = reference_callee_copied (args_so_far, TYPE_MODE (type),
				       type, argpos < n_named_args);

	  /* If we're compiling a thunk, pass through invisible references
	     instead of making a copy.  */
	  if (call_from_thunk_p
	      || (callee_copies
		  && !TREE_ADDRESSABLE (type)
		  && (base = get_base_address (args[i].tree_value))
		  && (!DECL_P (base) || MEM_P (DECL_RTL (base)))))
	    {
	      /* We can't use sibcalls if a callee-copied argument is
		 stored in the current function's frame.  */
	      if (!call_from_thunk_p && DECL_P (base) && !TREE_STATIC (base))
		*may_tailcall = false;

	      args[i].tree_value = build_fold_addr_expr (args[i].tree_value);
	      type = TREE_TYPE (args[i].tree_value);

	      if (*ecf_flags & ECF_CONST)
		*ecf_flags &= ~(ECF_CONST | ECF_LOOPING_CONST_OR_PURE);
	      *ecf_flags &= ~ECF_LIBCALL_BLOCK;
	    }
	  else
	    {
	      /* We make a copy of the object and pass the address to the
		 function being called.  */
	      rtx copy;

	      if (!COMPLETE_TYPE_P (type)
		  || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST
		  || (flag_stack_check && ! STACK_CHECK_BUILTIN
		      && (0 < compare_tree_int (TYPE_SIZE_UNIT (type),
						STACK_CHECK_MAX_VAR_SIZE))))
		{
		  /* This is a variable-sized object.  Make space on the stack
		     for it.  */
		  rtx size_rtx = expr_size (args[i].tree_value);

		  if (*old_stack_level == 0)
		    {
		      emit_stack_save (SAVE_BLOCK, old_stack_level, NULL_RTX);
		      *old_pending_adj = pending_stack_adjust;
		      pending_stack_adjust = 0;
		    }

		  copy = gen_rtx_MEM (BLKmode,
				      allocate_dynamic_stack_space
				      (size_rtx, NULL_RTX, TYPE_ALIGN (type)));
		  set_mem_attributes (copy, type, 1);
		}
	      else
		copy = assign_temp (type, 0, 1, 0);

	      store_expr (args[i].tree_value, copy, 0, false);

	      *ecf_flags &= ~(ECF_LIBCALL_BLOCK);

	      /* Just change the const function to pure and then let
		 the next test clear the pure based on
		 callee_copies.  */
	      if (*ecf_flags & ECF_CONST)
		{
		  *ecf_flags &= ~ECF_CONST;
		  *ecf_flags |= ECF_PURE;
		}

	      if (!callee_copies && *ecf_flags & ECF_PURE)
		*ecf_flags &= ~(ECF_PURE | ECF_LOOPING_CONST_OR_PURE);

	      args[i].tree_value
		= build_fold_addr_expr (make_tree (type, copy));
	      type = TREE_TYPE (args[i].tree_value);
	      *may_tailcall = false;
	    }
	}

      mode = TYPE_MODE (type);
      unsignedp = TYPE_UNSIGNED (type);

      if (targetm.calls.promote_function_args (fndecl ? TREE_TYPE (fndecl) : 0))
	mode = promote_mode (type, mode, &unsignedp, 1);

      args[i].unsignedp = unsignedp;
      args[i].mode = mode;

      args[i].reg = FUNCTION_ARG (*args_so_far, mode, type,
				  argpos < n_named_args);
#ifdef FUNCTION_INCOMING_ARG
      /* If this is a sibling call and the machine has register windows, the
	 register window has to be unwound before calling the routine, so
	 arguments have to go into the incoming registers.  */
      args[i].tail_call_reg = FUNCTION_INCOMING_ARG (*args_so_far, mode, type,
						     argpos < n_named_args);
#else
      args[i].tail_call_reg = args[i].reg;
#endif

      if (args[i].reg)
	args[i].partial
	  = targetm.calls.arg_partial_bytes (args_so_far, mode, type,
					     argpos < n_named_args);

      args[i].pass_on_stack = targetm.calls.must_pass_in_stack (mode, type);

      /* If FUNCTION_ARG returned a (parallel [(expr_list (nil) ...) ...]),
	 it means that we are to pass this arg in the register(s) designated
	 by the PARALLEL, but also to pass it in the stack.  */
      if (args[i].reg && GET_CODE (args[i].reg) == PARALLEL
	  && XEXP (XVECEXP (args[i].reg, 0, 0), 0) == 0)
	args[i].pass_on_stack = 1;

      /* If this is an addressable type, we must preallocate the stack
	 since we must evaluate the object into its final location.

	 If this is to be passed in both registers and the stack, it is simpler
	 to preallocate.  */
      if (TREE_ADDRESSABLE (type)
	  || (args[i].pass_on_stack && args[i].reg != 0))
	*must_preallocate = 1;

      /* If this is an addressable type, we cannot pre-evaluate it.  Thus,
	 we cannot consider this function call constant.  */
      if (TREE_ADDRESSABLE (type))
	*ecf_flags &= ~ECF_LIBCALL_BLOCK;

      /* Compute the stack-size of this argument.  */
      if (args[i].reg == 0 || args[i].partial != 0
	  || reg_parm_stack_space > 0
	  || args[i].pass_on_stack)
	locate_and_pad_parm (mode, type,
#ifdef STACK_PARMS_IN_REG_PARM_AREA
			     1,
#else
			     args[i].reg != 0,
#endif
			     args[i].pass_on_stack ? 0 : args[i].partial,
			     fndecl, args_size, &args[i].locate);
#ifdef BLOCK_REG_PADDING
      else
	/* The argument is passed entirely in registers.  See at which
	   end it should be padded.  */
	args[i].locate.where_pad =
	  BLOCK_REG_PADDING (mode, type,
			     int_size_in_bytes (type) <= UNITS_PER_WORD);
#endif

      /* Update ARGS_SIZE, the total stack space for args so far.  */

      args_size->constant += args[i].locate.size.constant;
      if (args[i].locate.size.var)
	ADD_PARM_SIZE (*args_size, args[i].locate.size.var);

      /* Increment ARGS_SO_FAR, which has info about which arg-registers
	 have been used, etc.  */

      FUNCTION_ARG_ADVANCE (*args_so_far, TYPE_MODE (type), type,
			    argpos < n_named_args);
    }
}
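
/* Illustrative walk-through (a sketch, not any specific ABI): for a
   call f (x, c) where X is a large struct passed by invisible
   reference and C is a char promoted for the call, the loop above
   rewrites X's tree_value into the address of a copy (clearing
   *MAY_TAILCALL unless the callee makes the copy itself), records the
   promoted mode and extension kind in args[1].mode and
   args[1].unsignedp, and accumulates both slots' sizes into ARGS_SIZE
   via locate_and_pad_parm.  */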

/* Update ARGS_SIZE to contain the total size for the argument block.
   Return the original constant component of the argument block's size.

   REG_PARM_STACK_SPACE holds the number of bytes of stack space reserved
   for arguments passed in registers.  */

static int
compute_argument_block_size (int reg_parm_stack_space,
			     struct args_size *args_size,
			     tree fndecl ATTRIBUTE_UNUSED,
			     int preferred_stack_boundary ATTRIBUTE_UNUSED)
{
  int unadjusted_args_size = args_size->constant;

  /* For accumulate outgoing args mode we don't need to align, since the frame
     will be already aligned.  Align to STACK_BOUNDARY in order to prevent
     backends from generating misaligned frame sizes.  */
  if (ACCUMULATE_OUTGOING_ARGS && preferred_stack_boundary > STACK_BOUNDARY)
    preferred_stack_boundary = STACK_BOUNDARY;

  /* Compute the actual size of the argument block required.  The variable
     and constant sizes must be combined, the size may have to be rounded,
     and there may be a minimum required size.  */

  if (args_size->var)
    {
      args_size->var = ARGS_SIZE_TREE (*args_size);
      args_size->constant = 0;

      preferred_stack_boundary /= BITS_PER_UNIT;
      if (preferred_stack_boundary > 1)
	{
	  /* We don't handle this case yet.  To handle it correctly we have
	     to add the delta, round and subtract the delta.
	     Currently no machine description requires this support.  */
	  gcc_assert (!(stack_pointer_delta & (preferred_stack_boundary - 1)));
	  args_size->var = round_up (args_size->var, preferred_stack_boundary);
	}

      if (reg_parm_stack_space > 0)
	{
	  args_size->var
	    = size_binop (MAX_EXPR, args_size->var,
			  ssize_int (reg_parm_stack_space));

	  /* The area corresponding to register parameters is not to count in
	     the size of the block we need.  So make the adjustment.  */
	  if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE : TREE_TYPE (fndecl))))
	    args_size->var
	      = size_binop (MINUS_EXPR, args_size->var,
			    ssize_int (reg_parm_stack_space));
	}
    }
  else
    {
      preferred_stack_boundary /= BITS_PER_UNIT;
      if (preferred_stack_boundary < 1)
	preferred_stack_boundary = 1;
      args_size->constant = (((args_size->constant
			       + stack_pointer_delta
			       + preferred_stack_boundary - 1)
			      / preferred_stack_boundary
			      * preferred_stack_boundary)
			     - stack_pointer_delta);

      args_size->constant = MAX (args_size->constant,
				 reg_parm_stack_space);

      if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE : TREE_TYPE (fndecl))))
	args_size->constant -= reg_parm_stack_space;
    }
  return unadjusted_args_size;
}
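
/* Worked example of the constant rounding above (illustrative): with
   args_size->constant == 20, stack_pointer_delta == 0 and a preferred
   boundary of 16 bytes, the expression yields ((20 + 15) / 16) * 16
   == 32, i.e. 12 bytes of padding; with stack_pointer_delta == 4 the
   same 20 bytes round to ((20 + 4 + 15) / 16) * 16 - 4 == 28, keeping
   the boundary correct relative to the current stack pointer.  */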

/* Precompute parameters as needed for a function call.

   FLAGS is mask of ECF_* constants.

   NUM_ACTUALS is the number of arguments.

   ARGS is an array containing information for each argument; this
   routine fills in the INITIAL_VALUE and VALUE fields for each
   precomputed argument.  */

static void
precompute_arguments (int flags, int num_actuals, struct arg_data *args)
{
  int i;

  /* If this is a libcall, then precompute all arguments so that we do not
     get extraneous instructions emitted as part of the libcall sequence.  */

  /* If we preallocated the stack space, and some arguments must be passed
     on the stack, then we must precompute any parameter which contains a
     function call which will store arguments on the stack.
     Otherwise, evaluating the parameter may clobber previous parameters
     which have already been stored into the stack.  (we have code to avoid
     such a case by saving the outgoing stack arguments, but it results in
     worse code)  */
  if ((flags & ECF_LIBCALL_BLOCK) == 0 && !ACCUMULATE_OUTGOING_ARGS)
    return;

  for (i = 0; i < num_actuals; i++)
    {
      enum machine_mode mode;

      if ((flags & ECF_LIBCALL_BLOCK) == 0
	  && TREE_CODE (args[i].tree_value) != CALL_EXPR)
	continue;

      /* If this is an addressable type, we cannot pre-evaluate it.  */
      gcc_assert (!TREE_ADDRESSABLE (TREE_TYPE (args[i].tree_value)));

      args[i].initial_value = args[i].value
	= expand_normal (args[i].tree_value);

      mode = TYPE_MODE (TREE_TYPE (args[i].tree_value));
      if (mode != args[i].mode)
	{
	  args[i].value
	    = convert_modes (args[i].mode, mode,
			     args[i].value, args[i].unsignedp);
#if defined(PROMOTE_FUNCTION_MODE) && !defined(PROMOTE_MODE)
	  /* CSE will replace this only if it contains args[i].value
	     pseudo, so convert it down to the declared mode using
	     a SUBREG.  */
	  if (REG_P (args[i].value)
	      && GET_MODE_CLASS (args[i].mode) == MODE_INT)
	    {
	      args[i].initial_value
		= gen_lowpart_SUBREG (mode, args[i].value);
	      SUBREG_PROMOTED_VAR_P (args[i].initial_value) = 1;
	      SUBREG_PROMOTED_UNSIGNED_SET (args[i].initial_value,
					    args[i].unsignedp);
	    }
#endif
	}
    }
}

/* Given the current state of MUST_PREALLOCATE and information about
   arguments to a function call in NUM_ACTUALS, ARGS and ARGS_SIZE,
   compute and return the final value for MUST_PREALLOCATE.  */

static int
finalize_must_preallocate (int must_preallocate, int num_actuals,
			   struct arg_data *args, struct args_size *args_size)
{
  /* See if we have or want to preallocate stack space.

     If we would have to push a partially-in-regs parm
     before other stack parms, preallocate stack space instead.

     If the size of some parm is not a multiple of the required stack
     alignment, we must preallocate.

     If the total size of arguments that would otherwise create a copy in
     a temporary (such as a CALL) is more than half the total argument list
     size, preallocation is faster.

     Another reason to preallocate is if we have a machine (like the m88k)
     where stack alignment is required to be maintained between every
     pair of insns, not just when the call is made.  However, we assume here
     that such machines either do not have push insns (and hence preallocation
     would occur anyway) or the problem is taken care of with
     PUSH_ROUNDING.  */

  if (! must_preallocate)
    {
      int partial_seen = 0;
      int copy_to_evaluate_size = 0;
      int i;

      for (i = 0; i < num_actuals && ! must_preallocate; i++)
	{
	  if (args[i].partial > 0 && ! args[i].pass_on_stack)
	    partial_seen = 1;
	  else if (partial_seen && args[i].reg == 0)
	    must_preallocate = 1;

	  if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode
	      && (TREE_CODE (args[i].tree_value) == CALL_EXPR
		  || TREE_CODE (args[i].tree_value) == TARGET_EXPR
		  || TREE_CODE (args[i].tree_value) == COND_EXPR
		  || TREE_ADDRESSABLE (TREE_TYPE (args[i].tree_value))))
	    copy_to_evaluate_size
	      += int_size_in_bytes (TREE_TYPE (args[i].tree_value));
	}

      if (copy_to_evaluate_size * 2 >= args_size->constant
	  && args_size->constant > 0)
	must_preallocate = 1;
    }
  return must_preallocate;
}

/* If we preallocated stack space, compute the address of each argument
   and store it into the ARGS array.

   We need not ensure it is a valid memory address here; it will be
   validized when it is used.

   ARGBLOCK is an rtx for the address of the outgoing arguments.  */

static void
compute_argument_addresses (struct arg_data *args, rtx argblock, int num_actuals)
{
  if (argblock)
    {
      rtx arg_reg = argblock;
      int i, arg_offset = 0;

      if (GET_CODE (argblock) == PLUS)
	arg_reg = XEXP (argblock, 0), arg_offset = INTVAL (XEXP (argblock, 1));

      for (i = 0; i < num_actuals; i++)
	{
	  rtx offset = ARGS_SIZE_RTX (args[i].locate.offset);
	  rtx slot_offset = ARGS_SIZE_RTX (args[i].locate.slot_offset);
	  rtx addr;
	  unsigned int align, boundary;
	  unsigned int units_on_stack = 0;
	  enum machine_mode partial_mode = VOIDmode;

	  /* Skip this parm if it will not be passed on the stack.  */
	  if (! args[i].pass_on_stack
	      && args[i].reg != 0
	      && args[i].partial == 0)
	    continue;

	  if (GET_CODE (offset) == CONST_INT)
	    addr = plus_constant (arg_reg, INTVAL (offset));
	  else
	    addr = gen_rtx_PLUS (Pmode, arg_reg, offset);

	  addr = plus_constant (addr, arg_offset);

	  if (args[i].partial != 0)
	    {
	      /* Only part of the parameter is being passed on the stack.
		 Generate a simple memory reference of the correct size.  */
	      units_on_stack = args[i].locate.size.constant;
	      partial_mode = mode_for_size (units_on_stack * BITS_PER_UNIT,
					    MODE_INT, 1);
	      args[i].stack = gen_rtx_MEM (partial_mode, addr);
	      set_mem_size (args[i].stack, GEN_INT (units_on_stack));
	    }
	  else
	    {
	      args[i].stack = gen_rtx_MEM (args[i].mode, addr);
	      set_mem_attributes (args[i].stack,
				  TREE_TYPE (args[i].tree_value), 1);
	    }
	  align = BITS_PER_UNIT;
	  boundary = args[i].locate.boundary;
	  if (args[i].locate.where_pad != downward)
	    align = boundary;
	  else if (GET_CODE (offset) == CONST_INT)
	    {
	      align = INTVAL (offset) * BITS_PER_UNIT | boundary;
	      align = align & -align;
	    }
	  set_mem_align (args[i].stack, align);

	  if (GET_CODE (slot_offset) == CONST_INT)
	    addr = plus_constant (arg_reg, INTVAL (slot_offset));
	  else
	    addr = gen_rtx_PLUS (Pmode, arg_reg, slot_offset);

	  addr = plus_constant (addr, arg_offset);

	  if (args[i].partial != 0)
	    {
	      /* Only part of the parameter is being passed on the stack.
		 Generate a simple memory reference of the correct size.  */
	      args[i].stack_slot = gen_rtx_MEM (partial_mode, addr);
	      set_mem_size (args[i].stack_slot, GEN_INT (units_on_stack));
	    }
	  else
	    {
	      args[i].stack_slot = gen_rtx_MEM (args[i].mode, addr);
	      set_mem_attributes (args[i].stack_slot,
				  TREE_TYPE (args[i].tree_value), 1);
	    }
	  set_mem_align (args[i].stack_slot, args[i].locate.boundary);

	  /* Function incoming arguments may overlap with sibling call
	     outgoing arguments and we cannot allow reordering of reads
	     from function arguments with stores to outgoing arguments
	     of sibling calls.  */
	  set_mem_alias_set (args[i].stack, 0);
	  set_mem_alias_set (args[i].stack_slot, 0);
	}
    }
}
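
/* Worked example of the ALIGN computation above (illustrative): for a
   downward-padded arg at constant offset 4 with a slot boundary of 64
   bits, align starts as (4 * 8) | 64 == 96, and 96 & -96 == 32, i.e.
   the data itself is only known to be 32-bit aligned even though its
   slot is 64-bit aligned.  */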

/* Given a FNDECL and EXP, return an rtx suitable for use as a target address
   in a call instruction.

   FNDECL is the tree node for the target function.  For an indirect call
   FNDECL will be NULL_TREE.

   ADDR is the operand 0 of CALL_EXPR for this call.  */

static rtx
rtx_for_function_call (tree fndecl, tree addr)
{
  rtx funexp;

  /* Get the function to call, in the form of RTL.  */
  if (fndecl)
    {
      /* If this is the first use of the function, see if we need to
	 make an external definition for it.  */
      if (!TREE_USED (fndecl) && fndecl != current_function_decl)
	{
	  assemble_external (fndecl);
	  TREE_USED (fndecl) = 1;
	}

      /* Get a SYMBOL_REF rtx for the function address.  */
      funexp = XEXP (DECL_RTL (fndecl), 0);
    }
  else
    /* Generate an rtx (probably a pseudo-register) for the address.  */
    {
      push_temp_slots ();
      funexp = expand_normal (addr);
      pop_temp_slots ();	/* FUNEXP can't be BLKmode.  */
    }
  return funexp;
}

/* Return true if and only if SIZE storage units (usually bytes)
   starting from address ADDR overlap with already clobbered argument
   area.  This function is used to determine if we should give up a
   sibcall.  */

static bool
mem_overlaps_already_clobbered_arg_p (rtx addr, unsigned HOST_WIDE_INT size)
{
  HOST_WIDE_INT i;

  if (addr == crtl->args.internal_arg_pointer)
    i = 0;
  else if (GET_CODE (addr) == PLUS
	   && XEXP (addr, 0) == crtl->args.internal_arg_pointer
	   && GET_CODE (XEXP (addr, 1)) == CONST_INT)
    i = INTVAL (XEXP (addr, 1));
  /* Return true for arg pointer based indexed addressing.  */
  else if (GET_CODE (addr) == PLUS
	   && (XEXP (addr, 0) == crtl->args.internal_arg_pointer
	       || XEXP (addr, 1) == crtl->args.internal_arg_pointer))
    return true;
  else
    return false;

#ifdef ARGS_GROW_DOWNWARD
  i = -i - size;
#endif
  if (size > 0)
    {
      unsigned HOST_WIDE_INT k;

      for (k = 0; k < size; k++)
	if (i + k < stored_args_map->n_bits
	    && TEST_BIT (stored_args_map, i + k))
	  return true;
    }

  return false;
}
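
/* Example (illustrative): if a tail-call store has marked bytes 8..11
   of the incoming argument area in STORED_ARGS_MAP, a 4-byte load from
   (plus internal_arg_pointer 8) is reported as overlapping, while the
   same load at offset 16 is not.  An indexed address based on
   internal_arg_pointer is conservatively reported as overlapping
   because its offset is unknown at compile time.  */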

/* Do the register loads required for any wholly-register parms or any
   parms which are passed both on the stack and in a register.  Their
   expressions were already evaluated.

   Mark all register-parms as living through the call, putting these USE
   insns in the CALL_INSN_FUNCTION_USAGE field.

   When IS_SIBCALL, perform the check_sibcall_argument_overlap
   checking, setting *SIBCALL_FAILURE if appropriate.  */

static void
load_register_parameters (struct arg_data *args, int num_actuals,
			  rtx *call_fusage, int flags, int is_sibcall,
			  int *sibcall_failure)
{
  int i, j;

  for (i = 0; i < num_actuals; i++)
    {
      rtx reg = ((flags & ECF_SIBCALL)
		 ? args[i].tail_call_reg : args[i].reg);
      if (reg)
	{
	  int partial = args[i].partial;
	  int nregs;
	  int size = 0;
	  rtx before_arg = get_last_insn ();
	  /* Set non-negative if we must move a word at a time, even if
	     just one word (e.g., partial == 4 && mode == DFmode).  Set
	     to -1 if we just use a normal move insn.  This value can be
	     zero if the argument is a zero size structure.  */
	  nregs = -1;
	  if (GET_CODE (reg) == PARALLEL)
	    ;
	  else if (partial)
	    {
	      gcc_assert (partial % UNITS_PER_WORD == 0);
	      nregs = partial / UNITS_PER_WORD;
	    }
	  else if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode)
	    {
	      size = int_size_in_bytes (TREE_TYPE (args[i].tree_value));
	      nregs = (size + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD;
	    }
	  else
	    size = GET_MODE_SIZE (args[i].mode);

	  /* Handle calls that pass values in multiple non-contiguous
	     locations.  The Irix 6 ABI has examples of this.  */

	  if (GET_CODE (reg) == PARALLEL)
	    emit_group_move (reg, args[i].parallel_value);

	  /* If simple case, just do move.  If normal partial, store_one_arg
	     has already loaded the register for us.  In all other cases,
	     load the register(s) from memory.  */

	  else if (nregs == -1)
	    {
	      emit_move_insn (reg, args[i].value);
#ifdef BLOCK_REG_PADDING
	      /* Handle case where we have a value that needs shifting
		 up to the msb.  eg. a QImode value and we're padding
		 upward on a BYTES_BIG_ENDIAN machine.  */
	      if (size < UNITS_PER_WORD
		  && (args[i].locate.where_pad
		      == (BYTES_BIG_ENDIAN ? upward : downward)))
		{
		  rtx x;
		  int shift = (UNITS_PER_WORD - size) * BITS_PER_UNIT;

		  /* Assigning REG here rather than a temp makes CALL_FUSAGE
		     report the whole reg as used.  Strictly speaking, the
		     call only uses SIZE bytes at the msb end, but it doesn't
		     seem worth generating rtl to say that.  */
		  reg = gen_rtx_REG (word_mode, REGNO (reg));
		  x = expand_shift (LSHIFT_EXPR, word_mode, reg,
				    build_int_cst (NULL_TREE, shift),
				    reg, 1);
		  if (x != reg)
		    emit_move_insn (reg, x);
		}
#endif
	    }

	  /* If we have pre-computed the values to put in the registers in
	     the case of non-aligned structures, copy them in now.  */

	  else if (args[i].n_aligned_regs != 0)
	    for (j = 0; j < args[i].n_aligned_regs; j++)
	      emit_move_insn (gen_rtx_REG (word_mode, REGNO (reg) + j),
			      args[i].aligned_regs[j]);

	  else if (partial == 0 || args[i].pass_on_stack)
	    {
	      rtx mem = validize_mem (args[i].value);

	      /* Check for overlap with already clobbered argument area.  */
	      if (is_sibcall
		  && mem_overlaps_already_clobbered_arg_p (XEXP (args[i].value, 0),
							   size))
		*sibcall_failure = 1;

	      /* Handle a BLKmode that needs shifting.  */
	      if (nregs == 1 && size < UNITS_PER_WORD
#ifdef BLOCK_REG_PADDING
		  && args[i].locate.where_pad == downward
#else
		  && BYTES_BIG_ENDIAN
#endif
		  )
		{
		  rtx tem = operand_subword_force (mem, 0, args[i].mode);
		  rtx ri = gen_rtx_REG (word_mode, REGNO (reg));
		  rtx x = gen_reg_rtx (word_mode);
		  int shift = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
		  enum tree_code dir = BYTES_BIG_ENDIAN ? RSHIFT_EXPR
							: LSHIFT_EXPR;

		  emit_move_insn (x, tem);
		  x = expand_shift (dir, word_mode, x,
				    build_int_cst (NULL_TREE, shift),
				    ri, 1);
		  if (x != ri)
		    emit_move_insn (ri, x);
		}
	      else
		move_block_to_reg (REGNO (reg), mem, nregs, args[i].mode);
	    }

	  /* When a parameter is a block, and perhaps in other cases, it is
	     possible that it did a load from an argument slot that was
	     already clobbered.  */
	  if (is_sibcall
	      && check_sibcall_argument_overlap (before_arg, &args[i], 0))
	    *sibcall_failure = 1;

	  /* Handle calls that pass values in multiple non-contiguous
	     locations.  The Irix 6 ABI has examples of this.  */
	  if (GET_CODE (reg) == PARALLEL)
	    use_group_regs (call_fusage, reg);
	  else if (nregs == -1)
	    use_reg (call_fusage, reg);
	  else if (nregs > 0)
	    use_regs (call_fusage, REGNO (reg), nregs);
	}
    }
}
1706 /* We need to pop PENDING_STACK_ADJUST bytes. But, if the arguments
1707 wouldn't fill up an even multiple of PREFERRED_UNIT_STACK_BOUNDARY
1708 bytes, then we would need to push some additional bytes to pad the
1709 arguments. So, we compute an adjust to the stack pointer for an
1710 amount that will leave the stack under-aligned by UNADJUSTED_ARGS_SIZE
1711 bytes. Then, when the arguments are pushed the stack will be perfectly
1712 aligned. ARGS_SIZE->CONSTANT is set to the number of bytes that should
1713 be popped after the call. Returns the adjustment. */
1715 static int
1716 combine_pending_stack_adjustment_and_call (int unadjusted_args_size,
1717 struct args_size *args_size,
1718 unsigned int preferred_unit_stack_boundary)
1720 /* The number of bytes to pop so that the stack will be
1721 under-aligned by UNADJUSTED_ARGS_SIZE bytes. */
1722 HOST_WIDE_INT adjustment;
1723 /* The alignment of the stack after the arguments are pushed, if we
1724 just pushed the arguments without adjust the stack here. */
1725 unsigned HOST_WIDE_INT unadjusted_alignment;
1727 unadjusted_alignment
1728 = ((stack_pointer_delta + unadjusted_args_size)
1729 % preferred_unit_stack_boundary);
1731 /* We want to get rid of as many of the PENDING_STACK_ADJUST bytes
1732 as possible -- leaving just enough left to cancel out the
1733 UNADJUSTED_ALIGNMENT. In other words, we want to ensure that the
1734 PENDING_STACK_ADJUST is non-negative, and congruent to
1735 -UNADJUSTED_ALIGNMENT modulo the PREFERRED_UNIT_STACK_BOUNDARY. */
1737 /* Begin by trying to pop all the bytes. */
1738 unadjusted_alignment
1739 = (unadjusted_alignment
1740 - (pending_stack_adjust % preferred_unit_stack_boundary));
1741 adjustment = pending_stack_adjust;
1742 /* Push enough additional bytes that the stack will be aligned
1743 after the arguments are pushed. */
1744 if (preferred_unit_stack_boundary > 1)
1746 if (unadjusted_alignment > 0)
1747 adjustment -= preferred_unit_stack_boundary - unadjusted_alignment;
1748 else
1749 adjustment += unadjusted_alignment;
1752 /* Now, set ARGS_SIZE->CONSTANT so that we pop the right number of
1753 bytes after the call. The right number is the entire
1754 PENDING_STACK_ADJUST less our ADJUSTMENT plus the amount required
1755 by the arguments in the first place. */
1756 args_size->constant
1757 = pending_stack_adjust - adjustment + unadjusted_args_size;
1759 return adjustment;
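/* Worked example, for illustration only (not from the original source):
   with PREFERRED_UNIT_STACK_BOUNDARY == 16, stack_pointer_delta == 24,
   PENDING_STACK_ADJUST == 20 and UNADJUSTED_ARGS_SIZE == 8:

       unadjusted_alignment = (24 + 8) % 16 = 0
       unadjusted_alignment -= 20 % 16        -> -4
       adjustment = 20 + (-4) = 16

   Popping 16 bytes leaves stack_pointer_delta == 8, and pushing the
   8 bytes of arguments brings it to 16, a multiple of the boundary.
   ARGS_SIZE->CONSTANT becomes 20 - 16 + 8 = 12, the number of bytes
   to pop after the call.  */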
1762 /* Scan expression X to see whether it dereferences any argument slots
1763 we have already clobbered with tail call arguments (as noted in the
1764 stored_args_map bitmap).
1765 Return nonzero if X dereferences such an argument slot,
1766 zero otherwise. */
1768 static int
1769 check_sibcall_argument_overlap_1 (rtx x)
1771 RTX_CODE code;
1772 int i, j;
1773 const char *fmt;
1775 if (x == NULL_RTX)
1776 return 0;
1778 code = GET_CODE (x);
1780 if (code == MEM)
1781 return mem_overlaps_already_clobbered_arg_p (XEXP (x, 0),
1782 GET_MODE_SIZE (GET_MODE (x)));
1784 /* Scan all subexpressions. */
1785 fmt = GET_RTX_FORMAT (code);
1786 for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
1788 if (*fmt == 'e')
1790 if (check_sibcall_argument_overlap_1 (XEXP (x, i)))
1791 return 1;
1793 else if (*fmt == 'E')
1795 for (j = 0; j < XVECLEN (x, i); j++)
1796 if (check_sibcall_argument_overlap_1 (XVECEXP (x, i, j)))
1797 return 1;
1800 return 0;
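/* For illustration only (not from the original source): if X contains
   (mem:SI (plus (reg argp) (const_int 8))), the MEM case above asks
   mem_overlaps_already_clobbered_arg_p whether any of bytes 8..11 of
   the argument area is already marked in stored_args_map; a hit means
   the load would read an argument slot we have overwritten, so the
   sibcall attempt must be abandoned.  */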
1803 /* Scan the sequence after INSN to see whether it dereferences any
1804 argument slots already clobbered by tail call arguments (as noted in
1805 the stored_args_map bitmap). If MARK_STORED_ARGS_MAP is nonzero, add
1806 the stack slots for ARG to the stored_args_map bitmap afterwards (when
1807 ARG is a register, MARK_STORED_ARGS_MAP should be 0). Return nonzero
1808 if the sequence after INSN dereferences such argument slots, zero otherwise. */
1810 static int
1811 check_sibcall_argument_overlap (rtx insn, struct arg_data *arg, int mark_stored_args_map)
1813 int low, high;
1815 if (insn == NULL_RTX)
1816 insn = get_insns ();
1817 else
1818 insn = NEXT_INSN (insn);
1820 for (; insn; insn = NEXT_INSN (insn))
1821 if (INSN_P (insn)
1822 && check_sibcall_argument_overlap_1 (PATTERN (insn)))
1823 break;
1825 if (mark_stored_args_map)
1827 #ifdef ARGS_GROW_DOWNWARD
1828 low = -arg->locate.slot_offset.constant - arg->locate.size.constant;
1829 #else
1830 low = arg->locate.slot_offset.constant;
1831 #endif
1833 for (high = low + arg->locate.size.constant; low < high; low++)
1834 SET_BIT (stored_args_map, low);
1836 return insn != NULL_RTX;
1839 /* Given that a function returns a value of mode MODE at the most
1840 significant end of hard register VALUE, shift VALUE left or right
1841 as specified by LEFT_P. Return true if some action was needed. */
1843 bool
1844 shift_return_value (enum machine_mode mode, bool left_p, rtx value)
1846 HOST_WIDE_INT shift;
1848 gcc_assert (REG_P (value) && HARD_REGISTER_P (value));
1849 shift = GET_MODE_BITSIZE (GET_MODE (value)) - GET_MODE_BITSIZE (mode);
1850 if (shift == 0)
1851 return false;
1853 /* Use ashr rather than lshr for right shifts. This is for the benefit
1854 of the MIPS port, which requires SImode values to be sign-extended
1855 when stored in 64-bit registers. */
1856 if (!force_expand_binop (GET_MODE (value), left_p ? ashl_optab : ashr_optab,
1857 value, GEN_INT (shift), value, 1, OPTAB_WIDEN))
1858 gcc_unreachable ();
1859 return true;
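/* For illustration only (not from the original source): for an SImode
   value returned at the msb end of a 64-bit hard register, shift is
   64 - 32 == 32, so a single 32-bit shift (arithmetic right when LEFT_P
   is false, left otherwise) moves the value between the msb and lsb
   ends of VALUE.  */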
1862 /* If X is a likely-spilled register value, copy it to a pseudo
1863 register and return that register. Return X otherwise. */
1865 static rtx
1866 avoid_likely_spilled_reg (rtx x)
1868 rtx new;
1870 if (REG_P (x)
1871 && HARD_REGISTER_P (x)
1872 && CLASS_LIKELY_SPILLED_P (REGNO_REG_CLASS (REGNO (x))))
1874 /* Make sure that we generate a REG rather than a CONCAT.
1875 Moves into CONCATs can need nontrivial instructions,
1876 and the whole point of this function is to avoid
1877 using the hard register directly in such a situation. */
1878 generating_concat_p = 0;
1879 new = gen_reg_rtx (GET_MODE (x));
1880 generating_concat_p = 1;
1881 emit_move_insn (new, x);
1882 return new;
1884 return x;
1887 /* Generate all the code for a CALL_EXPR exp
1888 and return an rtx for its value.
1889 Store the value in TARGET (specified as an rtx) if convenient.
1890 If the value is stored in TARGET then TARGET is returned.
1891 If IGNORE is nonzero, then we ignore the value of the function call. */
1893 rtx
1894 expand_call (tree exp, rtx target, int ignore)
1896 /* Nonzero if we are currently expanding a call. */
1897 static int currently_expanding_call = 0;
1899 /* RTX for the function to be called. */
1900 rtx funexp;
1901 /* Sequence of insns to perform a normal "call". */
1902 rtx normal_call_insns = NULL_RTX;
1903 /* Sequence of insns to perform a tail "call". */
1904 rtx tail_call_insns = NULL_RTX;
1905 /* Data type of the function. */
1906 tree funtype;
1907 tree type_arg_types;
1908 /* Declaration of the function being called,
1909 or 0 if the function is computed (not known by name). */
1910 tree fndecl = 0;
1911 /* The type of the function being called. */
1912 tree fntype;
1913 bool try_tail_call = CALL_EXPR_TAILCALL (exp);
1914 int pass;
1916 /* Register in which non-BLKmode value will be returned,
1917 or 0 if no value or if value is BLKmode. */
1918 rtx valreg;
1919 /* Address where we should return a BLKmode value;
1920 0 if value not BLKmode. */
1921 rtx structure_value_addr = 0;
1922 /* Nonzero if that address is being passed by treating it as
1923 an extra, implicit first parameter. Otherwise,
1924 it is passed by being copied directly into struct_value_rtx. */
1925 int structure_value_addr_parm = 0;
1926 /* Holds the value of implicit argument for the struct value. */
1927 tree structure_value_addr_value = NULL_TREE;
1928 /* Size of aggregate value wanted, or zero if none wanted
1929 or if we are using the non-reentrant PCC calling convention
1930 or expecting the value in registers. */
1931 HOST_WIDE_INT struct_value_size = 0;
1932 /* Nonzero if called function returns an aggregate in memory PCC style,
1933 by returning the address of where to find it. */
1934 int pcc_struct_value = 0;
1935 rtx struct_value = 0;
1937 /* Number of actual parameters in this call, including struct value addr. */
1938 int num_actuals;
1939 /* Number of named args. Args after this are anonymous ones
1940 and they must all go on the stack. */
1941 int n_named_args;
1942 /* Number of complex actual arguments that need to be split. */
1943 int num_complex_actuals = 0;
1945 /* Vector of information about each argument.
1946 Arguments are numbered in the order they will be pushed,
1947 not the order they are written. */
1948 struct arg_data *args;
1950 /* Total size in bytes of all the stack-parms scanned so far. */
1951 struct args_size args_size;
1952 struct args_size adjusted_args_size;
1953 /* Size of arguments before any adjustments (such as rounding). */
1954 int unadjusted_args_size;
1955 /* Data on reg parms scanned so far. */
1956 CUMULATIVE_ARGS args_so_far;
1957 /* Nonzero if a reg parm has been scanned. */
1958 int reg_parm_seen;
1961 /* Nonzero if we must avoid push-insns in the args for this call.
1962 If stack space is allocated for register parameters, but not by the
1963 caller, then it is preallocated in the fixed part of the stack frame.
1964 So the entire argument block must then be preallocated (i.e., we
1965 ignore PUSH_ROUNDING in that case). */
1967 int must_preallocate = !PUSH_ARGS;
1969 /* Size of the stack reserved for parameter registers. */
1970 int reg_parm_stack_space = 0;
1972 /* Address of space preallocated for stack parms
1973 (on machines that lack push insns), or 0 if space not preallocated. */
1974 rtx argblock = 0;
1976 /* Mask of ECF_ flags. */
1977 int flags = 0;
1978 #ifdef REG_PARM_STACK_SPACE
1979 /* Define the boundary of the register parm stack space that needs to be
1980 saved, if any. */
1981 int low_to_save, high_to_save;
1982 rtx save_area = 0; /* Place that it is saved */
1983 #endif
1985 int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
1986 char *initial_stack_usage_map = stack_usage_map;
1987 char *stack_usage_map_buf = NULL;
1989 int old_stack_allocated;
1991 /* State variables to track stack modifications. */
1992 rtx old_stack_level = 0;
1993 int old_stack_arg_under_construction = 0;
1994 int old_pending_adj = 0;
1995 int old_inhibit_defer_pop = inhibit_defer_pop;
1997 /* Some stack pointer alterations we make are performed via
1998 allocate_dynamic_stack_space. This modifies the stack_pointer_delta,
1999 which we then also need to save/restore along the way. */
2000 int old_stack_pointer_delta = 0;
2002 rtx call_fusage;
2003 tree p = CALL_EXPR_FN (exp);
2004 tree addr = CALL_EXPR_FN (exp);
2005 int i;
2006 /* The alignment of the stack, in bits. */
2007 unsigned HOST_WIDE_INT preferred_stack_boundary;
2008 /* The alignment of the stack, in bytes. */
2009 unsigned HOST_WIDE_INT preferred_unit_stack_boundary;
2010 /* The static chain value to use for this call. */
2011 rtx static_chain_value;
2012 /* See if this is a "nothrow" function call. */
2013 if (TREE_NOTHROW (exp))
2014 flags |= ECF_NOTHROW;
2016 /* See if we can find a DECL-node for the actual function, and get the
2017 function attributes (flags) from the function decl or type node. */
2018 fndecl = get_callee_fndecl (exp);
2019 if (fndecl)
2021 fntype = TREE_TYPE (fndecl);
2022 flags |= flags_from_decl_or_type (fndecl);
2024 else
2026 fntype = TREE_TYPE (TREE_TYPE (p));
2027 flags |= flags_from_decl_or_type (fntype);
2030 struct_value = targetm.calls.struct_value_rtx (fntype, 0);
2032 /* Warn if this value is an aggregate type,
2033 regardless of which calling convention we are using for it. */
2034 if (AGGREGATE_TYPE_P (TREE_TYPE (exp)))
2035 warning (OPT_Waggregate_return, "function call has aggregate value");
2037 /* If the result of a non-looping pure or const function call is
2038 ignored (or void), and none of its arguments are volatile, we can
2039 avoid expanding the call and just evaluate the arguments for
2040 side-effects. */
2041 if ((flags & (ECF_CONST | ECF_PURE))
2042 && (!(flags & ECF_LOOPING_CONST_OR_PURE))
2043 && (ignore || target == const0_rtx
2044 || TYPE_MODE (TREE_TYPE (exp)) == VOIDmode))
2046 bool volatilep = false;
2047 tree arg;
2048 call_expr_arg_iterator iter;
2050 FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
2051 if (TREE_THIS_VOLATILE (arg))
2053 volatilep = true;
2054 break;
2057 if (! volatilep)
2059 FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
2060 expand_expr (arg, const0_rtx, VOIDmode, EXPAND_NORMAL);
2061 return const0_rtx;
2065 #ifdef REG_PARM_STACK_SPACE
2066 reg_parm_stack_space = REG_PARM_STACK_SPACE (fndecl);
2067 #endif
2069 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE : TREE_TYPE (fndecl)))
2070 && reg_parm_stack_space > 0 && PUSH_ARGS)
2071 must_preallocate = 1;
2073 /* Set up a place to return a structure. */
2075 /* Cater to broken compilers. */
2076 if (aggregate_value_p (exp, fndecl))
2078 /* This call returns a big structure. */
2079 flags &= ~(ECF_CONST | ECF_PURE | ECF_LOOPING_CONST_OR_PURE
2080 | ECF_LIBCALL_BLOCK);
2082 #ifdef PCC_STATIC_STRUCT_RETURN
2084 pcc_struct_value = 1;
2086 #else /* not PCC_STATIC_STRUCT_RETURN */
2088 struct_value_size = int_size_in_bytes (TREE_TYPE (exp));
2090 if (target && MEM_P (target) && CALL_EXPR_RETURN_SLOT_OPT (exp))
2091 structure_value_addr = XEXP (target, 0);
2092 else
2094 /* For variable-sized objects, we must be called with a target
2095 specified. If we were to allocate space on the stack here,
2096 we would have no way of knowing when to free it. */
2097 rtx d = assign_temp (TREE_TYPE (exp), 0, 1, 1);
2099 mark_temp_addr_taken (d);
2100 structure_value_addr = XEXP (d, 0);
2101 target = 0;
2104 #endif /* not PCC_STATIC_STRUCT_RETURN */
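/* For illustration only (not from the original source): conceptually,
   for a call such as

       struct big { int x[8]; };
       struct big s = f ();

   the expansion behaves as if the source had been f (&s): the address
   of the return slot becomes structure_value_addr and, when
   struct_value is 0, is passed as an extra leading parameter below.  */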
2107 /* Figure out the amount to which the stack should be aligned. */
2108 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
2109 if (fndecl)
2111 struct cgraph_rtl_info *i = cgraph_rtl_info (fndecl);
2112 if (i && i->preferred_incoming_stack_boundary)
2113 preferred_stack_boundary = i->preferred_incoming_stack_boundary;
2116 /* Operand 0 is a pointer-to-function; get the type of the function. */
2117 funtype = TREE_TYPE (addr);
2118 gcc_assert (POINTER_TYPE_P (funtype));
2119 funtype = TREE_TYPE (funtype);
2121 /* Count whether there are actual complex arguments that need to be split
2122 into their real and imaginary parts. Munge the type_arg_types
2123 appropriately here as well. */
2124 if (targetm.calls.split_complex_arg)
2126 call_expr_arg_iterator iter;
2127 tree arg;
2128 FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
2130 tree type = TREE_TYPE (arg);
2131 if (type && TREE_CODE (type) == COMPLEX_TYPE
2132 && targetm.calls.split_complex_arg (type))
2133 num_complex_actuals++;
2135 type_arg_types = split_complex_types (TYPE_ARG_TYPES (funtype));
2137 else
2138 type_arg_types = TYPE_ARG_TYPES (funtype);
2140 if (flags & ECF_MAY_BE_ALLOCA)
2141 cfun->calls_alloca = 1;
2143 /* If struct_value_rtx is 0, it means pass the address
2144 as if it were an extra parameter. Put the argument expression
2145 in structure_value_addr_value. */
2146 if (structure_value_addr && struct_value == 0)
2148 /* If structure_value_addr is a REG other than
2149 virtual_outgoing_args_rtx, we can always use it. If it
2150 is not a REG, we must always copy it into a register.
2151 If it is virtual_outgoing_args_rtx, we must copy it to another
2152 register in some cases. */
2153 rtx temp = (!REG_P (structure_value_addr)
2154 || (ACCUMULATE_OUTGOING_ARGS
2155 && stack_arg_under_construction
2156 && structure_value_addr == virtual_outgoing_args_rtx)
2157 ? copy_addr_to_reg (convert_memory_address
2158 (Pmode, structure_value_addr))
2159 : structure_value_addr);
2161 structure_value_addr_value =
2162 make_tree (build_pointer_type (TREE_TYPE (funtype)), temp);
2163 structure_value_addr_parm = 1;
2166 /* Count the arguments and set NUM_ACTUALS. */
2167 num_actuals =
2168 call_expr_nargs (exp) + num_complex_actuals + structure_value_addr_parm;
2170 /* Compute number of named args.
2171 First, do a raw count of the args for INIT_CUMULATIVE_ARGS. */
2173 if (type_arg_types != 0)
2174 n_named_args
2175 = (list_length (type_arg_types)
2176 /* Count the struct value address, if it is passed as a parm. */
2177 + structure_value_addr_parm);
2178 else
2179 /* If we know nothing, treat all args as named. */
2180 n_named_args = num_actuals;
2182 /* Start updating where the next arg would go.
2184 On some machines (such as the PA) indirect calls have a different
2185 calling convention than normal calls. The fourth argument in
2186 INIT_CUMULATIVE_ARGS tells the backend if this is an indirect call
2187 or not. */
2188 INIT_CUMULATIVE_ARGS (args_so_far, funtype, NULL_RTX, fndecl, n_named_args);
2190 /* Now possibly adjust the number of named args.
2191 Normally, don't include the last named arg if anonymous args follow.
2192 We do include the last named arg if
2193 targetm.calls.strict_argument_naming() returns nonzero.
2194 (If no anonymous args follow, the result of list_length is actually
2195 one too large. This is harmless.)
2197 If targetm.calls.pretend_outgoing_varargs_named() returns
2198 nonzero, and targetm.calls.strict_argument_naming() returns zero,
2199 this machine will be able to place unnamed args that were passed
2200 in registers into the stack. So treat all args as named. This
2201 allows the insns emitted for a specific argument list to be
2202 independent of the function declaration.
2204 If targetm.calls.pretend_outgoing_varargs_named() returns zero,
2205 we do not have any reliable way to pass unnamed args in
2206 registers, so we must force them into memory. */
2208 if (type_arg_types != 0
2209 && targetm.calls.strict_argument_naming (&args_so_far))
2210 ;
2211 else if (type_arg_types != 0
2212 && ! targetm.calls.pretend_outgoing_varargs_named (&args_so_far))
2213 /* Don't include the last named arg. */
2214 --n_named_args;
2215 else
2216 /* Treat all args as named. */
2217 n_named_args = num_actuals;
2219 /* Make a vector to hold all the information about each arg. */
2220 args = alloca (num_actuals * sizeof (struct arg_data));
2221 memset (args, 0, num_actuals * sizeof (struct arg_data));
2223 /* Build up entries in the ARGS array, compute the size of the
2224 arguments into ARGS_SIZE, etc. */
2225 initialize_argument_information (num_actuals, args, &args_size,
2226 n_named_args, exp,
2227 structure_value_addr_value, fndecl,
2228 &args_so_far, reg_parm_stack_space,
2229 &old_stack_level, &old_pending_adj,
2230 &must_preallocate, &flags,
2231 &try_tail_call, CALL_FROM_THUNK_P (exp));
2233 if (args_size.var)
2235 /* If this function requires a variable-sized argument list, don't
2236 try to make a cse'able block for this call. We may be able to
2237 do this eventually, but it is too complicated to keep track of
2238 what insns go in the cse'able block and which don't. */
2240 flags &= ~ECF_LIBCALL_BLOCK;
2241 must_preallocate = 1;
2244 /* Now make final decision about preallocating stack space. */
2245 must_preallocate = finalize_must_preallocate (must_preallocate,
2246 num_actuals, args,
2247 &args_size);
2249 /* If the structure value address will reference the stack pointer, we
2250 must stabilize it. We don't need to do this if we know that we are
2251 not going to adjust the stack pointer in processing this call. */
2253 if (structure_value_addr
2254 && (reg_mentioned_p (virtual_stack_dynamic_rtx, structure_value_addr)
2255 || reg_mentioned_p (virtual_outgoing_args_rtx,
2256 structure_value_addr))
2257 && (args_size.var
2258 || (!ACCUMULATE_OUTGOING_ARGS && args_size.constant)))
2259 structure_value_addr = copy_to_reg (structure_value_addr);
2261 /* Tail calls can make things harder to debug, and we've traditionally
2262 pushed these optimizations into -O2. Don't try if we're already
2263 expanding a call, as that means we're an argument. Don't try if
2264 there are cleanups, as we know there's code to follow the call. */
2266 if (currently_expanding_call++ != 0
2267 || !flag_optimize_sibling_calls
2268 || args_size.var
2269 || lookup_stmt_eh_region (exp) >= 0
2270 || dbg_cnt (tail_call) == false)
2271 try_tail_call = 0;
2273 /* Other reasons the tail call optimization can fail. */
2274 if (
2275 #ifdef HAVE_sibcall_epilogue
2276 !HAVE_sibcall_epilogue
2277 #else
2278 1
2279 #endif
2280 || !try_tail_call
2281 /* Doing sibling call optimization needs some work, since
2282 structure_value_addr can be allocated on the stack.
2283 It does not seem worth the effort since few optimizable
2284 sibling calls will return a structure. */
2285 || structure_value_addr != NULL_RTX
2286 /* Check whether the target is able to optimize the call
2287 into a sibcall. */
2288 || !targetm.function_ok_for_sibcall (fndecl, exp)
2289 /* Functions that do not return exactly once may not be sibcall
2290 optimized. */
2291 || (flags & (ECF_RETURNS_TWICE | ECF_NORETURN))
2292 || TYPE_VOLATILE (TREE_TYPE (TREE_TYPE (addr)))
2293 /* If the called function is nested in the current one, it might access
2294 some of the caller's arguments, but could clobber them beforehand if
2295 the argument areas are shared. */
2296 || (fndecl && decl_function_context (fndecl) == current_function_decl)
2297 /* If this function requires more stack slots than the current
2298 function, we cannot change it into a sibling call.
2299 crtl->args.pretend_args_size is not part of the
2300 stack allocated by our caller. */
2301 || args_size.constant > (crtl->args.size
2302 - crtl->args.pretend_args_size)
2303 /* If the callee pops its own arguments, then it must pop exactly
2304 the same number of arguments as the current function. */
2305 || (RETURN_POPS_ARGS (fndecl, funtype, args_size.constant)
2306 != RETURN_POPS_ARGS (current_function_decl,
2307 TREE_TYPE (current_function_decl),
2308 crtl->args.size))
2309 || !lang_hooks.decls.ok_for_sibcall (fndecl))
2310 try_tail_call = 0;
2312 /* Ensure current function's preferred stack boundary is at least
2313 what we need. We don't have to increase alignment for recursive
2314 functions. */
2315 if (crtl->preferred_stack_boundary < preferred_stack_boundary
2316 && fndecl != current_function_decl)
2317 crtl->preferred_stack_boundary = preferred_stack_boundary;
2319 preferred_unit_stack_boundary = preferred_stack_boundary / BITS_PER_UNIT;
2321 /* We want to make two insn chains; one for a sibling call, the other
2322 for a normal call. We will select one of the two chains after
2323 initial RTL generation is complete. */
2324 for (pass = try_tail_call ? 0 : 1; pass < 2; pass++)
2326 int sibcall_failure = 0;
2327 /* We want to emit any pending stack adjustments before the tail
2328 recursion "call". That way we know any adjustment after the tail
2329 recursion call can be ignored if we indeed use the tail
2330 call expansion. */
2331 int save_pending_stack_adjust = 0;
2332 int save_stack_pointer_delta = 0;
2333 rtx insns;
2334 rtx before_call, next_arg_reg, after_args;
2336 if (pass == 0)
2338 /* State variables we need to save and restore between
2339 iterations. */
2340 save_pending_stack_adjust = pending_stack_adjust;
2341 save_stack_pointer_delta = stack_pointer_delta;
2343 if (pass)
2344 flags &= ~ECF_SIBCALL;
2345 else
2346 flags |= ECF_SIBCALL;
2348 /* Other state variables that we must reinitialize each time
2349 through the loop (that are not initialized by the loop itself). */
2350 argblock = 0;
2351 call_fusage = 0;
2353 /* Start a new sequence for the normal call case.
2355 From this point on, if the sibling call fails, we want to set
2356 sibcall_failure instead of continuing the loop. */
2357 start_sequence ();
2359 /* Don't let pending stack adjusts add up to too much.
2360 Also, do all pending adjustments now if there is any chance
2361 this might be a call to alloca or if we are expanding a sibling
2362 call sequence.
2363 Also do the adjustments before a throwing call, otherwise
2364 exception handling can fail; PR 19225. */
2365 if (pending_stack_adjust >= 32
2366 || (pending_stack_adjust > 0
2367 && (flags & ECF_MAY_BE_ALLOCA))
2368 || (pending_stack_adjust > 0
2369 && flag_exceptions && !(flags & ECF_NOTHROW))
2370 || pass == 0)
2371 do_pending_stack_adjust ();
2373 /* When calling a const function, we must pop the stack args right away,
2374 so that the pop is deleted or moved with the call. */
2375 if (pass && (flags & ECF_LIBCALL_BLOCK))
2376 NO_DEFER_POP;
2378 /* Precompute any arguments as needed. */
2379 if (pass)
2380 precompute_arguments (flags, num_actuals, args);
2382 /* Now we are about to start emitting insns that can be deleted
2383 if a libcall is deleted. */
2384 if (pass && (flags & (ECF_LIBCALL_BLOCK | ECF_MALLOC)))
2385 start_sequence ();
2387 if (pass == 0 && crtl->stack_protect_guard)
2388 stack_protect_epilogue ();
2390 adjusted_args_size = args_size;
2391 /* Compute the actual size of the argument block required. The variable
2392 and constant sizes must be combined, the size may have to be rounded,
2393 and there may be a minimum required size. When generating a sibcall
2394 pattern, do not round up, since we'll be re-using whatever space our
2395 caller provided. */
2396 unadjusted_args_size
2397 = compute_argument_block_size (reg_parm_stack_space,
2398 &adjusted_args_size,
2399 fndecl,
2400 (pass == 0 ? 0
2401 : preferred_stack_boundary));
2403 old_stack_allocated = stack_pointer_delta - pending_stack_adjust;
2405 /* The argument block when performing a sibling call is the
2406 incoming argument block. */
2407 if (pass == 0)
2409 argblock = virtual_incoming_args_rtx;
2410 argblock
2411 #ifdef STACK_GROWS_DOWNWARD
2412 = plus_constant (argblock, crtl->args.pretend_args_size);
2413 #else
2414 = plus_constant (argblock, -crtl->args.pretend_args_size);
2415 #endif
2416 stored_args_map = sbitmap_alloc (args_size.constant);
2417 sbitmap_zero (stored_args_map);
2420 /* If we have no actual push instructions, or shouldn't use them,
2421 make space for all args right now. */
2422 else if (adjusted_args_size.var != 0)
2424 if (old_stack_level == 0)
2426 emit_stack_save (SAVE_BLOCK, &old_stack_level, NULL_RTX);
2427 old_stack_pointer_delta = stack_pointer_delta;
2428 old_pending_adj = pending_stack_adjust;
2429 pending_stack_adjust = 0;
2430 /* stack_arg_under_construction says whether a stack arg is
2431 being constructed at the old stack level. Pushing the stack
2432 gets a clean outgoing argument block. */
2433 old_stack_arg_under_construction = stack_arg_under_construction;
2434 stack_arg_under_construction = 0;
2436 argblock = push_block (ARGS_SIZE_RTX (adjusted_args_size), 0, 0);
2438 else
2440 /* Note that we must go through the motions of allocating an argument
2441 block even if the size is zero because we may be storing args
2442 in the area reserved for register arguments, which may be part of
2443 the stack frame. */
2445 int needed = adjusted_args_size.constant;
2447 /* Store the maximum argument space used. It will be pushed by
2448 the prologue (if ACCUMULATE_OUTGOING_ARGS, or stack overflow
2449 checking). */
2451 if (needed > crtl->outgoing_args_size)
2452 crtl->outgoing_args_size = needed;
2454 if (must_preallocate)
2456 if (ACCUMULATE_OUTGOING_ARGS)
2458 /* Since the stack pointer will never be pushed, it is
2459 possible for the evaluation of a parm to clobber
2460 something we have already written to the stack.
2461 Since most function calls on RISC machines do not use
2462 the stack, this is uncommon, but must work correctly.
2464 Therefore, we save any area of the stack that was already
2465 written and that we are using. Here we set up to do this
2466 by making a new stack usage map from the old one. The
2467 actual save will be done by store_one_arg.
2469 Another approach might be to try to reorder the argument
2470 evaluations to avoid this conflicting stack usage. */
2472 /* Since we will be writing into the entire argument area,
2473 the map must be allocated for its entire size, not just
2474 the part that is the responsibility of the caller. */
2475 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE : TREE_TYPE (fndecl))))
2476 needed += reg_parm_stack_space;
2478 #ifdef ARGS_GROW_DOWNWARD
2479 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
2480 needed + 1);
2481 #else
2482 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
2483 needed);
2484 #endif
2485 if (stack_usage_map_buf)
2486 free (stack_usage_map_buf);
2487 stack_usage_map_buf = XNEWVEC (char, highest_outgoing_arg_in_use);
2488 stack_usage_map = stack_usage_map_buf;
2490 if (initial_highest_arg_in_use)
2491 memcpy (stack_usage_map, initial_stack_usage_map,
2492 initial_highest_arg_in_use);
2494 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
2495 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
2496 (highest_outgoing_arg_in_use
2497 - initial_highest_arg_in_use));
2498 needed = 0;
2500 /* The address of the outgoing argument list must not be
2501 copied to a register here, because argblock would be left
2502 pointing to the wrong place after the call to
2503 allocate_dynamic_stack_space below. */
2505 argblock = virtual_outgoing_args_rtx;
2507 else
2509 if (inhibit_defer_pop == 0)
2511 /* Try to reuse some or all of the pending_stack_adjust
2512 to get this space. */
2513 needed
2514 = (combine_pending_stack_adjustment_and_call
2515 (unadjusted_args_size,
2516 &adjusted_args_size,
2517 preferred_unit_stack_boundary));
2519 /* combine_pending_stack_adjustment_and_call computes
2520 an adjustment before the arguments are allocated.
2521 Account for them and see whether or not the stack
2522 needs to go up or down. */
2523 needed = unadjusted_args_size - needed;
2525 if (needed < 0)
2527 /* We're releasing stack space. */
2528 /* ??? We can avoid any adjustment at all if we're
2529 already aligned. FIXME. */
2530 pending_stack_adjust = -needed;
2531 do_pending_stack_adjust ();
2532 needed = 0;
2534 else
2535 /* We need to allocate space. We'll do that in
2536 push_block below. */
2537 pending_stack_adjust = 0;
2540 /* Special case this because the overhead of `push_block'
2541 here is non-trivial. */
2542 if (needed == 0)
2543 argblock = virtual_outgoing_args_rtx;
2544 else
2546 argblock = push_block (GEN_INT (needed), 0, 0);
2547 #ifdef ARGS_GROW_DOWNWARD
2548 argblock = plus_constant (argblock, needed);
2549 #endif
2552 /* We only really need to call `copy_to_reg' in the case
2553 where push insns are going to be used to pass ARGBLOCK
2554 to a function call in ARGS. In that case, the stack
2555 pointer changes value from the allocation point to the
2556 call point, and hence the value of
2557 VIRTUAL_OUTGOING_ARGS_RTX changes as well. But might
2558 as well always do it. */
2559 argblock = copy_to_reg (argblock);
2564 if (ACCUMULATE_OUTGOING_ARGS)
2566 /* The save/restore code in store_one_arg handles all
2567 cases except one: a constructor call (including a C
2568 function returning a BLKmode struct) to initialize
2569 an argument. */
2570 if (stack_arg_under_construction)
2572 rtx push_size
2573 = GEN_INT (adjusted_args_size.constant
2574 + (OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE
2575 : TREE_TYPE (fndecl))) ? 0
2576 : reg_parm_stack_space));
2577 if (old_stack_level == 0)
2579 emit_stack_save (SAVE_BLOCK, &old_stack_level,
2580 NULL_RTX);
2581 old_stack_pointer_delta = stack_pointer_delta;
2582 old_pending_adj = pending_stack_adjust;
2583 pending_stack_adjust = 0;
2584 /* stack_arg_under_construction says whether a stack
2585 arg is being constructed at the old stack level.
2586 Pushing the stack gets a clean outgoing argument
2587 block. */
2588 old_stack_arg_under_construction
2589 = stack_arg_under_construction;
2590 stack_arg_under_construction = 0;
2591 /* Make a new map for the new argument list. */
2592 if (stack_usage_map_buf)
2593 free (stack_usage_map_buf);
2594 stack_usage_map_buf = XCNEWVEC (char, highest_outgoing_arg_in_use);
2595 stack_usage_map = stack_usage_map_buf;
2596 highest_outgoing_arg_in_use = 0;
2598 allocate_dynamic_stack_space (push_size, NULL_RTX,
2599 BITS_PER_UNIT);
2602 /* If argument evaluation might modify the stack pointer,
2603 copy the address of the argument list to a register. */
2604 for (i = 0; i < num_actuals; i++)
2605 if (args[i].pass_on_stack)
2607 argblock = copy_addr_to_reg (argblock);
2608 break;
2612 compute_argument_addresses (args, argblock, num_actuals);
2614 /* If we push args individually in reverse order, perform stack alignment
2615 before the first push (the last arg). */
2616 if (PUSH_ARGS_REVERSED && argblock == 0
2617 && adjusted_args_size.constant != unadjusted_args_size)
2619 /* When the stack adjustment is pending, we get better code
2620 by combining the adjustments. */
2621 if (pending_stack_adjust
2622 && ! (flags & ECF_LIBCALL_BLOCK)
2623 && ! inhibit_defer_pop)
2625 pending_stack_adjust
2626 = (combine_pending_stack_adjustment_and_call
2627 (unadjusted_args_size,
2628 &adjusted_args_size,
2629 preferred_unit_stack_boundary));
2630 do_pending_stack_adjust ();
2632 else if (argblock == 0)
2633 anti_adjust_stack (GEN_INT (adjusted_args_size.constant
2634 - unadjusted_args_size));
2636 /* Now that the stack is properly aligned, pops can't safely
2637 be deferred during the evaluation of the arguments. */
2638 NO_DEFER_POP;
2640 funexp = rtx_for_function_call (fndecl, addr);
2642 /* Figure out the register where the value, if any, will come back. */
2643 valreg = 0;
2644 if (TYPE_MODE (TREE_TYPE (exp)) != VOIDmode
2645 && ! structure_value_addr)
2647 if (pcc_struct_value)
2648 valreg = hard_function_value (build_pointer_type (TREE_TYPE (exp)),
2649 fndecl, NULL, (pass == 0));
2650 else
2651 valreg = hard_function_value (TREE_TYPE (exp), fndecl, fntype,
2652 (pass == 0));
2654 /* If VALREG is a PARALLEL whose first member has a zero
2655 offset, use that. This is for targets such as m68k that
2656 return the same value in multiple places. */
2657 if (GET_CODE (valreg) == PARALLEL)
2659 rtx elem = XVECEXP (valreg, 0, 0);
2660 rtx where = XEXP (elem, 0);
2661 rtx offset = XEXP (elem, 1);
2662 if (offset == const0_rtx
2663 && GET_MODE (where) == GET_MODE (valreg))
2664 valreg = where;
2668 /* Precompute all register parameters. It isn't safe to compute anything
2669 once we have started filling any specific hard regs. */
2670 precompute_register_parameters (num_actuals, args, &reg_parm_seen);
2672 if (CALL_EXPR_STATIC_CHAIN (exp))
2673 static_chain_value = expand_normal (CALL_EXPR_STATIC_CHAIN (exp));
2674 else
2675 static_chain_value = 0;
2677 #ifdef REG_PARM_STACK_SPACE
2678 /* Save the fixed argument area if it's part of the caller's frame and
2679 is clobbered by argument setup for this call. */
2680 if (ACCUMULATE_OUTGOING_ARGS && pass)
2681 save_area = save_fixed_argument_area (reg_parm_stack_space, argblock,
2682 &low_to_save, &high_to_save);
2683 #endif
2685 /* Now store (and compute if necessary) all non-register parms.
2686 These come before register parms, since they can require block-moves,
2687 which could clobber the registers used for register parms.
2688 Parms which have partial registers are not stored here,
2689 but we do preallocate space here if they want that. */
2691 for (i = 0; i < num_actuals; i++)
2692 if (args[i].reg == 0 || args[i].pass_on_stack)
2694 rtx before_arg = get_last_insn ();
2696 if (store_one_arg (&args[i], argblock, flags,
2697 adjusted_args_size.var != 0,
2698 reg_parm_stack_space)
2699 || (pass == 0
2700 && check_sibcall_argument_overlap (before_arg,
2701 &args[i], 1)))
2702 sibcall_failure = 1;
2704 if (flags & ECF_CONST
2705 && args[i].stack
2706 && args[i].value == args[i].stack)
2707 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
2708 gen_rtx_USE (VOIDmode,
2709 args[i].value),
2710 call_fusage);
2713 /* If we have a parm that is passed in registers but not in memory
2714 and whose alignment does not permit a direct copy into registers,
2715 make a group of pseudos that correspond to each register that we
2716 will later fill. */
2717 if (STRICT_ALIGNMENT)
2718 store_unaligned_arguments_into_pseudos (args, num_actuals);
2720 /* Now store any partially-in-registers parm.
2721 This is the last place a block-move can happen. */
2722 if (reg_parm_seen)
2723 for (i = 0; i < num_actuals; i++)
2724 if (args[i].partial != 0 && ! args[i].pass_on_stack)
2726 rtx before_arg = get_last_insn ();
2728 if (store_one_arg (&args[i], argblock, flags,
2729 adjusted_args_size.var != 0,
2730 reg_parm_stack_space)
2731 || (pass == 0
2732 && check_sibcall_argument_overlap (before_arg,
2733 &args[i], 1)))
2734 sibcall_failure = 1;
2737 /* If we pushed args in forward order, perform stack alignment
2738 after pushing the last arg. */
2739 if (!PUSH_ARGS_REVERSED && argblock == 0)
2740 anti_adjust_stack (GEN_INT (adjusted_args_size.constant
2741 - unadjusted_args_size));
2743 /* If register arguments require space on the stack and stack space
2744 was not preallocated, allocate stack space here for arguments
2745 passed in registers. */
2746 if (OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE : TREE_TYPE (fndecl)))
2747 && !ACCUMULATE_OUTGOING_ARGS
2748 && must_preallocate == 0 && reg_parm_stack_space > 0)
2749 anti_adjust_stack (GEN_INT (reg_parm_stack_space));
2751 /* Pass the function the address in which to return a
2752 structure value. */
2753 if (pass != 0 && structure_value_addr && ! structure_value_addr_parm)
2755 structure_value_addr
2756 = convert_memory_address (Pmode, structure_value_addr);
2757 emit_move_insn (struct_value,
2758 force_reg (Pmode,
2759 force_operand (structure_value_addr,
2760 NULL_RTX)));
2762 if (REG_P (struct_value))
2763 use_reg (&call_fusage, struct_value);
2766 after_args = get_last_insn ();
2767 funexp = prepare_call_address (funexp, static_chain_value,
2768 &call_fusage, reg_parm_seen, pass == 0);
2770 load_register_parameters (args, num_actuals, &call_fusage, flags,
2771 pass == 0, &sibcall_failure);
2773 /* Save a pointer to the last insn before the call, so that we can
2774 later safely search backwards to find the CALL_INSN. */
2775 before_call = get_last_insn ();
2777 /* Set up next argument register. For sibling calls on machines
2778 with register windows this should be the incoming register. */
2779 #ifdef FUNCTION_INCOMING_ARG
2780 if (pass == 0)
2781 next_arg_reg = FUNCTION_INCOMING_ARG (args_so_far, VOIDmode,
2782 void_type_node, 1);
2783 else
2784 #endif
2785 next_arg_reg = FUNCTION_ARG (args_so_far, VOIDmode,
2786 void_type_node, 1);
2788 /* All arguments and registers used for the call must be set up by
2789 now! */
2791 /* Stack must be properly aligned now. */
2792 gcc_assert (!pass
2793 || !(stack_pointer_delta % preferred_unit_stack_boundary));
2795 /* Generate the actual call instruction. */
2796 emit_call_1 (funexp, exp, fndecl, funtype, unadjusted_args_size,
2797 adjusted_args_size.constant, struct_value_size,
2798 next_arg_reg, valreg, old_inhibit_defer_pop, call_fusage,
2799 flags, & args_so_far);
2801 /* If the call setup or the call itself overlaps with anything
2802 of the argument setup we probably clobbered our call address.
2803 In that case we can't do sibcalls. */
2804 if (pass == 0
2805 && check_sibcall_argument_overlap (after_args, 0, 0))
2806 sibcall_failure = 1;
2808 /* If a non-BLKmode value is returned at the most significant end
2809 of a register, shift the register right by the appropriate amount
2810 and update VALREG accordingly. BLKmode values are handled by the
2811 group load/store machinery below. */
2812 if (!structure_value_addr
2813 && !pcc_struct_value
2814 && TYPE_MODE (TREE_TYPE (exp)) != BLKmode
2815 && targetm.calls.return_in_msb (TREE_TYPE (exp)))
2817 if (shift_return_value (TYPE_MODE (TREE_TYPE (exp)), false, valreg))
2818 sibcall_failure = 1;
2819 valreg = gen_rtx_REG (TYPE_MODE (TREE_TYPE (exp)), REGNO (valreg));
2822 /* If the call is cse'able, make an appropriate pair of reg-notes around it.
2823 Test valreg so we don't crash; may safely ignore `const'
2824 if return type is void. Disable for PARALLEL return values, because
2825 we have no way to move such values into a pseudo register. */
2826 if (pass && (flags & ECF_LIBCALL_BLOCK))
2828 rtx insns;
2829 rtx insn;
2830 bool failed = valreg == 0 || GET_CODE (valreg) == PARALLEL;
2832 insns = get_insns ();
2834 /* Expansion of block moves may have introduced a loop, which
2835 must not appear inside a libcall block. */
2836 for (insn = insns; insn; insn = NEXT_INSN (insn))
2837 if (JUMP_P (insn))
2838 failed = true;
2840 if (failed)
2842 end_sequence ();
2843 emit_insn (insns);
2845 else
2847 rtx note = 0;
2848 rtx temp = gen_reg_rtx (GET_MODE (valreg));
2850 /* Mark the return value as a pointer if needed. */
2851 if (TREE_CODE (TREE_TYPE (exp)) == POINTER_TYPE)
2852 mark_reg_pointer (temp,
2853 TYPE_ALIGN (TREE_TYPE (TREE_TYPE (exp))));
2855 end_sequence ();
2856 if (flag_unsafe_math_optimizations
2857 && fndecl
2858 && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL
2859 && (DECL_FUNCTION_CODE (fndecl) == BUILT_IN_SQRT
2860 || DECL_FUNCTION_CODE (fndecl) == BUILT_IN_SQRTF
2861 || DECL_FUNCTION_CODE (fndecl) == BUILT_IN_SQRTL))
2862 note = gen_rtx_fmt_e (SQRT,
2863 GET_MODE (temp),
2864 args[0].initial_value);
2865 else
2867 /* Construct an "equal form" for the value which
2868 mentions all the arguments in order as well as
2869 the function name. */
2870 for (i = 0; i < num_actuals; i++)
2871 note = gen_rtx_EXPR_LIST (VOIDmode,
2872 args[i].initial_value, note);
2873 note = gen_rtx_EXPR_LIST (VOIDmode, funexp, note);
2875 emit_libcall_block (insns, temp, valreg, note);
2877 valreg = temp;
2880 else if (pass && (flags & ECF_MALLOC))
2882 rtx temp = gen_reg_rtx (GET_MODE (valreg));
2883 rtx last, insns;
2885 /* The return value from a malloc-like function is a pointer. */
2886 if (TREE_CODE (TREE_TYPE (exp)) == POINTER_TYPE)
2887 mark_reg_pointer (temp, BIGGEST_ALIGNMENT);
2889 emit_move_insn (temp, valreg);
2891 /* The return value from a malloc-like function cannot alias
2892 anything else. */
2893 last = get_last_insn ();
2894 REG_NOTES (last) =
2895 gen_rtx_EXPR_LIST (REG_NOALIAS, temp, REG_NOTES (last));
2897 /* Write out the sequence. */
2898 insns = get_insns ();
2899 end_sequence ();
2900 emit_insn (insns);
2901 valreg = temp;
2904 /* For calls to `setjmp', etc., inform
2905 function.c:setjmp_warnings that it should complain if
2906 nonvolatile values are live. For functions that cannot
2907 return, inform flow that control does not fall through. */
2909 if ((flags & ECF_NORETURN) || pass == 0)
2911 /* The barrier must be emitted
2912 immediately after the CALL_INSN. Some ports emit more
2913 than just a CALL_INSN above, so we must search for it here. */
2915 rtx last = get_last_insn ();
2916 while (!CALL_P (last))
2918 last = PREV_INSN (last);
2919 /* There was no CALL_INSN? */
2920 gcc_assert (last != before_call);
2923 emit_barrier_after (last);
2925 /* Stack adjustments after a noreturn call are dead code.
2926 However when NO_DEFER_POP is in effect, we must preserve
2927 stack_pointer_delta. */
2928 if (inhibit_defer_pop == 0)
2930 stack_pointer_delta = old_stack_allocated;
2931 pending_stack_adjust = 0;
2935 /* If value type not void, return an rtx for the value. */
2937 if (TYPE_MODE (TREE_TYPE (exp)) == VOIDmode
2938 || ignore)
2939 target = const0_rtx;
2940 else if (structure_value_addr)
2942 if (target == 0 || !MEM_P (target))
2944 target
2945 = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (exp)),
2946 memory_address (TYPE_MODE (TREE_TYPE (exp)),
2947 structure_value_addr));
2948 set_mem_attributes (target, exp, 1);
2951 else if (pcc_struct_value)
2953 /* This is the special C++ case where we need to
2954 know what the true target was. We take care to
2955 never use this value more than once in one expression. */
2956 target = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (exp)),
2957 copy_to_reg (valreg));
2958 set_mem_attributes (target, exp, 1);
2960 /* Handle calls that return values in multiple non-contiguous locations.
2961 The Irix 6 ABI has examples of this. */
2962 else if (GET_CODE (valreg) == PARALLEL)
2964 if (target == 0)
2966 /* This will only be assigned once, so it can be readonly. */
2967 tree nt = build_qualified_type (TREE_TYPE (exp),
2968 (TYPE_QUALS (TREE_TYPE (exp))
2969 | TYPE_QUAL_CONST));
2971 target = assign_temp (nt, 0, 1, 1);
2974 if (! rtx_equal_p (target, valreg))
2975 emit_group_store (target, valreg, TREE_TYPE (exp),
2976 int_size_in_bytes (TREE_TYPE (exp)));
2978 /* We cannot support sibling calls for this case. */
2979 sibcall_failure = 1;
2981 else if (target
2982 && GET_MODE (target) == TYPE_MODE (TREE_TYPE (exp))
2983 && GET_MODE (target) == GET_MODE (valreg))
2985 bool may_overlap = false;
2987 /* We have to copy a return value in a CLASS_LIKELY_SPILLED hard
2988 reg to a plain register. */
2989 if (!REG_P (target) || HARD_REGISTER_P (target))
2990 valreg = avoid_likely_spilled_reg (valreg);
2992 /* If TARGET is a MEM in the argument area, and we have
2993 saved part of the argument area, then we can't store
2994 directly into TARGET as it may get overwritten when we
2995 restore the argument save area below. Don't work too
2996 hard though and simply force TARGET to a register if it
2997 is a MEM; the optimizer is quite likely to sort it out. */
2998 if (ACCUMULATE_OUTGOING_ARGS && pass && MEM_P (target))
2999 for (i = 0; i < num_actuals; i++)
3000 if (args[i].save_area)
3002 may_overlap = true;
3003 break;
3006 if (may_overlap)
3007 target = copy_to_reg (valreg);
3008 else
3010 /* TARGET and VALREG cannot be equal at this point
3011 because the latter would not have
3012 REG_FUNCTION_VALUE_P true, while the former would if
3013 it were referring to the same register.
3015 If they refer to the same register, this move will be
3016 a no-op, except when function inlining is being
3017 done. */
3018 emit_move_insn (target, valreg);
3020 /* If we are setting a MEM, this code must be executed.
3021 Since it is emitted after the call insn, sibcall
3022 optimization cannot be performed in that case. */
3023 if (MEM_P (target))
3024 sibcall_failure = 1;
3027 else if (TYPE_MODE (TREE_TYPE (exp)) == BLKmode)
3029 target = copy_blkmode_from_reg (target, valreg, TREE_TYPE (exp));
3031 /* We cannot support sibling calls for this case. */
3032 sibcall_failure = 1;
3034 else
3035 target = copy_to_reg (avoid_likely_spilled_reg (valreg));
3037 if (targetm.calls.promote_function_return(funtype))
3039 /* If we promoted this return value, make the proper SUBREG.
3040 TARGET might be const0_rtx here, so be careful. */
3041 if (REG_P (target)
3042 && TYPE_MODE (TREE_TYPE (exp)) != BLKmode
3043 && GET_MODE (target) != TYPE_MODE (TREE_TYPE (exp)))
3045 tree type = TREE_TYPE (exp);
3046 int unsignedp = TYPE_UNSIGNED (type);
3047 int offset = 0;
3048 enum machine_mode pmode;
3050 pmode = promote_mode (type, TYPE_MODE (type), &unsignedp, 1);
3051 /* If we don't promote as expected, something is wrong. */
3052 gcc_assert (GET_MODE (target) == pmode);
3054 if ((WORDS_BIG_ENDIAN || BYTES_BIG_ENDIAN)
3055 && (GET_MODE_SIZE (GET_MODE (target))
3056 > GET_MODE_SIZE (TYPE_MODE (type))))
3058 offset = GET_MODE_SIZE (GET_MODE (target))
3059 - GET_MODE_SIZE (TYPE_MODE (type));
3060 if (! BYTES_BIG_ENDIAN)
3061 offset = (offset / UNITS_PER_WORD) * UNITS_PER_WORD;
3062 else if (! WORDS_BIG_ENDIAN)
3063 offset %= UNITS_PER_WORD;
3065 target = gen_rtx_SUBREG (TYPE_MODE (type), target, offset);
3066 SUBREG_PROMOTED_VAR_P (target) = 1;
3067 SUBREG_PROMOTED_UNSIGNED_SET (target, unsignedp);
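/* For illustration only (not from the original source): on a 64-bit
   target with both WORDS_BIG_ENDIAN and BYTES_BIG_ENDIAN set, an SImode
   value promoted to a DImode TARGET gives offset = 8 - 4 = 4; neither
   correction applies, so the code builds (subreg:SI (reg:DI ...) 4),
   naming the four low-order bytes where the promoted value lives.  */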
3071 /* If the size of the args is variable or this was a constructor call for a
3072 stack argument, restore the saved stack-pointer value. */
3074 if (old_stack_level)
3076 emit_stack_restore (SAVE_BLOCK, old_stack_level, NULL_RTX);
3077 stack_pointer_delta = old_stack_pointer_delta;
3078 pending_stack_adjust = old_pending_adj;
3079 old_stack_allocated = stack_pointer_delta - pending_stack_adjust;
3080 stack_arg_under_construction = old_stack_arg_under_construction;
3081 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
3082 stack_usage_map = initial_stack_usage_map;
3083 sibcall_failure = 1;
3085 else if (ACCUMULATE_OUTGOING_ARGS && pass)
3087 #ifdef REG_PARM_STACK_SPACE
3088 if (save_area)
3089 restore_fixed_argument_area (save_area, argblock,
3090 high_to_save, low_to_save);
3091 #endif
3093 /* If we saved any argument areas, restore them. */
3094 for (i = 0; i < num_actuals; i++)
3095 if (args[i].save_area)
3097 enum machine_mode save_mode = GET_MODE (args[i].save_area);
3098 rtx stack_area
3099 = gen_rtx_MEM (save_mode,
3100 memory_address (save_mode,
3101 XEXP (args[i].stack_slot, 0)));
3103 if (save_mode != BLKmode)
3104 emit_move_insn (stack_area, args[i].save_area);
3105 else
3106 emit_block_move (stack_area, args[i].save_area,
3107 GEN_INT (args[i].locate.size.constant),
3108 BLOCK_OP_CALL_PARM);
3111 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
3112 stack_usage_map = initial_stack_usage_map;
3115 /* If this was alloca, record the new stack level for nonlocal gotos.
3116 Check for the handler slots since we might not have a save area
3117 for non-local gotos. */
3119 if ((flags & ECF_MAY_BE_ALLOCA) && cfun->nonlocal_goto_save_area != 0)
3120 update_nonlocal_goto_save_area ();
3122 /* Free up storage we no longer need. */
3123 for (i = 0; i < num_actuals; ++i)
3124 if (args[i].aligned_regs)
3125 free (args[i].aligned_regs);
3127 insns = get_insns ();
3128 end_sequence ();
3130 if (pass == 0)
3132 tail_call_insns = insns;
3134 /* Restore the pending stack adjustment now that we have
3135 finished generating the sibling call sequence. */
3137 pending_stack_adjust = save_pending_stack_adjust;
3138 stack_pointer_delta = save_stack_pointer_delta;
3140 /* Prepare arg structure for next iteration. */
3141 for (i = 0; i < num_actuals; i++)
3143 args[i].value = 0;
3144 args[i].aligned_regs = 0;
3145 args[i].stack = 0;
3148 sbitmap_free (stored_args_map);
3150 else
3152 normal_call_insns = insns;
3154 /* Verify that we've deallocated all the stack we used. */
3155 gcc_assert ((flags & ECF_NORETURN)
3156 || (old_stack_allocated
3157 == stack_pointer_delta - pending_stack_adjust));
3160 /* If something prevents making this a sibling call,
3161 zero out the sequence. */
3162 if (sibcall_failure)
3163 tail_call_insns = NULL_RTX;
3164 else
3165 break;
3168 /* If tail call production succeeded, we need to remove REG_EQUIV notes on
3169 the arguments too, as the argument area is now clobbered by the call. */
3170 if (tail_call_insns)
3172 emit_insn (tail_call_insns);
3173 crtl->tail_call_emit = true;
3175 else
3176 emit_insn (normal_call_insns);
3178 currently_expanding_call--;
3180 if (stack_usage_map_buf)
3181 free (stack_usage_map_buf);
3183 return target;
3186 /* A sibling call sequence invalidates any REG_EQUIV notes made for
3187 this function's incoming arguments.
3189 At the start of RTL generation we know the only REG_EQUIV notes
3190 in the rtl chain are those for incoming arguments, so we can look
3191 for REG_EQUIV notes between the start of the function and the
3192 NOTE_INSN_FUNCTION_BEG.
3194 This is (slight) overkill. We could keep track of the highest
3195 argument we clobber and be more selective in removing notes, but it
3196 does not seem to be worth the effort. */
3198 void
3199 fixup_tail_calls (void)
3201 rtx insn;
3203 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
3205 rtx note;
3207 /* There are never REG_EQUIV notes for the incoming arguments
3208 after the NOTE_INSN_FUNCTION_BEG note, so stop if we see it. */
3209 if (NOTE_P (insn)
3210 && NOTE_KIND (insn) == NOTE_INSN_FUNCTION_BEG)
3211 break;
3213 note = find_reg_note (insn, REG_EQUIV, 0);
3214 if (note)
3215 remove_note (insn, note);
3216 note = find_reg_note (insn, REG_EQUIV, 0);
3217 gcc_assert (!note);
3221 /* Traverse a list of TYPES and expand all complex types into their
3222 components. */
3223 static tree
3224 split_complex_types (tree types)
3226 tree p;
3228 /* Before allocating memory, check for the common case of no complex types. */
3229 for (p = types; p; p = TREE_CHAIN (p))
3231 tree type = TREE_VALUE (p);
3232 if (TREE_CODE (type) == COMPLEX_TYPE
3233 && targetm.calls.split_complex_arg (type))
3234 goto found;
3236 return types;
3238 found:
3239 types = copy_list (types);
3241 for (p = types; p; p = TREE_CHAIN (p))
3243 tree complex_type = TREE_VALUE (p);
3245 if (TREE_CODE (complex_type) == COMPLEX_TYPE
3246 && targetm.calls.split_complex_arg (complex_type))
3248 tree next, imag;
3250 /* Rewrite complex type with component type. */
3251 TREE_VALUE (p) = TREE_TYPE (complex_type);
3252 next = TREE_CHAIN (p);
3254 /* Add another component type for the imaginary part. */
3255 imag = build_tree_list (NULL_TREE, TREE_VALUE (p));
3256 TREE_CHAIN (p) = imag;
3257 TREE_CHAIN (imag) = next;
3259 /* Skip the newly created node. */
3260 p = TREE_CHAIN (p);
3264 return types;
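/* For illustration only (not from the original source): given the list
   (complex double, int) on a target whose split_complex_arg hook accepts
   complex double, the loop above rewrites it to (double, double, int):
   the complex node is narrowed to its component type and a second node
   for the imaginary part is spliced in right after it.  */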
3267 /* Output a library call to function FUN (a SYMBOL_REF rtx).
3268 The RETVAL parameter specifies whether the return value needs to be saved;
3269 the other parameters are documented in the emit_library_call function below. */
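/* For illustration only (not from the original source), a call to the
   emit_library_call wrapper that ends up here might look roughly like

       emit_library_call (memset_libfunc, LCT_NORMAL, VOIDmode, 3,
                          addr, Pmode,
                          const0_rtx, TYPE_MODE (integer_type_node),
                          size, TYPE_MODE (sizetype));

   where addr and size stand for previously computed rtx values: the
   SYMBOL_REF for the libcall, the libcall type, the return mode, the
   argument count, and then one (rtx value, machine mode) pair per
   argument, which is what the va_list P below walks.  */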
3271 static rtx
3272 emit_library_call_value_1 (int retval, rtx orgfun, rtx value,
3273 enum libcall_type fn_type,
3274 enum machine_mode outmode, int nargs, va_list p)
3276 /* Total size in bytes of all the stack-parms scanned so far. */
3277 struct args_size args_size;
3278 /* Size of arguments before any adjustments (such as rounding). */
3279 struct args_size original_args_size;
3280 int argnum;
3281 rtx fun;
3282 /* TODO: choose the correct decl type of orgfun. Sadly this information
3283 isn't present here, so we default to the native calling ABI here. */
3284 tree fndecl ATTRIBUTE_UNUSED = NULL_TREE; /* library calls default to the host calling ABI? */
3285 int inc;
3286 int count;
3287 rtx argblock = 0;
3288 CUMULATIVE_ARGS args_so_far;
3289 struct arg
3290 {
3291 rtx value;
3292 enum machine_mode mode;
3293 rtx reg;
3294 int partial;
3295 struct locate_and_pad_arg_data locate;
3296 rtx save_area;
3297 };
3298 struct arg *argvec;
3299 int old_inhibit_defer_pop = inhibit_defer_pop;
3300 rtx call_fusage = 0;
3301 rtx mem_value = 0;
3302 rtx valreg;
3303 int pcc_struct_value = 0;
3304 int struct_value_size = 0;
3305 int flags;
3306 int reg_parm_stack_space = 0;
3307 int needed;
3308 rtx before_call;
3309 tree tfom; /* type_for_mode (outmode, 0) */
3311 #ifdef REG_PARM_STACK_SPACE
3312 /* Define the boundary of the register parm stack space that needs to be
3313 saved, if any. */
3314 int low_to_save, high_to_save;
3315 rtx save_area = 0; /* Place that it is saved. */
3316 #endif
3318 /* Record the initial stack usage state so it can be restored after the call. */
3319 int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
3320 char *initial_stack_usage_map = stack_usage_map;
3321 char *stack_usage_map_buf = NULL;
3323 rtx struct_value = targetm.calls.struct_value_rtx (0, 0);
3325 #ifdef REG_PARM_STACK_SPACE
3326 reg_parm_stack_space = REG_PARM_STACK_SPACE ((tree) 0);
3327 #endif
3329 /* By default, library functions cannot throw. */
3330 flags = ECF_NOTHROW;
3332 switch (fn_type)
3334 case LCT_NORMAL:
3335 break;
3336 case LCT_CONST:
3337 flags |= ECF_CONST;
3338 break;
3339 case LCT_PURE:
3340 flags |= ECF_PURE;
3341 break;
3342 case LCT_CONST_MAKE_BLOCK:
3343 flags |= ECF_CONST | ECF_LIBCALL_BLOCK;
3344 break;
3345 case LCT_PURE_MAKE_BLOCK:
3346 flags |= ECF_PURE | ECF_LIBCALL_BLOCK;
3347 break;
3348 case LCT_NORETURN:
3349 flags |= ECF_NORETURN;
3350 break;
3351 case LCT_THROW:
3352 flags = ECF_NORETURN;
3353 break;
3354 case LCT_RETURNS_TWICE:
3355 flags = ECF_RETURNS_TWICE;
3356 break;
3358 fun = orgfun;
3360 /* Ensure current function's preferred stack boundary is at least
3361 what we need. */
3362 if (crtl->preferred_stack_boundary < PREFERRED_STACK_BOUNDARY)
3363 crtl->preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
3365 /* If this kind of value comes back in memory,
3366 decide where in memory it should come back. */
3367 if (outmode != VOIDmode)
3369 tfom = lang_hooks.types.type_for_mode (outmode, 0);
3370 if (aggregate_value_p (tfom, 0))
3372 #ifdef PCC_STATIC_STRUCT_RETURN
3373 rtx pointer_reg
3374 = hard_function_value (build_pointer_type (tfom), 0, 0, 0);
3375 mem_value = gen_rtx_MEM (outmode, pointer_reg);
3376 pcc_struct_value = 1;
3377 if (value == 0)
3378 value = gen_reg_rtx (outmode);
3379 #else /* not PCC_STATIC_STRUCT_RETURN */
3380 struct_value_size = GET_MODE_SIZE (outmode);
3381 if (value != 0 && MEM_P (value))
3382 mem_value = value;
3383 else
3384 mem_value = assign_temp (tfom, 0, 1, 1);
3385 #endif
3386 /* This call returns a big structure. */
3387 flags &= ~(ECF_CONST | ECF_PURE | ECF_LOOPING_CONST_OR_PURE
3388 | ECF_LIBCALL_BLOCK);
3391 else
3392 tfom = void_type_node;
3394 /* ??? Unfinished: must pass the memory address as an argument. */
3396 /* Copy all the libcall-arguments out of the varargs data
3397 and into a vector ARGVEC.
3399 Compute how to pass each argument. We only support a very small subset
3400 of the full argument passing conventions to limit complexity here since
3401 library functions shouldn't have many args. */
3403 argvec = alloca ((nargs + 1) * sizeof (struct arg));
3404 memset (argvec, 0, (nargs + 1) * sizeof (struct arg));
3406 #ifdef INIT_CUMULATIVE_LIBCALL_ARGS
3407 INIT_CUMULATIVE_LIBCALL_ARGS (args_so_far, outmode, fun);
3408 #else
3409 INIT_CUMULATIVE_ARGS (args_so_far, NULL_TREE, fun, 0, nargs);
3410 #endif
3412 args_size.constant = 0;
3413 args_size.var = 0;
3415 count = 0;
3417 /* Now we are about to start emitting insns that can be deleted
3418 if a libcall is deleted. */
3419 if (flags & ECF_LIBCALL_BLOCK)
3420 start_sequence ();
3422 push_temp_slots ();
3424 /* If there's a structure value address to be passed,
3425 either pass it in the special place, or pass it as an extra argument. */
3426 if (mem_value && struct_value == 0 && ! pcc_struct_value)
3428 rtx addr = XEXP (mem_value, 0);
3430 nargs++;
3432 /* Make sure it is a reasonable operand for a move or push insn. */
3433 if (!REG_P (addr) && !MEM_P (addr)
3434 && ! (CONSTANT_P (addr) && LEGITIMATE_CONSTANT_P (addr)))
3435 addr = force_operand (addr, NULL_RTX);
3437 argvec[count].value = addr;
3438 argvec[count].mode = Pmode;
3439 argvec[count].partial = 0;
3441 argvec[count].reg = FUNCTION_ARG (args_so_far, Pmode, NULL_TREE, 1);
3442 gcc_assert (targetm.calls.arg_partial_bytes (&args_so_far, Pmode,
3443 NULL_TREE, 1) == 0);
3445 locate_and_pad_parm (Pmode, NULL_TREE,
3446 #ifdef STACK_PARMS_IN_REG_PARM_AREA
3447 1,
3448 #else
3449 argvec[count].reg != 0,
3450 #endif
3451 0, NULL_TREE, &args_size, &argvec[count].locate);
3453 if (argvec[count].reg == 0 || argvec[count].partial != 0
3454 || reg_parm_stack_space > 0)
3455 args_size.constant += argvec[count].locate.size.constant;
3457 FUNCTION_ARG_ADVANCE (args_so_far, Pmode, (tree) 0, 1);
3459 count++;
3462 for (; count < nargs; count++)
3464 rtx val = va_arg (p, rtx);
3465 enum machine_mode mode = va_arg (p, enum machine_mode);
3467 /* We cannot convert the arg value to the mode the library wants here;
3468 must do it earlier where we know the signedness of the arg. */
3469 gcc_assert (mode != BLKmode
3470 && (GET_MODE (val) == mode || GET_MODE (val) == VOIDmode));
3472 /* Make sure it is a reasonable operand for a move or push insn. */
3473 if (!REG_P (val) && !MEM_P (val)
3474 && ! (CONSTANT_P (val) && LEGITIMATE_CONSTANT_P (val)))
3475 val = force_operand (val, NULL_RTX);
3477 if (pass_by_reference (&args_so_far, mode, NULL_TREE, 1))
3479 rtx slot;
3480 int must_copy
3481 = !reference_callee_copied (&args_so_far, mode, NULL_TREE, 1);
3483 /* loop.c won't look at CALL_INSN_FUNCTION_USAGE of const/pure
3484 functions, so we have to pretend this isn't such a function. */
3485 if (flags & ECF_LIBCALL_BLOCK)
3487 rtx insns = get_insns ();
3488 end_sequence ();
3489 emit_insn (insns);
3492 /* If this was a CONST function, it is now PURE since it now
3493 reads memory. */
3494 if (flags & ECF_CONST)
3496 flags &= ~ECF_CONST;
3497 flags |= ECF_PURE;
3500 if (MEM_P (val) && !must_copy)
3501 slot = val;
3502 else
3504 slot = assign_temp (lang_hooks.types.type_for_mode (mode, 0),
3505 0, 1, 1);
3506 emit_move_insn (slot, val);
3509 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
3510 gen_rtx_USE (VOIDmode, slot),
3511 call_fusage);
3512 if (must_copy)
3513 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
3514 gen_rtx_CLOBBER (VOIDmode,
3515 slot),
3516 call_fusage);
3518 mode = Pmode;
3519 val = force_operand (XEXP (slot, 0), NULL_RTX);
3522 argvec[count].value = val;
3523 argvec[count].mode = mode;
3525 argvec[count].reg = FUNCTION_ARG (args_so_far, mode, NULL_TREE, 1);
3527 argvec[count].partial
3528 = targetm.calls.arg_partial_bytes (&args_so_far, mode, NULL_TREE, 1);
3530 locate_and_pad_parm (mode, NULL_TREE,
3531 #ifdef STACK_PARMS_IN_REG_PARM_AREA
3532 1,
3533 #else
3534 argvec[count].reg != 0,
3535 #endif
3536 argvec[count].partial,
3537 NULL_TREE, &args_size, &argvec[count].locate);
3539 gcc_assert (!argvec[count].locate.size.var);
3541 if (argvec[count].reg == 0 || argvec[count].partial != 0
3542 || reg_parm_stack_space > 0)
3543 args_size.constant += argvec[count].locate.size.constant;
3545 FUNCTION_ARG_ADVANCE (args_so_far, mode, (tree) 0, 1);
3548 /* If this machine requires an external definition for library
3549 functions, write one out. */
3550 assemble_external_libcall (fun);
3552 original_args_size = args_size;
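/* Round up so that stack_pointer_delta plus the rounded size is a
   multiple of STACK_BYTES.  For example, with STACK_BYTES == 16,
   stack_pointer_delta == 4 and 20 bytes of arguments, this yields
   28, making delta plus size a full 32 bytes.  */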
3553 args_size.constant = (((args_size.constant
3554 + stack_pointer_delta
3555 + STACK_BYTES - 1)
3556 / STACK_BYTES
3557 * STACK_BYTES)
3558 - stack_pointer_delta);
3560 args_size.constant = MAX (args_size.constant,
3561 reg_parm_stack_space);
3563 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE : TREE_TYPE (fndecl))))
3564 args_size.constant -= reg_parm_stack_space;
3566 if (args_size.constant > crtl->outgoing_args_size)
3567 crtl->outgoing_args_size = args_size.constant;
3569 if (ACCUMULATE_OUTGOING_ARGS)
3571 /* Since the stack pointer will never be pushed, it is possible for
3572 the evaluation of a parm to clobber something we have already
3573 written to the stack. Since most function calls on RISC machines
3574 do not use the stack, this is uncommon, but must work correctly.
3576 Therefore, we save any area of the stack that was already written
3577 and that we are using. Here we set up to do this by making a new
3578 stack usage map from the old one.
3580 Another approach might be to try to reorder the argument
3581 evaluations to avoid this conflicting stack usage. */
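/* Each element of stack_usage_map covers one byte of the outgoing
   argument area; a nonzero entry means that byte has already been
   stored into and may need to be saved before being overwritten.  */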
3583 needed = args_size.constant;
3585 /* Since we will be writing into the entire argument area, the
3586 map must be allocated for its entire size, not just the part that
3587 is the responsibility of the caller. */
3588 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? NULL_TREE : TREE_TYPE (fndecl))))
3589 needed += reg_parm_stack_space;
3591 #ifdef ARGS_GROW_DOWNWARD
3592 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
3593 needed + 1);
3594 #else
3595 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
3596 needed);
3597 #endif
3598 stack_usage_map_buf = XNEWVEC (char, highest_outgoing_arg_in_use);
3599 stack_usage_map = stack_usage_map_buf;
3601 if (initial_highest_arg_in_use)
3602 memcpy (stack_usage_map, initial_stack_usage_map,
3603 initial_highest_arg_in_use);
3605 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
3606 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
3607 highest_outgoing_arg_in_use - initial_highest_arg_in_use);
3608 needed = 0;
3610 /* We must be careful to use virtual regs before they're instantiated,
3611 and real regs afterwards. Loop optimization, for example, can create
3612 new libcalls after we've instantiated the virtual regs, and if we
3613 use virtuals anyway, they won't match the rtl patterns. */
3615 if (virtuals_instantiated)
3616 argblock = plus_constant (stack_pointer_rtx, STACK_POINTER_OFFSET);
3617 else
3618 argblock = virtual_outgoing_args_rtx;
3620 else
3622 if (!PUSH_ARGS)
3623 argblock = push_block (GEN_INT (args_size.constant), 0, 0);
3626 /* If we push args individually in reverse order, perform stack alignment
3627 before the first push (the last arg). */
3628 if (argblock == 0 && PUSH_ARGS_REVERSED)
3629 anti_adjust_stack (GEN_INT (args_size.constant
3630 - original_args_size.constant));
3632 if (PUSH_ARGS_REVERSED)
3634 inc = -1;
3635 argnum = nargs - 1;
3637 else
3639 inc = 1;
3640 argnum = 0;
3643 #ifdef REG_PARM_STACK_SPACE
3644 if (ACCUMULATE_OUTGOING_ARGS)
3646 /* The argument list is the property of the called routine and it
3647 may clobber it. If the fixed area has been used for previous
3648 parameters, we must save and restore it. */
3649 save_area = save_fixed_argument_area (reg_parm_stack_space, argblock,
3650 &low_to_save, &high_to_save);
3652 #endif
3654 /* Push the args that need to be pushed. */
3656 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
3657 are to be pushed. */
3658 for (count = 0; count < nargs; count++, argnum += inc)
3660 enum machine_mode mode = argvec[argnum].mode;
3661 rtx val = argvec[argnum].value;
3662 rtx reg = argvec[argnum].reg;
3663 int partial = argvec[argnum].partial;
3664 int lower_bound = 0, upper_bound = 0, i;
3666 if (! (reg != 0 && partial == 0))
3668 if (ACCUMULATE_OUTGOING_ARGS)
3670 /* If this is being stored into a pre-allocated, fixed-size,
3671 stack area, save any previous data at that location. */
3673 #ifdef ARGS_GROW_DOWNWARD
3674 /* stack_slot is negative, but we want to index stack_usage_map
3675 with positive values. */
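/* For example, an argument at offset -8 with size 8 yields
   upper_bound == 9 and lower_bound == 1, so map entries 1 through 8
   are checked below.  */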
3676 upper_bound = -argvec[argnum].locate.offset.constant + 1;
3677 lower_bound = upper_bound - argvec[argnum].locate.size.constant;
3678 #else
3679 lower_bound = argvec[argnum].locate.offset.constant;
3680 upper_bound = lower_bound + argvec[argnum].locate.size.constant;
3681 #endif
3683 i = lower_bound;
3684 /* Don't worry about things in the fixed argument area;
3685 it has already been saved. */
3686 if (i < reg_parm_stack_space)
3687 i = reg_parm_stack_space;
3688 while (i < upper_bound && stack_usage_map[i] == 0)
3689 i++;
3691 if (i < upper_bound)
3693 /* We need to make a save area. */
3694 unsigned int size
3695 = argvec[argnum].locate.size.constant * BITS_PER_UNIT;
3696 enum machine_mode save_mode
3697 = mode_for_size (size, MODE_INT, 1);
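/* mode_for_size returns BLKmode when no integer mode of exactly this
   size is available (the nonzero LIMIT argument also rules out modes
   wider than MAX_FIXED_MODE_SIZE); the save is then done with a
   block move below.  */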
3698 rtx adr
3699 = plus_constant (argblock,
3700 argvec[argnum].locate.offset.constant);
3701 rtx stack_area
3702 = gen_rtx_MEM (save_mode, memory_address (save_mode, adr));
3704 if (save_mode == BLKmode)
3706 argvec[argnum].save_area
3707 = assign_stack_temp (BLKmode,
3708 argvec[argnum].locate.size.constant,
3709 0);
3711 emit_block_move (validize_mem (argvec[argnum].save_area),
3712 stack_area,
3713 GEN_INT (argvec[argnum].locate.size.constant),
3714 BLOCK_OP_CALL_PARM);
3716 else
3718 argvec[argnum].save_area = gen_reg_rtx (save_mode);
3720 emit_move_insn (argvec[argnum].save_area, stack_area);
3725 emit_push_insn (val, mode, NULL_TREE, NULL_RTX, PARM_BOUNDARY,
3726 partial, reg, 0, argblock,
3727 GEN_INT (argvec[argnum].locate.offset.constant),
3728 reg_parm_stack_space,
3729 ARGS_SIZE_RTX (argvec[argnum].locate.alignment_pad));
3731 /* Now mark the segment we just used. */
3732 if (ACCUMULATE_OUTGOING_ARGS)
3733 for (i = lower_bound; i < upper_bound; i++)
3734 stack_usage_map[i] = 1;
3736 NO_DEFER_POP;
3738 if (flags & ECF_CONST)
3740 rtx use;
3742 /* Indicate argument access so that alias.c knows that these
3743 values are live. */
3744 if (argblock)
3745 use = plus_constant (argblock,
3746 argvec[argnum].locate.offset.constant);
3747 else
3748 /* When arguments are pushed, trying to tell alias.c where
3749 exactly this argument is won't work, because the
3750 auto-increment causes confusion. So we merely indicate
3751 that we access something with a known mode somewhere on
3752 the stack. */
3753 use = gen_rtx_PLUS (Pmode, virtual_outgoing_args_rtx,
3754 gen_rtx_SCRATCH (Pmode));
3755 use = gen_rtx_MEM (argvec[argnum].mode, use);
3756 use = gen_rtx_USE (VOIDmode, use);
3757 call_fusage = gen_rtx_EXPR_LIST (VOIDmode, use, call_fusage);
3762 /* If we pushed args in forward order, perform stack alignment
3763 after pushing the last arg. */
3764 if (argblock == 0 && !PUSH_ARGS_REVERSED)
3765 anti_adjust_stack (GEN_INT (args_size.constant
3766 - original_args_size.constant));
3768 if (PUSH_ARGS_REVERSED)
3769 argnum = nargs - 1;
3770 else
3771 argnum = 0;
3773 fun = prepare_call_address (fun, NULL, &call_fusage, 0, 0);
3775 /* Now load any reg parms into their regs. */
3777 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
3778 are to be pushed. */
3779 for (count = 0; count < nargs; count++, argnum += inc)
3781 enum machine_mode mode = argvec[argnum].mode;
3782 rtx val = argvec[argnum].value;
3783 rtx reg = argvec[argnum].reg;
3784 int partial = argvec[argnum].partial;
3786 /* Handle calls that pass values in multiple non-contiguous
3787 locations. The PA64 has examples of this for library calls. */
3788 if (reg != 0 && GET_CODE (reg) == PARALLEL)
3789 emit_group_load (reg, val, NULL_TREE, GET_MODE_SIZE (mode));
3790 else if (reg != 0 && partial == 0)
3791 emit_move_insn (reg, val);
3793 NO_DEFER_POP;
3796 /* Any regs containing parms remain in use through the call. */
3797 for (count = 0; count < nargs; count++)
3799 rtx reg = argvec[count].reg;
3800 if (reg != 0 && GET_CODE (reg) == PARALLEL)
3801 use_group_regs (&call_fusage, reg);
3802 else if (reg != 0)
3804 int partial = argvec[count].partial;
3805 if (partial)
3807 int nregs;
3808 gcc_assert (partial % UNITS_PER_WORD == 0);
3809 nregs = partial / UNITS_PER_WORD;
3810 use_regs (&call_fusage, REGNO (reg), nregs);
3812 else
3813 use_reg (&call_fusage, reg);
3817 /* Pass the function the address in which to return a structure value. */
3818 if (mem_value != 0 && struct_value != 0 && ! pcc_struct_value)
3820 emit_move_insn (struct_value,
3821 force_reg (Pmode,
3822 force_operand (XEXP (mem_value, 0),
3823 NULL_RTX)));
3824 if (REG_P (struct_value))
3825 use_reg (&call_fusage, struct_value);
3828 /* Don't allow popping to be deferred, since then
3829 cse'ing of library calls could delete a call and leave the pop. */
3830 NO_DEFER_POP;
3831 valreg = (mem_value == 0 && outmode != VOIDmode
3832 ? hard_libcall_value (outmode) : NULL_RTX);
3834 /* Stack must be properly aligned now. */
3835 gcc_assert (!(stack_pointer_delta
3836 & (PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT - 1)));
3838 before_call = get_last_insn ();
3840 /* We pass the old value of inhibit_defer_pop + 1 to emit_call_1, which
3841 will set inhibit_defer_pop to that value. */
3842 /* The return type is needed to decide how many bytes the function pops.
3843 Signedness plays no role in that, so for simplicity, we pretend it's
3844 always signed. We also assume that the list of arguments passed has
3845 no impact, so we pretend it is unknown. */
3847 emit_call_1 (fun, NULL,
3848 get_identifier (XSTR (orgfun, 0)),
3849 build_function_type (tfom, NULL_TREE),
3850 original_args_size.constant, args_size.constant,
3851 struct_value_size,
3852 FUNCTION_ARG (args_so_far, VOIDmode, void_type_node, 1),
3853 valreg,
3854 old_inhibit_defer_pop + 1, call_fusage, flags, & args_so_far);
3856 /* For calls to `setjmp', etc., inform function.c:setjmp_warnings
3857 that it should complain if nonvolatile values are live. For
3858 functions that cannot return, inform flow that control does not
3859 fall through. */
3861 if (flags & ECF_NORETURN)
3863 /* The barrier must be emitted
3864 immediately after the CALL_INSN. Some ports emit more than
3865 just a CALL_INSN above, so we must search for it here. */
3867 rtx last = get_last_insn ();
3868 while (!CALL_P (last))
3870 last = PREV_INSN (last);
3871 /* There was no CALL_INSN? */
3872 gcc_assert (last != before_call);
3875 emit_barrier_after (last);
3878 /* Now restore inhibit_defer_pop to its actual original value. */
3879 OK_DEFER_POP;
3881 /* If call is cse'able, make appropriate pair of reg-notes around it.
3882 Test valreg so we don't crash; may safely ignore `const'
3883 if return type is void. Disable for PARALLEL return values, because
3884 we have no way to move such values into a pseudo register. */
3885 if (flags & ECF_LIBCALL_BLOCK)
3887 rtx insns;
3889 if (valreg == 0)
3891 insns = get_insns ();
3892 end_sequence ();
3893 emit_insn (insns);
3895 else
3897 rtx note = 0;
3898 rtx temp;
3899 int i;
3901 if (GET_CODE (valreg) == PARALLEL)
3903 temp = gen_reg_rtx (outmode);
3904 emit_group_store (temp, valreg, NULL_TREE,
3905 GET_MODE_SIZE (outmode));
3906 valreg = temp;
3909 temp = gen_reg_rtx (GET_MODE (valreg));
3911 /* Construct an "equal form" for the value which mentions all the
3912 arguments in order as well as the function name. */
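/* The resulting EXPR_LIST has the function at its head, followed by
   the argument values; emit_libcall_block attaches it as the
   REG_EQUAL note that lets later passes recognize equivalent
   libcalls.  */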
3913 for (i = 0; i < nargs; i++)
3914 note = gen_rtx_EXPR_LIST (VOIDmode, argvec[i].value, note);
3915 note = gen_rtx_EXPR_LIST (VOIDmode, fun, note);
3917 insns = get_insns ();
3918 end_sequence ();
3919 emit_libcall_block (insns, temp, valreg, note);
3921 valreg = temp;
3924 pop_temp_slots ();
3926 /* Copy the value to the right place. */
3927 if (outmode != VOIDmode && retval)
3929 if (mem_value)
3931 if (value == 0)
3932 value = mem_value;
3933 if (value != mem_value)
3934 emit_move_insn (value, mem_value);
3936 else if (GET_CODE (valreg) == PARALLEL)
3938 if (value == 0)
3939 value = gen_reg_rtx (outmode);
3940 emit_group_store (value, valreg, NULL_TREE, GET_MODE_SIZE (outmode));
3942 else
3944 /* Convert to the proper mode if PROMOTE_MODE has been active. */
3945 if (GET_MODE (valreg) != outmode)
3947 int unsignedp = TYPE_UNSIGNED (tfom);
3949 gcc_assert (targetm.calls.promote_function_return (tfom));
3950 gcc_assert (promote_mode (tfom, outmode, &unsignedp, 0)
3951 == GET_MODE (valreg));
3953 valreg = convert_modes (outmode, GET_MODE (valreg), valreg, 0);
3956 if (value != 0)
3957 emit_move_insn (value, valreg);
3958 else
3959 value = valreg;
3963 if (ACCUMULATE_OUTGOING_ARGS)
3965 #ifdef REG_PARM_STACK_SPACE
3966 if (save_area)
3967 restore_fixed_argument_area (save_area, argblock,
3968 high_to_save, low_to_save);
3969 #endif
3971 /* If we saved any argument areas, restore them. */
3972 for (count = 0; count < nargs; count++)
3973 if (argvec[count].save_area)
3975 enum machine_mode save_mode = GET_MODE (argvec[count].save_area);
3976 rtx adr = plus_constant (argblock,
3977 argvec[count].locate.offset.constant);
3978 rtx stack_area = gen_rtx_MEM (save_mode,
3979 memory_address (save_mode, adr));
3981 if (save_mode == BLKmode)
3982 emit_block_move (stack_area,
3983 validize_mem (argvec[count].save_area),
3984 GEN_INT (argvec[count].locate.size.constant),
3985 BLOCK_OP_CALL_PARM);
3986 else
3987 emit_move_insn (stack_area, argvec[count].save_area);
3990 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
3991 stack_usage_map = initial_stack_usage_map;
3994 if (stack_usage_map_buf)
3995 free (stack_usage_map_buf);
3997 return value;
4001 /* Output a library call to function FUN (a SYMBOL_REF rtx)
4002 for a value of mode OUTMODE,
4003 with NARGS different arguments, passed as alternating rtx values
4004 and the machine_modes those values already have (no conversion
4005 is done here; callers must promote arguments beforehand).
4007 FN_TYPE should be LCT_NORMAL for `normal' calls, LCT_CONST for `const'
4008 calls, LCT_PURE for `pure' calls, LCT_CONST_MAKE_BLOCK for `const' calls
4009 which should be enclosed in REG_LIBCALL/REG_RETVAL notes,
4010 LCT_PURE_MAKE_BLOCK for `pure' calls which should be enclosed in
4011 REG_LIBCALL/REG_RETVAL notes with an extra (use (memory (scratch))),
4012 or other LCT_ value for other types of library calls. */
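/* A minimal illustrative sketch (LIBFUNC, OP0 and OP1 are
   hypothetical names, not taken from a real caller): a two-argument
   SImode libcall with no return value would be emitted as

       emit_library_call (libfunc, LCT_NORMAL, VOIDmode, 2,
                          op0, SImode,
                          op1, SImode);

   where op0 and op1 must already have the mode (and signedness) the
   library expects, since no promotion is performed here.  */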
4014 void
4015 emit_library_call (rtx orgfun, enum libcall_type fn_type,
4016 enum machine_mode outmode, int nargs, ...)
4018 va_list p;
4020 va_start (p, nargs);
4021 emit_library_call_value_1 (0, orgfun, NULL_RTX, fn_type, outmode, nargs, p);
4022 va_end (p);
4025 /* Like emit_library_call except that an extra argument, VALUE,
4026 comes second and says where to store the result.
4027 (If VALUE is zero, this function chooses a convenient way
4028 to return the value.)
4030 This function returns an rtx for where the value is to be found.
4031 If VALUE is nonzero, VALUE is returned. */
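/* Illustrative sketch under the same hypothetical names as above:

       result = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
                                         SImode, 2,
                                         op0, SImode,
                                         op1, SImode);

   Since VALUE is zero here, the function picks a location for the
   SImode result and returns it.  */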
4033 rtx
4034 emit_library_call_value (rtx orgfun, rtx value,
4035 enum libcall_type fn_type,
4036 enum machine_mode outmode, int nargs, ...)
4038 rtx result;
4039 va_list p;
4041 va_start (p, nargs);
4042 result = emit_library_call_value_1 (1, orgfun, value, fn_type, outmode,
4043 nargs, p);
4044 va_end (p);
4046 return result;
4049 /* Store a single argument for a function call
4050 into the register or memory area where it must be passed.
4051 *ARG describes the argument value and where to pass it.
4053 ARGBLOCK is the address of the stack-block for all the arguments,
4054 or 0 on a machine where arguments are pushed individually.
4056 FLAGS contains ECF_MAY_BE_ALLOCA if this could be a call to `alloca',
4057 in which case we must be careful about how the stack is used.
4059 VARIABLE_SIZE nonzero says that this was a variable-sized outgoing
4060 argument stack. This is used with ACCUMULATE_OUTGOING_ARGS to indicate
4061 that we need not worry about saving and restoring the stack.
4063 REG_PARM_STACK_SPACE is the number of bytes of stack reserved for
arguments that are also passed in registers.
4065 Return nonzero if this arg should cause sibcall failure,
4066 zero otherwise. */
4068 static int
4069 store_one_arg (struct arg_data *arg, rtx argblock, int flags,
4070 int variable_size ATTRIBUTE_UNUSED, int reg_parm_stack_space)
4072 tree pval = arg->tree_value;
4073 rtx reg = 0;
4074 int partial = 0;
4075 int used = 0;
4076 int i, lower_bound = 0, upper_bound = 0;
4077 int sibcall_failure = 0;
4079 if (TREE_CODE (pval) == ERROR_MARK)
4080 return 1;
4082 /* Push a new temporary level for any temporaries we make for
4083 this argument. */
4084 push_temp_slots ();
4086 if (ACCUMULATE_OUTGOING_ARGS && !(flags & ECF_SIBCALL))
4088 /* If this is being stored into a pre-allocated, fixed-size, stack area,
4089 save any previous data at that location. */
4090 if (argblock && ! variable_size && arg->stack)
4092 #ifdef ARGS_GROW_DOWNWARD
4093 /* stack_slot is negative, but we want to index stack_usage_map
4094 with positive values. */
4095 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
4096 upper_bound = -INTVAL (XEXP (XEXP (arg->stack_slot, 0), 1)) + 1;
4097 else
4098 upper_bound = 0;
4100 lower_bound = upper_bound - arg->locate.size.constant;
4101 #else
4102 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
4103 lower_bound = INTVAL (XEXP (XEXP (arg->stack_slot, 0), 1));
4104 else
4105 lower_bound = 0;
4107 upper_bound = lower_bound + arg->locate.size.constant;
4108 #endif
4110 i = lower_bound;
4111 /* Don't worry about things in the fixed argument area;
4112 it has already been saved. */
4113 if (i < reg_parm_stack_space)
4114 i = reg_parm_stack_space;
4115 while (i < upper_bound && stack_usage_map[i] == 0)
4116 i++;
4118 if (i < upper_bound)
4120 /* We need to make a save area. */
4121 unsigned int size = arg->locate.size.constant * BITS_PER_UNIT;
4122 enum machine_mode save_mode = mode_for_size (size, MODE_INT, 1);
4123 rtx adr = memory_address (save_mode, XEXP (arg->stack_slot, 0));
4124 rtx stack_area = gen_rtx_MEM (save_mode, adr);
4126 if (save_mode == BLKmode)
4128 tree ot = TREE_TYPE (arg->tree_value);
4129 tree nt = build_qualified_type (ot, (TYPE_QUALS (ot)
4130 | TYPE_QUAL_CONST));
4132 arg->save_area = assign_temp (nt, 0, 1, 1);
4133 preserve_temp_slots (arg->save_area);
4134 emit_block_move (validize_mem (arg->save_area), stack_area,
4135 GEN_INT (arg->locate.size.constant),
4136 BLOCK_OP_CALL_PARM);
4138 else
4140 arg->save_area = gen_reg_rtx (save_mode);
4141 emit_move_insn (arg->save_area, stack_area);
4147 /* If this isn't going to be placed on both the stack and in registers,
4148 set up the register and number of words. */
4149 if (! arg->pass_on_stack)
4151 if (flags & ECF_SIBCALL)
4152 reg = arg->tail_call_reg;
4153 else
4154 reg = arg->reg;
4155 partial = arg->partial;
4158 /* Being passed entirely in a register. We shouldn't be called in
4159 this case. */
4160 gcc_assert (reg == 0 || partial != 0);
4162 /* If this arg needs special alignment, don't load the registers
4163 here. */
4164 if (arg->n_aligned_regs != 0)
4165 reg = 0;
4167 /* If this is being passed partially in a register, we can't evaluate
4168 it directly into its stack slot. Otherwise, we can. */
4169 if (arg->value == 0)
4171 /* stack_arg_under_construction is nonzero if a function argument is
4172 being evaluated directly into the outgoing argument list and
4173 expand_call must take special action to preserve the argument list
4174 if it is called recursively.
4176 For scalar function arguments stack_usage_map is sufficient to
4177 determine which stack slots must be saved and restored. Scalar
4178 arguments in general have pass_on_stack == 0.
4180 If this argument is initialized by a function which takes the
4181 address of the argument (a C++ constructor or a C function
4182 returning a BLKmode structure), then stack_usage_map is
4183 insufficient and expand_call must push the stack around the
4184 function call. Such arguments have pass_on_stack == 1.
4186 Note that it is always safe to set stack_arg_under_construction,
4187 but this generates suboptimal code if set when not needed. */
4189 if (arg->pass_on_stack)
4190 stack_arg_under_construction++;
4192 arg->value = expand_expr (pval,
4193 (partial
4194 || TYPE_MODE (TREE_TYPE (pval)) != arg->mode)
4195 ? NULL_RTX : arg->stack,
4196 VOIDmode, EXPAND_STACK_PARM);
4198 /* If we are promoting the object, or if for any other reason the mode
4199 doesn't agree, convert it now. */
4201 if (arg->mode != TYPE_MODE (TREE_TYPE (pval)))
4202 arg->value = convert_modes (arg->mode, TYPE_MODE (TREE_TYPE (pval)),
4203 arg->value, arg->unsignedp);
4205 if (arg->pass_on_stack)
4206 stack_arg_under_construction--;
4209 /* Check for overlap with already clobbered argument area. */
4210 if ((flags & ECF_SIBCALL)
4211 && MEM_P (arg->value)
4212 && mem_overlaps_already_clobbered_arg_p (XEXP (arg->value, 0),
4213 arg->locate.size.constant))
4214 sibcall_failure = 1;
4216 /* Don't allow anything left on stack from computation
4217 of argument to alloca. */
4218 if (flags & ECF_MAY_BE_ALLOCA)
4219 do_pending_stack_adjust ();
4221 if (arg->value == arg->stack)
4222 /* If the value is already in the stack slot, we are done. */
4224 else if (arg->mode != BLKmode)
4226 int size;
4227 unsigned int parm_align;
4229 /* Argument is a scalar, not entirely passed in registers.
4230 (If part is passed in registers, arg->partial says how much
4231 and emit_push_insn will take care of putting it there.)
4233 Push it, and if its size is less than the
4234 amount of space allocated to it,
4235 also bump stack pointer by the additional space.
4236 Note that in C the default argument promotions
4237 will prevent such mismatches. */
4239 size = GET_MODE_SIZE (arg->mode);
4240 /* Compute how much space the push instruction will push.
4241 On many machines, pushing a byte will advance the stack
4242 pointer by a halfword. */
4243 #ifdef PUSH_ROUNDING
4244 size = PUSH_ROUNDING (size);
4245 #endif
4246 used = size;
4248 /* Compute how much space the argument should get:
4249 round up to a multiple of the alignment for arguments. */
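/* For example, a 1-byte argument with a 32-bit PARM_BOUNDARY is
   given 4 bytes of argument space.  */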
4250 if (none != FUNCTION_ARG_PADDING (arg->mode, TREE_TYPE (pval)))
4251 used = (((size + PARM_BOUNDARY / BITS_PER_UNIT - 1)
4252 / (PARM_BOUNDARY / BITS_PER_UNIT))
4253 * (PARM_BOUNDARY / BITS_PER_UNIT));
4255 /* Compute the alignment of the pushed argument. */
4256 parm_align = arg->locate.boundary;
4257 if (FUNCTION_ARG_PADDING (arg->mode, TREE_TYPE (pval)) == downward)
4259 int pad = used - size;
4260 if (pad)
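/* PAD & -PAD isolates the least significant set bit of PAD, i.e.
   the largest power of two that divides it; that is all the
   alignment the padding can guarantee.  */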
4262 unsigned int pad_align = (pad & -pad) * BITS_PER_UNIT;
4263 parm_align = MIN (parm_align, pad_align);
4267 /* This isn't already where we want it on the stack, so put it there.
4268 This can either be done with push or copy insns. */
4269 emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval), NULL_RTX,
4270 parm_align, partial, reg, used - size, argblock,
4271 ARGS_SIZE_RTX (arg->locate.offset), reg_parm_stack_space,
4272 ARGS_SIZE_RTX (arg->locate.alignment_pad));
4274 /* Unless this is a partially-in-register argument, the argument is now
4275 in the stack. */
4276 if (partial == 0)
4277 arg->value = arg->stack;
4279 else
4281 /* BLKmode, at least partly to be pushed. */
4283 unsigned int parm_align;
4284 int excess;
4285 rtx size_rtx;
4287 /* Pushing a nonscalar.
4288 If part is passed in registers, PARTIAL says how much
4289 and emit_push_insn will take care of putting it there. */
4291 /* Round its size up to a multiple
4292 of the allocation unit for arguments. */
4294 if (arg->locate.size.var != 0)
4296 excess = 0;
4297 size_rtx = ARGS_SIZE_RTX (arg->locate.size);
4299 else
4301 /* PUSH_ROUNDING has no effect on us, because emit_push_insn
4302 for BLKmode is careful to avoid it. */
4303 excess = (arg->locate.size.constant
4304 - int_size_in_bytes (TREE_TYPE (pval))
4305 + partial);
4306 size_rtx = expand_expr (size_in_bytes (TREE_TYPE (pval)),
4307 NULL_RTX, TYPE_MODE (sizetype), 0);
4310 parm_align = arg->locate.boundary;
4312 /* When an argument is padded down, the block is aligned to
4313 PARM_BOUNDARY, but the actual argument isn't. */
4314 if (FUNCTION_ARG_PADDING (arg->mode, TREE_TYPE (pval)) == downward)
4316 if (arg->locate.size.var)
4317 parm_align = BITS_PER_UNIT;
4318 else if (excess)
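/* As with the padding case earlier, EXCESS & -EXCESS is the largest
   power of two dividing EXCESS.  */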
4320 unsigned int excess_align = (excess & -excess) * BITS_PER_UNIT;
4321 parm_align = MIN (parm_align, excess_align);
4325 if ((flags & ECF_SIBCALL) && MEM_P (arg->value))
4327 /* emit_push_insn might not work properly if arg->value and
4328 argblock + arg->locate.offset areas overlap. */
4329 rtx x = arg->value;
4330 int i = 0;
4332 if (XEXP (x, 0) == crtl->args.internal_arg_pointer
4333 || (GET_CODE (XEXP (x, 0)) == PLUS
4334 && XEXP (XEXP (x, 0), 0) ==
4335 crtl->args.internal_arg_pointer
4336 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT))
4338 if (XEXP (x, 0) != crtl->args.internal_arg_pointer)
4339 i = INTVAL (XEXP (XEXP (x, 0), 1));
4341 /* expand_call should ensure this. */
4342 gcc_assert (!arg->locate.offset.var
4343 && arg->locate.size.var == 0
4344 && GET_CODE (size_rtx) == CONST_INT);
4346 if (arg->locate.offset.constant > i)
4348 if (arg->locate.offset.constant < i + INTVAL (size_rtx))
4349 sibcall_failure = 1;
4351 else if (arg->locate.offset.constant < i)
4353 /* Use arg->locate.size.constant instead of size_rtx
4354 because we only care about the part of the argument
4355 on the stack. */
4356 if (i < (arg->locate.offset.constant
4357 + arg->locate.size.constant))
4358 sibcall_failure = 1;
4360 else
4362 /* Even though they appear to be at the same location,
4363 if part of the outgoing argument is in registers,
4364 they aren't really at the same location. Check for
4365 this by making sure that the incoming size is the
4366 same as the outgoing size. */
4367 if (arg->locate.size.constant != INTVAL (size_rtx))
4368 sibcall_failure = 1;
4373 emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval), size_rtx,
4374 parm_align, partial, reg, excess, argblock,
4375 ARGS_SIZE_RTX (arg->locate.offset), reg_parm_stack_space,
4376 ARGS_SIZE_RTX (arg->locate.alignment_pad));
4378 /* Unless this is a partially-in-register argument, the argument is now
4379 in the stack.
4381 ??? Unlike the case above, in which we want the actual
4382 address of the data, so that we can load it directly into a
4383 register, here we want the address of the stack slot, so that
4384 it's properly aligned for word-by-word copying or something
4385 like that. It's not clear that this is always correct. */
4386 if (partial == 0)
4387 arg->value = arg->stack_slot;
4390 if (arg->reg && GET_CODE (arg->reg) == PARALLEL)
4392 tree type = TREE_TYPE (arg->tree_value);
4393 arg->parallel_value
4394 = emit_group_load_into_temps (arg->reg, arg->value, type,
4395 int_size_in_bytes (type));
4398 /* Mark all slots this store used. */
4399 if (ACCUMULATE_OUTGOING_ARGS && !(flags & ECF_SIBCALL)
4400 && argblock && ! variable_size && arg->stack)
4401 for (i = lower_bound; i < upper_bound; i++)
4402 stack_usage_map[i] = 1;
4404 /* Once we have pushed something, pops can't safely
4405 be deferred during the rest of the arguments. */
4406 NO_DEFER_POP;
4408 /* Free any temporary slots made in processing this argument. Show
4409 that we might have taken the address of something and pushed that
4410 as an operand. */
4411 preserve_temp_slots (NULL_RTX);
4412 free_temp_slots ();
4413 pop_temp_slots ();
4415 return sibcall_failure;
4418 /* Nonzero if we do not know how to pass TYPE solely in registers. */
4420 bool
4421 must_pass_in_stack_var_size (enum machine_mode mode ATTRIBUTE_UNUSED,
4422 const_tree type)
4424 if (!type)
4425 return false;
4427 /* If the type has variable size... */
4428 if (TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
4429 return true;
4431 /* If the type is marked as addressable (it is required
4432 to be constructed into the stack)... */
4433 if (TREE_ADDRESSABLE (type))
4434 return true;
4436 return false;
4439 /* Another version of the TARGET_MUST_PASS_IN_STACK hook. This one
4440 takes trailing padding of a structure into account. */
4441 /* ??? Should be able to merge these two by examining BLOCK_REG_PADDING. */
4443 bool
4444 must_pass_in_stack_var_size_or_pad (enum machine_mode mode, const_tree type)
4446 if (!type)
4447 return false;
4449 /* If the type has variable size... */
4450 if (TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
4451 return true;
4453 /* If the type is marked as addressable (it is required
4454 to be constructed into the stack)... */
4455 if (TREE_ADDRESSABLE (type))
4456 return true;
4458 /* If the padding and mode of the type are such that a copy into
4459 a register would put it into the wrong part of the register. */
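/* For instance, assuming a 32-bit PARM_BOUNDARY, a 6-byte BLKmode
   value trips the size test below (6 % 4 != 0); if its padding
   direction also matches the endianness test, a plain register copy
   would leave the bytes in the wrong part of the register.  */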
4460 if (mode == BLKmode
4461 && int_size_in_bytes (type) % (PARM_BOUNDARY / BITS_PER_UNIT)
4462 && (FUNCTION_ARG_PADDING (mode, type)
4463 == (BYTES_BIG_ENDIAN ? upward : downward)))
4464 return true;
4466 return false;