Daily bump.
[official-gcc.git] / gcc / calls.c
blob9513c308507b2c9777dc4d8c8c9b19406e38f1c9
1 /* Convert function calls to rtl insns, for GNU C compiler.
2 Copyright (C) 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998
3 1999, 2000 Free Software Foundation, Inc.
5 This file is part of GNU CC.
7 GNU CC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2, or (at your option)
10 any later version.
12 GNU CC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GNU CC; see the file COPYING. If not, write to
19 the Free Software Foundation, 59 Temple Place - Suite 330,
20 Boston, MA 02111-1307, USA. */
22 #include "config.h"
23 #include "system.h"
24 #include "rtl.h"
25 #include "tree.h"
26 #include "flags.h"
27 #include "expr.h"
28 #include "function.h"
29 #include "regs.h"
30 #include "insn-flags.h"
31 #include "toplev.h"
32 #include "output.h"
33 #include "tm_p.h"
34 #include "timevar.h"
35 #include "sbitmap.h"
37 #ifndef ACCUMULATE_OUTGOING_ARGS
38 #define ACCUMULATE_OUTGOING_ARGS 0
39 #endif
41 /* Supply a default definition for PUSH_ARGS. */
42 #ifndef PUSH_ARGS
43 #ifdef PUSH_ROUNDING
44 #define PUSH_ARGS !ACCUMULATE_OUTGOING_ARGS
45 #else
46 #define PUSH_ARGS 0
47 #endif
48 #endif
50 #if !defined FUNCTION_OK_FOR_SIBCALL
51 #define FUNCTION_OK_FOR_SIBCALL(DECL) 1
52 #endif
54 #if !defined PREFERRED_STACK_BOUNDARY && defined STACK_BOUNDARY
55 #define PREFERRED_STACK_BOUNDARY STACK_BOUNDARY
56 #endif
58 /* Decide whether a function's arguments should be processed
59 from first to last or from last to first.
61 They should if the stack and args grow in opposite directions, but
62 only if we have push insns. */
64 #ifdef PUSH_ROUNDING
66 #if defined (STACK_GROWS_DOWNWARD) != defined (ARGS_GROW_DOWNWARD)
67 #define PUSH_ARGS_REVERSED PUSH_ARGS
68 #endif
70 #endif
72 #ifndef PUSH_ARGS_REVERSED
73 #define PUSH_ARGS_REVERSED 0
74 #endif
76 /* Like PREFERRED_STACK_BOUNDARY but in units of bytes, not bits. */
77 #define STACK_BYTES (PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT)
79 /* Data structure and subroutines used within expand_call. */
81 struct arg_data
83 /* Tree node for this argument. */
84 tree tree_value;
85 /* Mode for value; TYPE_MODE unless promoted. */
86 enum machine_mode mode;
87 /* Current RTL value for argument, or 0 if it isn't precomputed. */
88 rtx value;
89 /* Initially-compute RTL value for argument; only for const functions. */
90 rtx initial_value;
91 /* Register to pass this argument in, 0 if passed on stack, or an
92 PARALLEL if the arg is to be copied into multiple non-contiguous
93 registers. */
94 rtx reg;
95 /* Register to pass this argument in when generating tail call sequence.
96 This is not the same register as for normal calls on machines with
97 register windows. */
98 rtx tail_call_reg;
99 /* If REG was promoted from the actual mode of the argument expression,
100 indicates whether the promotion is sign- or zero-extended. */
101 int unsignedp;
102 /* Number of registers to use. 0 means put the whole arg in registers.
103 Also 0 if not passed in registers. */
104 int partial;
105 /* Non-zero if argument must be passed on stack.
106 Note that some arguments may be passed on the stack
107 even though pass_on_stack is zero, just because FUNCTION_ARG says so.
108 pass_on_stack identifies arguments that *cannot* go in registers. */
109 int pass_on_stack;
110 /* Offset of this argument from beginning of stack-args. */
111 struct args_size offset;
112 /* Similar, but offset to the start of the stack slot. Different from
113 OFFSET if this arg pads downward. */
114 struct args_size slot_offset;
115 /* Size of this argument on the stack, rounded up for any padding it gets,
116 parts of the argument passed in registers do not count.
117 If REG_PARM_STACK_SPACE is defined, then register parms
118 are counted here as well. */
119 struct args_size size;
120 /* Location on the stack at which parameter should be stored. The store
121 has already been done if STACK == VALUE. */
122 rtx stack;
123 /* Location on the stack of the start of this argument slot. This can
124 differ from STACK if this arg pads downward. This location is known
125 to be aligned to FUNCTION_ARG_BOUNDARY. */
126 rtx stack_slot;
127 /* Place that this stack area has been saved, if needed. */
128 rtx save_area;
129 /* If an argument's alignment does not permit direct copying into registers,
130 copy in smaller-sized pieces into pseudos. These are stored in a
131 block pointed to by this field. The next field says how many
132 word-sized pseudos we made. */
133 rtx *aligned_regs;
134 int n_aligned_regs;
135 /* The amount that the stack pointer needs to be adjusted to
136 force alignment for the next argument. */
137 struct args_size alignment_pad;
140 /* A vector of one char per byte of stack space. A byte if non-zero if
141 the corresponding stack location has been used.
142 This vector is used to prevent a function call within an argument from
143 clobbering any stack already set up. */
144 static char *stack_usage_map;
146 /* Size of STACK_USAGE_MAP. */
147 static int highest_outgoing_arg_in_use;
149 /* A bitmap of virtual-incoming stack space. Bit is set if the corresponding
150 stack location's tail call argument has been already stored into the stack.
151 This bitmap is used to prevent sibling call optimization if function tries
152 to use parent's incoming argument slots when they have been already
153 overwritten with tail call arguments. */
154 static sbitmap stored_args_map;
156 /* stack_arg_under_construction is nonzero when an argument may be
157 initialized with a constructor call (including a C function that
158 returns a BLKmode struct) and expand_call must take special action
159 to make sure the object being constructed does not overlap the
160 argument list for the constructor call. */
161 int stack_arg_under_construction;
163 static int calls_function PARAMS ((tree, int));
164 static int calls_function_1 PARAMS ((tree, int));
166 /* Nonzero if this is a call to a `const' function. */
167 #define ECF_CONST 1
168 /* Nonzero if this is a call to a `volatile' function. */
169 #define ECF_NORETURN 2
170 /* Nonzero if this is a call to malloc or a related function. */
171 #define ECF_MALLOC 4
172 /* Nonzero if it is plausible that this is a call to alloca. */
173 #define ECF_MAY_BE_ALLOCA 8
174 /* Nonzero if this is a call to a function that won't throw an exception. */
175 #define ECF_NOTHROW 16
176 /* Nonzero if this is a call to setjmp or a related function. */
177 #define ECF_RETURNS_TWICE 32
178 /* Nonzero if this is a call to `longjmp'. */
179 #define ECF_LONGJMP 64
180 /* Nonzero if this is a syscall that makes a new process in the image of
181 the current one. */
182 #define ECF_FORK_OR_EXEC 128
183 #define ECF_SIBCALL 256
184 /* Nonzero if this is a call to "pure" function (like const function,
185 but may read memory. */
186 #define ECF_PURE 512
187 /* Nonzero if this is a call to a function that returns with the stack
188 pointer depressed. */
189 #define ECF_SP_DEPRESSED 1024
191 static void emit_call_1 PARAMS ((rtx, tree, tree, HOST_WIDE_INT,
192 HOST_WIDE_INT, HOST_WIDE_INT, rtx,
193 rtx, int, rtx, int));
194 static void precompute_register_parameters PARAMS ((int,
195 struct arg_data *,
196 int *));
197 static int store_one_arg PARAMS ((struct arg_data *, rtx, int, int,
198 int));
199 static void store_unaligned_arguments_into_pseudos PARAMS ((struct arg_data *,
200 int));
201 static int finalize_must_preallocate PARAMS ((int, int,
202 struct arg_data *,
203 struct args_size *));
204 static void precompute_arguments PARAMS ((int, int,
205 struct arg_data *));
206 static int compute_argument_block_size PARAMS ((int,
207 struct args_size *,
208 int));
209 static void initialize_argument_information PARAMS ((int,
210 struct arg_data *,
211 struct args_size *,
212 int, tree, tree,
213 CUMULATIVE_ARGS *,
214 int, rtx *, int *,
215 int *, int *));
216 static void compute_argument_addresses PARAMS ((struct arg_data *,
217 rtx, int));
218 static rtx rtx_for_function_call PARAMS ((tree, tree));
219 static void load_register_parameters PARAMS ((struct arg_data *,
220 int, rtx *, int));
221 static int libfunc_nothrow PARAMS ((rtx));
222 static rtx emit_library_call_value_1 PARAMS ((int, rtx, rtx,
223 enum libcall_type,
224 enum machine_mode,
225 int, va_list));
226 static int special_function_p PARAMS ((tree, int));
227 static int flags_from_decl_or_type PARAMS ((tree));
228 static rtx try_to_integrate PARAMS ((tree, tree, rtx,
229 int, tree, rtx));
230 static int check_sibcall_argument_overlap_1 PARAMS ((rtx));
231 static int check_sibcall_argument_overlap PARAMS ((rtx, struct arg_data *));
233 static int combine_pending_stack_adjustment_and_call
234 PARAMS ((int, struct args_size *, int));
236 #ifdef REG_PARM_STACK_SPACE
237 static rtx save_fixed_argument_area PARAMS ((int, rtx, int *, int *));
238 static void restore_fixed_argument_area PARAMS ((rtx, rtx, int, int));
239 #endif
241 /* If WHICH is 1, return 1 if EXP contains a call to the built-in function
242 `alloca'.
244 If WHICH is 0, return 1 if EXP contains a call to any function.
245 Actually, we only need return 1 if evaluating EXP would require pushing
246 arguments on the stack, but that is too difficult to compute, so we just
247 assume any function call might require the stack. */
249 static tree calls_function_save_exprs;
251 static int
252 calls_function (exp, which)
253 tree exp;
254 int which;
256 int val;
258 calls_function_save_exprs = 0;
259 val = calls_function_1 (exp, which);
260 calls_function_save_exprs = 0;
261 return val;
264 /* Recursive function to do the work of above function. */
266 static int
267 calls_function_1 (exp, which)
268 tree exp;
269 int which;
271 register int i;
272 enum tree_code code = TREE_CODE (exp);
273 int class = TREE_CODE_CLASS (code);
274 int length = first_rtl_op (code);
276 /* If this code is language-specific, we don't know what it will do. */
277 if ((int) code >= NUM_TREE_CODES)
278 return 1;
280 switch (code)
282 case CALL_EXPR:
283 if (which == 0)
284 return 1;
285 else if ((TREE_CODE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))))
286 == FUNCTION_TYPE)
287 && (TYPE_RETURNS_STACK_DEPRESSED
288 (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))))))
289 return 1;
290 else if (TREE_CODE (TREE_OPERAND (exp, 0)) == ADDR_EXPR
291 && (TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
292 == FUNCTION_DECL)
293 && (special_function_p (TREE_OPERAND (TREE_OPERAND (exp, 0), 0),
295 & ECF_MAY_BE_ALLOCA))
296 return 1;
298 break;
300 case SAVE_EXPR:
301 if (SAVE_EXPR_RTL (exp) != 0)
302 return 0;
303 if (value_member (exp, calls_function_save_exprs))
304 return 0;
305 calls_function_save_exprs = tree_cons (NULL_TREE, exp,
306 calls_function_save_exprs);
307 return (TREE_OPERAND (exp, 0) != 0
308 && calls_function_1 (TREE_OPERAND (exp, 0), which));
310 case BLOCK:
312 register tree local;
313 register tree subblock;
315 for (local = BLOCK_VARS (exp); local; local = TREE_CHAIN (local))
316 if (DECL_INITIAL (local) != 0
317 && calls_function_1 (DECL_INITIAL (local), which))
318 return 1;
320 for (subblock = BLOCK_SUBBLOCKS (exp);
321 subblock;
322 subblock = TREE_CHAIN (subblock))
323 if (calls_function_1 (subblock, which))
324 return 1;
326 return 0;
328 case TREE_LIST:
329 for (; exp != 0; exp = TREE_CHAIN (exp))
330 if (calls_function_1 (TREE_VALUE (exp), which))
331 return 1;
332 return 0;
334 default:
335 break;
338 /* Only expressions, references, and blocks can contain calls. */
339 if (! IS_EXPR_CODE_CLASS (class) && class != 'r' && class != 'b')
340 return 0;
342 for (i = 0; i < length; i++)
343 if (TREE_OPERAND (exp, i) != 0
344 && calls_function_1 (TREE_OPERAND (exp, i), which))
345 return 1;
347 return 0;
350 /* Force FUNEXP into a form suitable for the address of a CALL,
351 and return that as an rtx. Also load the static chain register
352 if FNDECL is a nested function.
354 CALL_FUSAGE points to a variable holding the prospective
355 CALL_INSN_FUNCTION_USAGE information. */
358 prepare_call_address (funexp, fndecl, call_fusage, reg_parm_seen)
359 rtx funexp;
360 tree fndecl;
361 rtx *call_fusage;
362 int reg_parm_seen;
364 rtx static_chain_value = 0;
366 funexp = protect_from_queue (funexp, 0);
368 if (fndecl != 0)
369 /* Get possible static chain value for nested function in C. */
370 static_chain_value = lookup_static_chain (fndecl);
372 /* Make a valid memory address and copy constants thru pseudo-regs,
373 but not for a constant address if -fno-function-cse. */
374 if (GET_CODE (funexp) != SYMBOL_REF)
375 /* If we are using registers for parameters, force the
376 function address into a register now. */
377 funexp = ((SMALL_REGISTER_CLASSES && reg_parm_seen)
378 ? force_not_mem (memory_address (FUNCTION_MODE, funexp))
379 : memory_address (FUNCTION_MODE, funexp));
380 else
382 #ifndef NO_FUNCTION_CSE
383 if (optimize && ! flag_no_function_cse)
384 #ifdef NO_RECURSIVE_FUNCTION_CSE
385 if (fndecl != current_function_decl)
386 #endif
387 funexp = force_reg (Pmode, funexp);
388 #endif
391 if (static_chain_value != 0)
393 emit_move_insn (static_chain_rtx, static_chain_value);
395 if (GET_CODE (static_chain_rtx) == REG)
396 use_reg (call_fusage, static_chain_rtx);
399 return funexp;
402 /* Generate instructions to call function FUNEXP,
403 and optionally pop the results.
404 The CALL_INSN is the first insn generated.
406 FNDECL is the declaration node of the function. This is given to the
407 macro RETURN_POPS_ARGS to determine whether this function pops its own args.
409 FUNTYPE is the data type of the function. This is given to the macro
410 RETURN_POPS_ARGS to determine whether this function pops its own args.
411 We used to allow an identifier for library functions, but that doesn't
412 work when the return type is an aggregate type and the calling convention
413 says that the pointer to this aggregate is to be popped by the callee.
415 STACK_SIZE is the number of bytes of arguments on the stack,
416 ROUNDED_STACK_SIZE is that number rounded up to
417 PREFERRED_STACK_BOUNDARY; zero if the size is variable. This is
418 both to put into the call insn and to generate explicit popping
419 code if necessary.
421 STRUCT_VALUE_SIZE is the number of bytes wanted in a structure value.
422 It is zero if this call doesn't want a structure value.
424 NEXT_ARG_REG is the rtx that results from executing
425 FUNCTION_ARG (args_so_far, VOIDmode, void_type_node, 1)
426 just after all the args have had their registers assigned.
427 This could be whatever you like, but normally it is the first
428 arg-register beyond those used for args in this call,
429 or 0 if all the arg-registers are used in this call.
430 It is passed on to `gen_call' so you can put this info in the call insn.
432 VALREG is a hard register in which a value is returned,
433 or 0 if the call does not return a value.
435 OLD_INHIBIT_DEFER_POP is the value that `inhibit_defer_pop' had before
436 the args to this call were processed.
437 We restore `inhibit_defer_pop' to that value.
439 CALL_FUSAGE is either empty or an EXPR_LIST of USE expressions that
440 denote registers used by the called function. */
442 static void
443 emit_call_1 (funexp, fndecl, funtype, stack_size, rounded_stack_size,
444 struct_value_size, next_arg_reg, valreg, old_inhibit_defer_pop,
445 call_fusage, ecf_flags)
446 rtx funexp;
447 tree fndecl ATTRIBUTE_UNUSED;
448 tree funtype ATTRIBUTE_UNUSED;
449 HOST_WIDE_INT stack_size ATTRIBUTE_UNUSED;
450 HOST_WIDE_INT rounded_stack_size;
451 HOST_WIDE_INT struct_value_size ATTRIBUTE_UNUSED;
452 rtx next_arg_reg;
453 rtx valreg;
454 int old_inhibit_defer_pop;
455 rtx call_fusage;
456 int ecf_flags;
458 rtx rounded_stack_size_rtx = GEN_INT (rounded_stack_size);
459 rtx call_insn;
460 int already_popped = 0;
461 HOST_WIDE_INT n_popped = RETURN_POPS_ARGS (fndecl, funtype, stack_size);
462 #if defined (HAVE_call) && defined (HAVE_call_value)
463 rtx struct_value_size_rtx;
464 struct_value_size_rtx = GEN_INT (struct_value_size);
465 #endif
467 /* Ensure address is valid. SYMBOL_REF is already valid, so no need,
468 and we don't want to load it into a register as an optimization,
469 because prepare_call_address already did it if it should be done. */
470 if (GET_CODE (funexp) != SYMBOL_REF)
471 funexp = memory_address (FUNCTION_MODE, funexp);
473 #if defined (HAVE_sibcall_pop) && defined (HAVE_sibcall_value_pop)
474 if ((ecf_flags & ECF_SIBCALL)
475 && HAVE_sibcall_pop && HAVE_sibcall_value_pop
476 && (n_popped > 0 || stack_size == 0))
478 rtx n_pop = GEN_INT (n_popped));
479 rtx pat;
481 /* If this subroutine pops its own args, record that in the call insn
482 if possible, for the sake of frame pointer elimination. */
484 if (valreg)
485 pat = GEN_SIBCALL_VALUE_POP (valreg,
486 gen_rtx_MEM (FUNCTION_MODE, funexp),
487 rounded_stack_size_rtx, next_arg_reg,
488 n_pop);
489 else
490 pat = GEN_SIBCALL_POP (gen_rtx_MEM (FUNCTION_MODE, funexp),
491 rounded_stack_size_rtx, next_arg_reg, n_pop);
493 emit_call_insn (pat);
494 already_popped = 1;
496 else
497 #endif
499 #if defined (HAVE_call_pop) && defined (HAVE_call_value_pop)
500 /* If the target has "call" or "call_value" insns, then prefer them
501 if no arguments are actually popped. If the target does not have
502 "call" or "call_value" insns, then we must use the popping versions
503 even if the call has no arguments to pop. */
504 #if defined (HAVE_call) && defined (HAVE_call_value)
505 if (HAVE_call && HAVE_call_value && HAVE_call_pop && HAVE_call_value_pop
506 && n_popped > 0 && ! (ecf_flags & ECF_SP_DEPRESSED))
507 #else
508 if (HAVE_call_pop && HAVE_call_value_pop)
509 #endif
511 rtx n_pop = GEN_INT (n_popped);
512 rtx pat;
514 /* If this subroutine pops its own args, record that in the call insn
515 if possible, for the sake of frame pointer elimination. */
517 if (valreg)
518 pat = GEN_CALL_VALUE_POP (valreg,
519 gen_rtx_MEM (FUNCTION_MODE, funexp),
520 rounded_stack_size_rtx, next_arg_reg, n_pop);
521 else
522 pat = GEN_CALL_POP (gen_rtx_MEM (FUNCTION_MODE, funexp),
523 rounded_stack_size_rtx, next_arg_reg, n_pop);
525 emit_call_insn (pat);
526 already_popped = 1;
528 else
529 #endif
531 #if defined (HAVE_sibcall) && defined (HAVE_sibcall_value)
532 if ((ecf_flags & ECF_SIBCALL)
533 && HAVE_sibcall && HAVE_sibcall_value)
535 if (valreg)
536 emit_call_insn (GEN_SIBCALL_VALUE (valreg,
537 gen_rtx_MEM (FUNCTION_MODE, funexp),
538 rounded_stack_size_rtx,
539 next_arg_reg, NULL_RTX));
540 else
541 emit_call_insn (GEN_SIBCALL (gen_rtx_MEM (FUNCTION_MODE, funexp),
542 rounded_stack_size_rtx, next_arg_reg,
543 struct_value_size_rtx));
545 else
546 #endif
548 #if defined (HAVE_call) && defined (HAVE_call_value)
549 if (HAVE_call && HAVE_call_value)
551 if (valreg)
552 emit_call_insn (GEN_CALL_VALUE (valreg,
553 gen_rtx_MEM (FUNCTION_MODE, funexp),
554 rounded_stack_size_rtx, next_arg_reg,
555 NULL_RTX));
556 else
557 emit_call_insn (GEN_CALL (gen_rtx_MEM (FUNCTION_MODE, funexp),
558 rounded_stack_size_rtx, next_arg_reg,
559 struct_value_size_rtx));
561 else
562 #endif
563 abort ();
565 /* Find the CALL insn we just emitted. */
566 for (call_insn = get_last_insn ();
567 call_insn && GET_CODE (call_insn) != CALL_INSN;
568 call_insn = PREV_INSN (call_insn))
571 if (! call_insn)
572 abort ();
574 /* Mark memory as used for "pure" function call. */
575 if (ecf_flags & ECF_PURE)
577 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
578 gen_rtx_USE (VOIDmode,
579 gen_rtx_MEM (BLKmode,
580 gen_rtx_SCRATCH (VOIDmode))), call_fusage);
583 /* Put the register usage information on the CALL. If there is already
584 some usage information, put ours at the end. */
585 if (CALL_INSN_FUNCTION_USAGE (call_insn))
587 rtx link;
589 for (link = CALL_INSN_FUNCTION_USAGE (call_insn); XEXP (link, 1) != 0;
590 link = XEXP (link, 1))
593 XEXP (link, 1) = call_fusage;
595 else
596 CALL_INSN_FUNCTION_USAGE (call_insn) = call_fusage;
598 /* If this is a const call, then set the insn's unchanging bit. */
599 if (ecf_flags & (ECF_CONST | ECF_PURE))
600 CONST_CALL_P (call_insn) = 1;
602 /* If this call can't throw, attach a REG_EH_REGION reg note to that
603 effect. */
604 if (ecf_flags & ECF_NOTHROW)
605 REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_EH_REGION, const0_rtx,
606 REG_NOTES (call_insn));
608 if (ecf_flags & ECF_NORETURN)
609 REG_NOTES (call_insn) = gen_rtx_EXPR_LIST (REG_NORETURN, const0_rtx,
610 REG_NOTES (call_insn));
612 SIBLING_CALL_P (call_insn) = ((ecf_flags & ECF_SIBCALL) != 0);
614 /* Restore this now, so that we do defer pops for this call's args
615 if the context of the call as a whole permits. */
616 inhibit_defer_pop = old_inhibit_defer_pop;
618 if (n_popped > 0)
620 if (!already_popped)
621 CALL_INSN_FUNCTION_USAGE (call_insn)
622 = gen_rtx_EXPR_LIST (VOIDmode,
623 gen_rtx_CLOBBER (VOIDmode, stack_pointer_rtx),
624 CALL_INSN_FUNCTION_USAGE (call_insn));
625 rounded_stack_size -= n_popped;
626 rounded_stack_size_rtx = GEN_INT (rounded_stack_size);
627 stack_pointer_delta -= n_popped;
630 if (!ACCUMULATE_OUTGOING_ARGS)
632 /* If returning from the subroutine does not automatically pop the args,
633 we need an instruction to pop them sooner or later.
634 Perhaps do it now; perhaps just record how much space to pop later.
636 If returning from the subroutine does pop the args, indicate that the
637 stack pointer will be changed. */
639 if (rounded_stack_size != 0 && ! (ecf_flags & ECF_SP_DEPRESSED))
641 if (flag_defer_pop && inhibit_defer_pop == 0
642 && ! (ecf_flags & (ECF_CONST | ECF_PURE)))
643 pending_stack_adjust += rounded_stack_size;
644 else
645 adjust_stack (rounded_stack_size_rtx);
648 /* When we accumulate outgoing args, we must avoid any stack manipulations.
649 Restore the stack pointer to its original value now. Usually
650 ACCUMULATE_OUTGOING_ARGS targets don't get here, but there are exceptions.
651 On i386 ACCUMULATE_OUTGOING_ARGS can be enabled on demand, and
652 popping variants of functions exist as well.
654 ??? We may optimize similar to defer_pop above, but it is
655 probably not worthwhile.
657 ??? It will be worthwhile to enable combine_stack_adjustments even for
658 such machines. */
659 else if (n_popped)
660 anti_adjust_stack (GEN_INT (n_popped));
663 /* Determine if the function identified by NAME and FNDECL is one with
664 special properties we wish to know about.
666 For example, if the function might return more than one time (setjmp), then
667 set RETURNS_TWICE to a nonzero value.
669 Similarly set LONGJMP for if the function is in the longjmp family.
671 Set MALLOC for any of the standard memory allocation functions which
672 allocate from the heap.
674 Set MAY_BE_ALLOCA for any memory allocation function that might allocate
675 space from the stack such as alloca. */
677 static int
678 special_function_p (fndecl, flags)
679 tree fndecl;
680 int flags;
682 if (! (flags & ECF_MALLOC)
683 && fndecl && DECL_NAME (fndecl)
684 && IDENTIFIER_LENGTH (DECL_NAME (fndecl)) <= 17
685 /* Exclude functions not at the file scope, or not `extern',
686 since they are not the magic functions we would otherwise
687 think they are. */
688 && DECL_CONTEXT (fndecl) == NULL_TREE && TREE_PUBLIC (fndecl))
690 const char *name = IDENTIFIER_POINTER (DECL_NAME (fndecl));
691 const char *tname = name;
693 /* We assume that alloca will always be called by name. It
694 makes no sense to pass it as a pointer-to-function to
695 anything that does not understand its behavior. */
696 if (((IDENTIFIER_LENGTH (DECL_NAME (fndecl)) == 6
697 && name[0] == 'a'
698 && ! strcmp (name, "alloca"))
699 || (IDENTIFIER_LENGTH (DECL_NAME (fndecl)) == 16
700 && name[0] == '_'
701 && ! strcmp (name, "__builtin_alloca"))))
702 flags |= ECF_MAY_BE_ALLOCA;
704 /* Disregard prefix _, __ or __x. */
705 if (name[0] == '_')
707 if (name[1] == '_' && name[2] == 'x')
708 tname += 3;
709 else if (name[1] == '_')
710 tname += 2;
711 else
712 tname += 1;
715 if (tname[0] == 's')
717 if ((tname[1] == 'e'
718 && (! strcmp (tname, "setjmp")
719 || ! strcmp (tname, "setjmp_syscall")))
720 || (tname[1] == 'i'
721 && ! strcmp (tname, "sigsetjmp"))
722 || (tname[1] == 'a'
723 && ! strcmp (tname, "savectx")))
724 flags |= ECF_RETURNS_TWICE;
726 if (tname[1] == 'i'
727 && ! strcmp (tname, "siglongjmp"))
728 flags |= ECF_LONGJMP;
730 else if ((tname[0] == 'q' && tname[1] == 's'
731 && ! strcmp (tname, "qsetjmp"))
732 || (tname[0] == 'v' && tname[1] == 'f'
733 && ! strcmp (tname, "vfork")))
734 flags |= ECF_RETURNS_TWICE;
736 else if (tname[0] == 'l' && tname[1] == 'o'
737 && ! strcmp (tname, "longjmp"))
738 flags |= ECF_LONGJMP;
740 else if ((tname[0] == 'f' && tname[1] == 'o'
741 && ! strcmp (tname, "fork"))
742 /* Linux specific: __clone. check NAME to insist on the
743 leading underscores, to avoid polluting the ISO / POSIX
744 namespace. */
745 || (name[0] == '_' && name[1] == '_'
746 && ! strcmp (tname, "clone"))
747 || (tname[0] == 'e' && tname[1] == 'x' && tname[2] == 'e'
748 && tname[3] == 'c' && (tname[4] == 'l' || tname[4] == 'v')
749 && (tname[5] == '\0'
750 || ((tname[5] == 'p' || tname[5] == 'e')
751 && tname[6] == '\0'))))
752 flags |= ECF_FORK_OR_EXEC;
754 /* Do not add any more malloc-like functions to this list,
755 instead mark them as malloc functions using the malloc attribute.
756 Note, realloc is not suitable for attribute malloc since
757 it may return the same address across multiple calls.
758 C++ operator new is not suitable because it is not required
759 to return a unique pointer; indeed, the standard placement new
760 just returns its argument. */
761 else if (TYPE_MODE (TREE_TYPE (TREE_TYPE (fndecl))) == Pmode
762 && (! strcmp (tname, "malloc")
763 || ! strcmp (tname, "calloc")
764 || ! strcmp (tname, "strdup")))
765 flags |= ECF_MALLOC;
767 return flags;
770 /* Return nonzero when tree represent call to longjmp. */
773 setjmp_call_p (fndecl)
774 tree fndecl;
776 return special_function_p (fndecl, 0) & ECF_RETURNS_TWICE;
779 /* Detect flags (function attributes) from the function type node. */
781 static int
782 flags_from_decl_or_type (exp)
783 tree exp;
785 int flags = 0;
787 /* ??? We can't set IS_MALLOC for function types? */
788 if (DECL_P (exp))
790 /* The function exp may have the `malloc' attribute. */
791 if (DECL_P (exp) && DECL_IS_MALLOC (exp))
792 flags |= ECF_MALLOC;
794 /* The function exp may have the `pure' attribute. */
795 if (DECL_P (exp) && DECL_IS_PURE (exp))
796 flags |= ECF_PURE;
798 if (TREE_NOTHROW (exp))
799 flags |= ECF_NOTHROW;
802 if (TREE_READONLY (exp) && ! TREE_THIS_VOLATILE (exp))
803 flags |= ECF_CONST;
805 if (TREE_THIS_VOLATILE (exp))
806 flags |= ECF_NORETURN;
808 return flags;
811 /* Precompute all register parameters as described by ARGS, storing values
812 into fields within the ARGS array.
814 NUM_ACTUALS indicates the total number elements in the ARGS array.
816 Set REG_PARM_SEEN if we encounter a register parameter. */
818 static void
819 precompute_register_parameters (num_actuals, args, reg_parm_seen)
820 int num_actuals;
821 struct arg_data *args;
822 int *reg_parm_seen;
824 int i;
826 *reg_parm_seen = 0;
828 for (i = 0; i < num_actuals; i++)
829 if (args[i].reg != 0 && ! args[i].pass_on_stack)
831 *reg_parm_seen = 1;
833 if (args[i].value == 0)
835 push_temp_slots ();
836 args[i].value = expand_expr (args[i].tree_value, NULL_RTX,
837 VOIDmode, 0);
838 preserve_temp_slots (args[i].value);
839 pop_temp_slots ();
841 /* ANSI doesn't require a sequence point here,
842 but PCC has one, so this will avoid some problems. */
843 emit_queue ();
846 /* If we are to promote the function arg to a wider mode,
847 do it now. */
849 if (args[i].mode != TYPE_MODE (TREE_TYPE (args[i].tree_value)))
850 args[i].value
851 = convert_modes (args[i].mode,
852 TYPE_MODE (TREE_TYPE (args[i].tree_value)),
853 args[i].value, args[i].unsignedp);
855 /* If the value is expensive, and we are inside an appropriately
856 short loop, put the value into a pseudo and then put the pseudo
857 into the hard reg.
859 For small register classes, also do this if this call uses
860 register parameters. This is to avoid reload conflicts while
861 loading the parameters registers. */
863 if ((! (GET_CODE (args[i].value) == REG
864 || (GET_CODE (args[i].value) == SUBREG
865 && GET_CODE (SUBREG_REG (args[i].value)) == REG)))
866 && args[i].mode != BLKmode
867 && rtx_cost (args[i].value, SET) > COSTS_N_INSNS (1)
868 && ((SMALL_REGISTER_CLASSES && *reg_parm_seen)
869 || preserve_subexpressions_p ()))
870 args[i].value = copy_to_mode_reg (args[i].mode, args[i].value);
874 #ifdef REG_PARM_STACK_SPACE
876 /* The argument list is the property of the called routine and it
877 may clobber it. If the fixed area has been used for previous
878 parameters, we must save and restore it. */
880 static rtx
881 save_fixed_argument_area (reg_parm_stack_space, argblock,
882 low_to_save, high_to_save)
883 int reg_parm_stack_space;
884 rtx argblock;
885 int *low_to_save;
886 int *high_to_save;
888 int i;
889 rtx save_area = NULL_RTX;
891 /* Compute the boundary of the that needs to be saved, if any. */
892 #ifdef ARGS_GROW_DOWNWARD
893 for (i = 0; i < reg_parm_stack_space + 1; i++)
894 #else
895 for (i = 0; i < reg_parm_stack_space; i++)
896 #endif
898 if (i >= highest_outgoing_arg_in_use
899 || stack_usage_map[i] == 0)
900 continue;
902 if (*low_to_save == -1)
903 *low_to_save = i;
905 *high_to_save = i;
908 if (*low_to_save >= 0)
910 int num_to_save = *high_to_save - *low_to_save + 1;
911 enum machine_mode save_mode
912 = mode_for_size (num_to_save * BITS_PER_UNIT, MODE_INT, 1);
913 rtx stack_area;
915 /* If we don't have the required alignment, must do this in BLKmode. */
916 if ((*low_to_save & (MIN (GET_MODE_SIZE (save_mode),
917 BIGGEST_ALIGNMENT / UNITS_PER_WORD) - 1)))
918 save_mode = BLKmode;
920 #ifdef ARGS_GROW_DOWNWARD
921 stack_area
922 = gen_rtx_MEM (save_mode,
923 memory_address (save_mode,
924 plus_constant (argblock,
925 - *high_to_save)));
926 #else
927 stack_area = gen_rtx_MEM (save_mode,
928 memory_address (save_mode,
929 plus_constant (argblock,
930 *low_to_save)));
931 #endif
932 if (save_mode == BLKmode)
934 save_area = assign_stack_temp (BLKmode, num_to_save, 0);
935 /* Cannot use emit_block_move here because it can be done by a
936 library call which in turn gets into this place again and deadly
937 infinite recursion happens. */
938 move_by_pieces (validize_mem (save_area), stack_area, num_to_save,
939 PARM_BOUNDARY);
941 else
943 save_area = gen_reg_rtx (save_mode);
944 emit_move_insn (save_area, stack_area);
947 return save_area;
950 static void
951 restore_fixed_argument_area (save_area, argblock, high_to_save, low_to_save)
952 rtx save_area;
953 rtx argblock;
954 int high_to_save;
955 int low_to_save;
957 enum machine_mode save_mode = GET_MODE (save_area);
958 #ifdef ARGS_GROW_DOWNWARD
959 rtx stack_area
960 = gen_rtx_MEM (save_mode,
961 memory_address (save_mode,
962 plus_constant (argblock,
963 - high_to_save)));
964 #else
965 rtx stack_area
966 = gen_rtx_MEM (save_mode,
967 memory_address (save_mode,
968 plus_constant (argblock,
969 low_to_save)));
970 #endif
972 if (save_mode != BLKmode)
973 emit_move_insn (stack_area, save_area);
974 else
975 /* Cannot use emit_block_move here because it can be done by a library
976 call which in turn gets into this place again and deadly infinite
977 recursion happens. */
978 move_by_pieces (stack_area, validize_mem (save_area),
979 high_to_save - low_to_save + 1, PARM_BOUNDARY);
981 #endif
983 /* If any elements in ARGS refer to parameters that are to be passed in
984 registers, but not in memory, and whose alignment does not permit a
985 direct copy into registers. Copy the values into a group of pseudos
986 which we will later copy into the appropriate hard registers.
988 Pseudos for each unaligned argument will be stored into the array
989 args[argnum].aligned_regs. The caller is responsible for deallocating
990 the aligned_regs array if it is nonzero. */
992 static void
993 store_unaligned_arguments_into_pseudos (args, num_actuals)
994 struct arg_data *args;
995 int num_actuals;
997 int i, j;
999 for (i = 0; i < num_actuals; i++)
1000 if (args[i].reg != 0 && ! args[i].pass_on_stack
1001 && args[i].mode == BLKmode
1002 && (TYPE_ALIGN (TREE_TYPE (args[i].tree_value))
1003 < (unsigned int) MIN (BIGGEST_ALIGNMENT, BITS_PER_WORD)))
1005 int bytes = int_size_in_bytes (TREE_TYPE (args[i].tree_value));
1006 int big_endian_correction = 0;
1008 args[i].n_aligned_regs
1009 = args[i].partial ? args[i].partial
1010 : (bytes + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD;
1012 args[i].aligned_regs = (rtx *) xmalloc (sizeof (rtx)
1013 * args[i].n_aligned_regs);
1015 /* Structures smaller than a word are aligned to the least
1016 significant byte (to the right). On a BYTES_BIG_ENDIAN machine,
1017 this means we must skip the empty high order bytes when
1018 calculating the bit offset. */
1019 if (BYTES_BIG_ENDIAN && bytes < UNITS_PER_WORD)
1020 big_endian_correction = (BITS_PER_WORD - (bytes * BITS_PER_UNIT));
1022 for (j = 0; j < args[i].n_aligned_regs; j++)
1024 rtx reg = gen_reg_rtx (word_mode);
1025 rtx word = operand_subword_force (args[i].value, j, BLKmode);
1026 int bitsize = MIN (bytes * BITS_PER_UNIT, BITS_PER_WORD);
1027 int bitalign = TYPE_ALIGN (TREE_TYPE (args[i].tree_value));
1029 args[i].aligned_regs[j] = reg;
1031 /* There is no need to restrict this code to loading items
1032 in TYPE_ALIGN sized hunks. The bitfield instructions can
1033 load up entire word sized registers efficiently.
1035 ??? This may not be needed anymore.
1036 We use to emit a clobber here but that doesn't let later
1037 passes optimize the instructions we emit. By storing 0 into
1038 the register later passes know the first AND to zero out the
1039 bitfield being set in the register is unnecessary. The store
1040 of 0 will be deleted as will at least the first AND. */
1042 emit_move_insn (reg, const0_rtx);
1044 bytes -= bitsize / BITS_PER_UNIT;
1045 store_bit_field (reg, bitsize, big_endian_correction, word_mode,
1046 extract_bit_field (word, bitsize, 0, 1, NULL_RTX,
1047 word_mode, word_mode, bitalign,
1048 BITS_PER_WORD),
1049 bitalign, BITS_PER_WORD);
1054 /* Fill in ARGS_SIZE and ARGS array based on the parameters found in
1055 ACTPARMS.
1057 NUM_ACTUALS is the total number of parameters.
1059 N_NAMED_ARGS is the total number of named arguments.
1061 FNDECL is the tree code for the target of this call (if known)
1063 ARGS_SO_FAR holds state needed by the target to know where to place
1064 the next argument.
1066 REG_PARM_STACK_SPACE is the number of bytes of stack space reserved
1067 for arguments which are passed in registers.
1069 OLD_STACK_LEVEL is a pointer to an rtx which olds the old stack level
1070 and may be modified by this routine.
1072 OLD_PENDING_ADJ, MUST_PREALLOCATE and FLAGS are pointers to integer
1073 flags which may may be modified by this routine. */
1075 static void
1076 initialize_argument_information (num_actuals, args, args_size, n_named_args,
1077 actparms, fndecl, args_so_far,
1078 reg_parm_stack_space, old_stack_level,
1079 old_pending_adj, must_preallocate,
1080 ecf_flags)
1081 int num_actuals ATTRIBUTE_UNUSED;
1082 struct arg_data *args;
1083 struct args_size *args_size;
1084 int n_named_args ATTRIBUTE_UNUSED;
1085 tree actparms;
1086 tree fndecl;
1087 CUMULATIVE_ARGS *args_so_far;
1088 int reg_parm_stack_space;
1089 rtx *old_stack_level;
1090 int *old_pending_adj;
1091 int *must_preallocate;
1092 int *ecf_flags;
1094 /* 1 if scanning parms front to back, -1 if scanning back to front. */
1095 int inc;
1097 /* Count arg position in order args appear. */
1098 int argpos;
1100 struct args_size alignment_pad;
1101 int i;
1102 tree p;
1104 args_size->constant = 0;
1105 args_size->var = 0;
1107 /* In this loop, we consider args in the order they are written.
1108 We fill up ARGS from the front or from the back if necessary
1109 so that in any case the first arg to be pushed ends up at the front. */
1111 if (PUSH_ARGS_REVERSED)
1113 i = num_actuals - 1, inc = -1;
1114 /* In this case, must reverse order of args
1115 so that we compute and push the last arg first. */
1117 else
1119 i = 0, inc = 1;
1122 /* I counts args in order (to be) pushed; ARGPOS counts in order written. */
1123 for (p = actparms, argpos = 0; p; p = TREE_CHAIN (p), i += inc, argpos++)
1125 tree type = TREE_TYPE (TREE_VALUE (p));
1126 int unsignedp;
1127 enum machine_mode mode;
1129 args[i].tree_value = TREE_VALUE (p);
1131 /* Replace erroneous argument with constant zero. */
1132 if (type == error_mark_node || !COMPLETE_TYPE_P (type))
1133 args[i].tree_value = integer_zero_node, type = integer_type_node;
1135 /* If TYPE is a transparent union, pass things the way we would
1136 pass the first field of the union. We have already verified that
1137 the modes are the same. */
1138 if (TREE_CODE (type) == UNION_TYPE && TYPE_TRANSPARENT_UNION (type))
1139 type = TREE_TYPE (TYPE_FIELDS (type));
1141 /* Decide where to pass this arg.
1143 args[i].reg is nonzero if all or part is passed in registers.
1145 args[i].partial is nonzero if part but not all is passed in registers,
1146 and the exact value says how many words are passed in registers.
1148 args[i].pass_on_stack is nonzero if the argument must at least be
1149 computed on the stack. It may then be loaded back into registers
1150 if args[i].reg is nonzero.
1152 These decisions are driven by the FUNCTION_... macros and must agree
1153 with those made by function.c. */
1155 /* See if this argument should be passed by invisible reference. */
1156 if ((TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST
1157 && contains_placeholder_p (TYPE_SIZE (type)))
1158 || TREE_ADDRESSABLE (type)
1159 #ifdef FUNCTION_ARG_PASS_BY_REFERENCE
1160 || FUNCTION_ARG_PASS_BY_REFERENCE (*args_so_far, TYPE_MODE (type),
1161 type, argpos < n_named_args)
1162 #endif
1165 /* If we're compiling a thunk, pass through invisible
1166 references instead of making a copy. */
1167 if (current_function_is_thunk
1168 #ifdef FUNCTION_ARG_CALLEE_COPIES
1169 || (FUNCTION_ARG_CALLEE_COPIES (*args_so_far, TYPE_MODE (type),
1170 type, argpos < n_named_args)
1171 /* If it's in a register, we must make a copy of it too. */
1172 /* ??? Is this a sufficient test? Is there a better one? */
1173 && !(TREE_CODE (args[i].tree_value) == VAR_DECL
1174 && REG_P (DECL_RTL (args[i].tree_value)))
1175 && ! TREE_ADDRESSABLE (type))
1176 #endif
1179 /* C++ uses a TARGET_EXPR to indicate that we want to make a
1180 new object from the argument. If we are passing by
1181 invisible reference, the callee will do that for us, so we
1182 can strip off the TARGET_EXPR. This is not always safe,
1183 but it is safe in the only case where this is a useful
1184 optimization; namely, when the argument is a plain object.
1185 In that case, the frontend is just asking the backend to
1186 make a bitwise copy of the argument. */
1188 if (TREE_CODE (args[i].tree_value) == TARGET_EXPR
1189 && (DECL_P (TREE_OPERAND (args[i].tree_value, 1)))
1190 && ! REG_P (DECL_RTL (TREE_OPERAND (args[i].tree_value, 1))))
1191 args[i].tree_value = TREE_OPERAND (args[i].tree_value, 1);
1193 args[i].tree_value = build1 (ADDR_EXPR,
1194 build_pointer_type (type),
1195 args[i].tree_value);
1196 type = build_pointer_type (type);
1198 else
1200 /* We make a copy of the object and pass the address to the
1201 function being called. */
1202 rtx copy;
1204 if (!COMPLETE_TYPE_P (type)
1205 || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST
1206 || (flag_stack_check && ! STACK_CHECK_BUILTIN
1207 && (0 < compare_tree_int (TYPE_SIZE_UNIT (type),
1208 STACK_CHECK_MAX_VAR_SIZE))))
1210 /* This is a variable-sized object. Make space on the stack
1211 for it. */
1212 rtx size_rtx = expr_size (TREE_VALUE (p));
1214 if (*old_stack_level == 0)
1216 emit_stack_save (SAVE_BLOCK, old_stack_level, NULL_RTX);
1217 *old_pending_adj = pending_stack_adjust;
1218 pending_stack_adjust = 0;
1221 copy = gen_rtx_MEM (BLKmode,
1222 allocate_dynamic_stack_space
1223 (size_rtx, NULL_RTX, TYPE_ALIGN (type)));
1224 set_mem_attributes (copy, type, 1);
1226 else
1227 copy = assign_temp (type, 0, 1, 0);
1229 store_expr (args[i].tree_value, copy, 0);
1230 *ecf_flags &= ~(ECF_CONST | ECF_PURE);
1232 args[i].tree_value = build1 (ADDR_EXPR,
1233 build_pointer_type (type),
1234 make_tree (type, copy));
1235 type = build_pointer_type (type);
1239 mode = TYPE_MODE (type);
1240 unsignedp = TREE_UNSIGNED (type);
1242 #ifdef PROMOTE_FUNCTION_ARGS
1243 mode = promote_mode (type, mode, &unsignedp, 1);
1244 #endif
1246 args[i].unsignedp = unsignedp;
1247 args[i].mode = mode;
1249 args[i].reg = FUNCTION_ARG (*args_so_far, mode, type,
1250 argpos < n_named_args);
1251 #ifdef FUNCTION_INCOMING_ARG
1252 /* If this is a sibling call and the machine has register windows, the
1253 register window has to be unwinded before calling the routine, so
1254 arguments have to go into the incoming registers. */
1255 args[i].tail_call_reg = FUNCTION_INCOMING_ARG (*args_so_far, mode, type,
1256 argpos < n_named_args);
1257 #else
1258 args[i].tail_call_reg = args[i].reg;
1259 #endif
1261 #ifdef FUNCTION_ARG_PARTIAL_NREGS
1262 if (args[i].reg)
1263 args[i].partial
1264 = FUNCTION_ARG_PARTIAL_NREGS (*args_so_far, mode, type,
1265 argpos < n_named_args);
1266 #endif
1268 args[i].pass_on_stack = MUST_PASS_IN_STACK (mode, type);
1270 /* If FUNCTION_ARG returned a (parallel [(expr_list (nil) ...) ...]),
1271 it means that we are to pass this arg in the register(s) designated
1272 by the PARALLEL, but also to pass it in the stack. */
1273 if (args[i].reg && GET_CODE (args[i].reg) == PARALLEL
1274 && XEXP (XVECEXP (args[i].reg, 0, 0), 0) == 0)
1275 args[i].pass_on_stack = 1;
1277 /* If this is an addressable type, we must preallocate the stack
1278 since we must evaluate the object into its final location.
1280 If this is to be passed in both registers and the stack, it is simpler
1281 to preallocate. */
1282 if (TREE_ADDRESSABLE (type)
1283 || (args[i].pass_on_stack && args[i].reg != 0))
1284 *must_preallocate = 1;
1286 /* If this is an addressable type, we cannot pre-evaluate it. Thus,
1287 we cannot consider this function call constant. */
1288 if (TREE_ADDRESSABLE (type))
1289 *ecf_flags &= ~(ECF_CONST | ECF_PURE);
1291 /* Compute the stack-size of this argument. */
1292 if (args[i].reg == 0 || args[i].partial != 0
1293 || reg_parm_stack_space > 0
1294 || args[i].pass_on_stack)
1295 locate_and_pad_parm (mode, type,
1296 #ifdef STACK_PARMS_IN_REG_PARM_AREA
1298 #else
1299 args[i].reg != 0,
1300 #endif
1301 fndecl, args_size, &args[i].offset,
1302 &args[i].size, &alignment_pad);
1304 #ifndef ARGS_GROW_DOWNWARD
1305 args[i].slot_offset = *args_size;
1306 #endif
1308 args[i].alignment_pad = alignment_pad;
1310 /* If a part of the arg was put into registers,
1311 don't include that part in the amount pushed. */
1312 if (reg_parm_stack_space == 0 && ! args[i].pass_on_stack)
1313 args[i].size.constant -= ((args[i].partial * UNITS_PER_WORD)
1314 / (PARM_BOUNDARY / BITS_PER_UNIT)
1315 * (PARM_BOUNDARY / BITS_PER_UNIT));
1317 /* Update ARGS_SIZE, the total stack space for args so far. */
1319 args_size->constant += args[i].size.constant;
1320 if (args[i].size.var)
1322 ADD_PARM_SIZE (*args_size, args[i].size.var);
1325 /* Since the slot offset points to the bottom of the slot,
1326 we must record it after incrementing if the args grow down. */
1327 #ifdef ARGS_GROW_DOWNWARD
1328 args[i].slot_offset = *args_size;
1330 args[i].slot_offset.constant = -args_size->constant;
1331 if (args_size->var)
1332 SUB_PARM_SIZE (args[i].slot_offset, args_size->var);
1333 #endif
1335 /* Increment ARGS_SO_FAR, which has info about which arg-registers
1336 have been used, etc. */
1338 FUNCTION_ARG_ADVANCE (*args_so_far, TYPE_MODE (type), type,
1339 argpos < n_named_args);
1343 /* Update ARGS_SIZE to contain the total size for the argument block.
1344 Return the original constant component of the argument block's size.
1346 REG_PARM_STACK_SPACE holds the number of bytes of stack space reserved
1347 for arguments passed in registers. */
1349 static int
1350 compute_argument_block_size (reg_parm_stack_space, args_size,
1351 preferred_stack_boundary)
1352 int reg_parm_stack_space;
1353 struct args_size *args_size;
1354 int preferred_stack_boundary ATTRIBUTE_UNUSED;
1356 int unadjusted_args_size = args_size->constant;
1358 /* For accumulate outgoing args mode we don't need to align, since the frame
1359 will be already aligned. Align to STACK_BOUNDARY in order to prevent
1360 backends from generating missaligned frame sizes. */
1361 #ifdef STACK_BOUNDARY
1362 if (ACCUMULATE_OUTGOING_ARGS && preferred_stack_boundary > STACK_BOUNDARY)
1363 preferred_stack_boundary = STACK_BOUNDARY;
1364 #endif
1366 /* Compute the actual size of the argument block required. The variable
1367 and constant sizes must be combined, the size may have to be rounded,
1368 and there may be a minimum required size. */
1370 if (args_size->var)
1372 args_size->var = ARGS_SIZE_TREE (*args_size);
1373 args_size->constant = 0;
1375 #ifdef PREFERRED_STACK_BOUNDARY
1376 preferred_stack_boundary /= BITS_PER_UNIT;
1377 if (preferred_stack_boundary > 1)
1379 /* We don't handle this case yet. To handle it correctly we have
1380 to add the delta, round and substract the delta.
1381 Currently no machine description requires this support. */
1382 if (stack_pointer_delta & (preferred_stack_boundary - 1))
1383 abort ();
1384 args_size->var = round_up (args_size->var, preferred_stack_boundary);
1386 #endif
1388 if (reg_parm_stack_space > 0)
1390 args_size->var
1391 = size_binop (MAX_EXPR, args_size->var,
1392 ssize_int (reg_parm_stack_space));
1394 #ifndef OUTGOING_REG_PARM_STACK_SPACE
1395 /* The area corresponding to register parameters is not to count in
1396 the size of the block we need. So make the adjustment. */
1397 args_size->var
1398 = size_binop (MINUS_EXPR, args_size->var,
1399 ssize_int (reg_parm_stack_space));
1400 #endif
1403 else
1405 #ifdef PREFERRED_STACK_BOUNDARY
1406 preferred_stack_boundary /= BITS_PER_UNIT;
1407 if (preferred_stack_boundary < 1)
1408 preferred_stack_boundary = 1;
1409 args_size->constant = (((args_size->constant
1410 + stack_pointer_delta
1411 + preferred_stack_boundary - 1)
1412 / preferred_stack_boundary
1413 * preferred_stack_boundary)
1414 - stack_pointer_delta);
1415 #endif
1417 args_size->constant = MAX (args_size->constant,
1418 reg_parm_stack_space);
1420 #ifdef MAYBE_REG_PARM_STACK_SPACE
1421 if (reg_parm_stack_space == 0)
1422 args_size->constant = 0;
1423 #endif
1425 #ifndef OUTGOING_REG_PARM_STACK_SPACE
1426 args_size->constant -= reg_parm_stack_space;
1427 #endif
1429 return unadjusted_args_size;
1432 /* Precompute parameters as needed for a function call.
1434 FLAGS is mask of ECF_* constants.
1436 NUM_ACTUALS is the number of arguments.
1438 ARGS is an array containing information for each argument; this
1439 routine fills in the INITIAL_VALUE and VALUE fields for each
1440 precomputed argument. */
1442 static void
1443 precompute_arguments (flags, num_actuals, args)
1444 int flags;
1445 int num_actuals;
1446 struct arg_data *args;
1448 int i;
1450 /* If this function call is cse'able, precompute all the parameters.
1451 Note that if the parameter is constructed into a temporary, this will
1452 cause an additional copy because the parameter will be constructed
1453 into a temporary location and then copied into the outgoing arguments.
1454 If a parameter contains a call to alloca and this function uses the
1455 stack, precompute the parameter. */
1457 /* If we preallocated the stack space, and some arguments must be passed
1458 on the stack, then we must precompute any parameter which contains a
1459 function call which will store arguments on the stack.
1460 Otherwise, evaluating the parameter may clobber previous parameters
1461 which have already been stored into the stack. (we have code to avoid
1462 such case by saving the ougoing stack arguments, but it results in
1463 worse code) */
1465 for (i = 0; i < num_actuals; i++)
1466 if ((flags & (ECF_CONST | ECF_PURE))
1467 || calls_function (args[i].tree_value, !ACCUMULATE_OUTGOING_ARGS))
1469 /* If this is an addressable type, we cannot pre-evaluate it. */
1470 if (TREE_ADDRESSABLE (TREE_TYPE (args[i].tree_value)))
1471 abort ();
1473 push_temp_slots ();
1475 args[i].value
1476 = expand_expr (args[i].tree_value, NULL_RTX, VOIDmode, 0);
1478 preserve_temp_slots (args[i].value);
1479 pop_temp_slots ();
1481 /* ANSI doesn't require a sequence point here,
1482 but PCC has one, so this will avoid some problems. */
1483 emit_queue ();
1485 args[i].initial_value = args[i].value
1486 = protect_from_queue (args[i].value, 0);
1488 if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) != args[i].mode)
1490 args[i].value
1491 = convert_modes (args[i].mode,
1492 TYPE_MODE (TREE_TYPE (args[i].tree_value)),
1493 args[i].value, args[i].unsignedp);
1494 #ifdef PROMOTE_FOR_CALL_ONLY
1495 /* CSE will replace this only if it contains args[i].value
1496 pseudo, so convert it down to the declared mode using
1497 a SUBREG. */
1498 if (GET_CODE (args[i].value) == REG
1499 && GET_MODE_CLASS (args[i].mode) == MODE_INT)
1501 args[i].initial_value
1502 = gen_rtx_SUBREG (TYPE_MODE (TREE_TYPE (args[i].tree_value)),
1503 args[i].value, 0);
1504 SUBREG_PROMOTED_VAR_P (args[i].initial_value) = 1;
1505 SUBREG_PROMOTED_UNSIGNED_P (args[i].initial_value)
1506 = args[i].unsignedp;
1508 #endif
1513 /* Given the current state of MUST_PREALLOCATE and information about
1514 arguments to a function call in NUM_ACTUALS, ARGS and ARGS_SIZE,
1515 compute and return the final value for MUST_PREALLOCATE. */
1517 static int
1518 finalize_must_preallocate (must_preallocate, num_actuals, args, args_size)
1519 int must_preallocate;
1520 int num_actuals;
1521 struct arg_data *args;
1522 struct args_size *args_size;
1524 /* See if we have or want to preallocate stack space.
1526 If we would have to push a partially-in-regs parm
1527 before other stack parms, preallocate stack space instead.
1529 If the size of some parm is not a multiple of the required stack
1530 alignment, we must preallocate.
1532 If the total size of arguments that would otherwise create a copy in
1533 a temporary (such as a CALL) is more than half the total argument list
1534 size, preallocation is faster.
1536 Another reason to preallocate is if we have a machine (like the m88k)
1537 where stack alignment is required to be maintained between every
1538 pair of insns, not just when the call is made. However, we assume here
1539 that such machines either do not have push insns (and hence preallocation
1540 would occur anyway) or the problem is taken care of with
1541 PUSH_ROUNDING. */
1543 if (! must_preallocate)
1545 int partial_seen = 0;
1546 int copy_to_evaluate_size = 0;
1547 int i;
1549 for (i = 0; i < num_actuals && ! must_preallocate; i++)
1551 if (args[i].partial > 0 && ! args[i].pass_on_stack)
1552 partial_seen = 1;
1553 else if (partial_seen && args[i].reg == 0)
1554 must_preallocate = 1;
1556 if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode
1557 && (TREE_CODE (args[i].tree_value) == CALL_EXPR
1558 || TREE_CODE (args[i].tree_value) == TARGET_EXPR
1559 || TREE_CODE (args[i].tree_value) == COND_EXPR
1560 || TREE_ADDRESSABLE (TREE_TYPE (args[i].tree_value))))
1561 copy_to_evaluate_size
1562 += int_size_in_bytes (TREE_TYPE (args[i].tree_value));
1565 if (copy_to_evaluate_size * 2 >= args_size->constant
1566 && args_size->constant > 0)
1567 must_preallocate = 1;
1569 return must_preallocate;
1572 /* If we preallocated stack space, compute the address of each argument
1573 and store it into the ARGS array.
1575 We need not ensure it is a valid memory address here; it will be
1576 validized when it is used.
1578 ARGBLOCK is an rtx for the address of the outgoing arguments. */
1580 static void
1581 compute_argument_addresses (args, argblock, num_actuals)
1582 struct arg_data *args;
1583 rtx argblock;
1584 int num_actuals;
1586 if (argblock)
1588 rtx arg_reg = argblock;
1589 int i, arg_offset = 0;
1591 if (GET_CODE (argblock) == PLUS)
1592 arg_reg = XEXP (argblock, 0), arg_offset = INTVAL (XEXP (argblock, 1));
1594 for (i = 0; i < num_actuals; i++)
1596 rtx offset = ARGS_SIZE_RTX (args[i].offset);
1597 rtx slot_offset = ARGS_SIZE_RTX (args[i].slot_offset);
1598 rtx addr;
1600 /* Skip this parm if it will not be passed on the stack. */
1601 if (! args[i].pass_on_stack && args[i].reg != 0)
1602 continue;
1604 if (GET_CODE (offset) == CONST_INT)
1605 addr = plus_constant (arg_reg, INTVAL (offset));
1606 else
1607 addr = gen_rtx_PLUS (Pmode, arg_reg, offset);
1609 addr = plus_constant (addr, arg_offset);
1610 args[i].stack = gen_rtx_MEM (args[i].mode, addr);
1611 set_mem_attributes (args[i].stack,
1612 TREE_TYPE (args[i].tree_value), 1);
1614 if (GET_CODE (slot_offset) == CONST_INT)
1615 addr = plus_constant (arg_reg, INTVAL (slot_offset));
1616 else
1617 addr = gen_rtx_PLUS (Pmode, arg_reg, slot_offset);
1619 addr = plus_constant (addr, arg_offset);
1620 args[i].stack_slot = gen_rtx_MEM (args[i].mode, addr);
1621 set_mem_attributes (args[i].stack_slot,
1622 TREE_TYPE (args[i].tree_value), 1);
1624 /* Function incoming arguments may overlap with sibling call
1625 outgoing arguments and we cannot allow reordering of reads
1626 from function arguments with stores to outgoing arguments
1627 of sibling calls. */
1628 MEM_ALIAS_SET (args[i].stack) = 0;
1629 MEM_ALIAS_SET (args[i].stack_slot) = 0;
1634 /* Given a FNDECL and EXP, return an rtx suitable for use as a target address
1635 in a call instruction.
1637 FNDECL is the tree node for the target function. For an indirect call
1638 FNDECL will be NULL_TREE.
1640 EXP is the CALL_EXPR for this call. */
1642 static rtx
1643 rtx_for_function_call (fndecl, exp)
1644 tree fndecl;
1645 tree exp;
1647 rtx funexp;
1649 /* Get the function to call, in the form of RTL. */
1650 if (fndecl)
1652 /* If this is the first use of the function, see if we need to
1653 make an external definition for it. */
1654 if (! TREE_USED (fndecl))
1656 assemble_external (fndecl);
1657 TREE_USED (fndecl) = 1;
1660 /* Get a SYMBOL_REF rtx for the function address. */
1661 funexp = XEXP (DECL_RTL (fndecl), 0);
1663 else
1664 /* Generate an rtx (probably a pseudo-register) for the address. */
1666 rtx funaddr;
1667 push_temp_slots ();
1668 funaddr = funexp =
1669 expand_expr (TREE_OPERAND (exp, 0), NULL_RTX, VOIDmode, 0);
1670 pop_temp_slots (); /* FUNEXP can't be BLKmode. */
1672 /* Check the function is executable. */
1673 if (current_function_check_memory_usage)
1675 #ifdef POINTERS_EXTEND_UNSIGNED
1676 /* It might be OK to convert funexp in place, but there's
1677 a lot going on between here and when it happens naturally
1678 that this seems safer. */
1679 funaddr = convert_memory_address (Pmode, funexp);
1680 #endif
1681 emit_library_call (chkr_check_exec_libfunc, LCT_CONST_MAKE_BLOCK,
1682 VOIDmode, 1, funaddr, Pmode);
1684 emit_queue ();
1686 return funexp;
1689 /* Do the register loads required for any wholly-register parms or any
1690 parms which are passed both on the stack and in a register. Their
1691 expressions were already evaluated.
1693 Mark all register-parms as living through the call, putting these USE
1694 insns in the CALL_INSN_FUNCTION_USAGE field. */
1696 static void
1697 load_register_parameters (args, num_actuals, call_fusage, flags)
1698 struct arg_data *args;
1699 int num_actuals;
1700 rtx *call_fusage;
1701 int flags;
1703 int i, j;
1705 #ifdef LOAD_ARGS_REVERSED
1706 for (i = num_actuals - 1; i >= 0; i--)
1707 #else
1708 for (i = 0; i < num_actuals; i++)
1709 #endif
1711 rtx reg = ((flags & ECF_SIBCALL)
1712 ? args[i].tail_call_reg : args[i].reg);
1713 int partial = args[i].partial;
1714 int nregs;
1716 if (reg)
1718 /* Set to non-negative if must move a word at a time, even if just
1719 one word (e.g, partial == 1 && mode == DFmode). Set to -1 if
1720 we just use a normal move insn. This value can be zero if the
1721 argument is a zero size structure with no fields. */
1722 nregs = (partial ? partial
1723 : (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode
1724 ? ((int_size_in_bytes (TREE_TYPE (args[i].tree_value))
1725 + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD)
1726 : -1));
1728 /* Handle calls that pass values in multiple non-contiguous
1729 locations. The Irix 6 ABI has examples of this. */
1731 if (GET_CODE (reg) == PARALLEL)
1732 emit_group_load (reg, args[i].value,
1733 int_size_in_bytes (TREE_TYPE (args[i].tree_value)),
1734 TYPE_ALIGN (TREE_TYPE (args[i].tree_value)));
1736 /* If simple case, just do move. If normal partial, store_one_arg
1737 has already loaded the register for us. In all other cases,
1738 load the register(s) from memory. */
1740 else if (nregs == -1)
1741 emit_move_insn (reg, args[i].value);
1743 /* If we have pre-computed the values to put in the registers in
1744 the case of non-aligned structures, copy them in now. */
1746 else if (args[i].n_aligned_regs != 0)
1747 for (j = 0; j < args[i].n_aligned_regs; j++)
1748 emit_move_insn (gen_rtx_REG (word_mode, REGNO (reg) + j),
1749 args[i].aligned_regs[j]);
1751 else if (partial == 0 || args[i].pass_on_stack)
1752 move_block_to_reg (REGNO (reg),
1753 validize_mem (args[i].value), nregs,
1754 args[i].mode);
1756 /* Handle calls that pass values in multiple non-contiguous
1757 locations. The Irix 6 ABI has examples of this. */
1758 if (GET_CODE (reg) == PARALLEL)
1759 use_group_regs (call_fusage, reg);
1760 else if (nregs == -1)
1761 use_reg (call_fusage, reg);
1762 else
1763 use_regs (call_fusage, REGNO (reg), nregs == 0 ? 1 : nregs);
1768 /* Try to integrate function. See expand_inline_function for documentation
1769 about the parameters. */
1771 static rtx
1772 try_to_integrate (fndecl, actparms, target, ignore, type, structure_value_addr)
1773 tree fndecl;
1774 tree actparms;
1775 rtx target;
1776 int ignore;
1777 tree type;
1778 rtx structure_value_addr;
1780 rtx temp;
1781 rtx before_call;
1782 int i;
1783 rtx old_stack_level = 0;
1784 int reg_parm_stack_space = 0;
1786 #ifdef REG_PARM_STACK_SPACE
1787 #ifdef MAYBE_REG_PARM_STACK_SPACE
1788 reg_parm_stack_space = MAYBE_REG_PARM_STACK_SPACE;
1789 #else
1790 reg_parm_stack_space = REG_PARM_STACK_SPACE (fndecl);
1791 #endif
1792 #endif
1794 before_call = get_last_insn ();
1796 timevar_push (TV_INTEGRATION);
1798 temp = expand_inline_function (fndecl, actparms, target,
1799 ignore, type,
1800 structure_value_addr);
1802 timevar_pop (TV_INTEGRATION);
1804 /* If inlining succeeded, return. */
1805 if (temp != (rtx) (HOST_WIDE_INT) - 1)
1807 if (ACCUMULATE_OUTGOING_ARGS)
1809 /* If the outgoing argument list must be preserved, push
1810 the stack before executing the inlined function if it
1811 makes any calls. */
1813 for (i = reg_parm_stack_space - 1; i >= 0; i--)
1814 if (i < highest_outgoing_arg_in_use && stack_usage_map[i] != 0)
1815 break;
1817 if (stack_arg_under_construction || i >= 0)
1819 rtx first_insn
1820 = before_call ? NEXT_INSN (before_call) : get_insns ();
1821 rtx insn = NULL_RTX, seq;
1823 /* Look for a call in the inline function code.
1824 If DECL_SAVED_INSNS (fndecl)->outgoing_args_size is
1825 nonzero then there is a call and it is not necessary
1826 to scan the insns. */
1828 if (DECL_SAVED_INSNS (fndecl)->outgoing_args_size == 0)
1829 for (insn = first_insn; insn; insn = NEXT_INSN (insn))
1830 if (GET_CODE (insn) == CALL_INSN)
1831 break;
1833 if (insn)
1835 /* Reserve enough stack space so that the largest
1836 argument list of any function call in the inline
1837 function does not overlap the argument list being
1838 evaluated. This is usually an overestimate because
1839 allocate_dynamic_stack_space reserves space for an
1840 outgoing argument list in addition to the requested
1841 space, but there is no way to ask for stack space such
1842 that an argument list of a certain length can be
1843 safely constructed.
1845 Add the stack space reserved for register arguments, if
1846 any, in the inline function. What is really needed is the
1847 largest value of reg_parm_stack_space in the inline
1848 function, but that is not available. Using the current
1849 value of reg_parm_stack_space is wrong, but gives
1850 correct results on all supported machines. */
1852 int adjust = (DECL_SAVED_INSNS (fndecl)->outgoing_args_size
1853 + reg_parm_stack_space);
1855 start_sequence ();
1856 emit_stack_save (SAVE_BLOCK, &old_stack_level, NULL_RTX);
1857 allocate_dynamic_stack_space (GEN_INT (adjust),
1858 NULL_RTX, BITS_PER_UNIT);
1859 seq = get_insns ();
1860 end_sequence ();
1861 emit_insns_before (seq, first_insn);
1862 emit_stack_restore (SAVE_BLOCK, old_stack_level, NULL_RTX);
1867 /* If the result is equivalent to TARGET, return TARGET to simplify
1868 checks in store_expr. They can be equivalent but not equal in the
1869 case of a function that returns BLKmode. */
1870 if (temp != target && rtx_equal_p (temp, target))
1871 return target;
1872 return temp;
1875 /* If inlining failed, mark FNDECL as needing to be compiled
1876 separately after all. If function was declared inline,
1877 give a warning. */
1878 if (DECL_INLINE (fndecl) && warn_inline && !flag_no_inline
1879 && optimize > 0 && !TREE_ADDRESSABLE (fndecl))
1881 warning_with_decl (fndecl, "inlining failed in call to `%s'");
1882 warning ("called from here");
1884 mark_addressable (fndecl);
1885 return (rtx) (HOST_WIDE_INT) - 1;
1888 /* We need to pop PENDING_STACK_ADJUST bytes. But, if the arguments
1889 wouldn't fill up an even multiple of PREFERRED_UNIT_STACK_BOUNDARY
1890 bytes, then we would need to push some additional bytes to pad the
1891 arguments. So, we compute an adjust to the stack pointer for an
1892 amount that will leave the stack under-aligned by UNADJUSTED_ARGS_SIZE
1893 bytes. Then, when the arguments are pushed the stack will be perfectly
1894 aligned. ARGS_SIZE->CONSTANT is set to the number of bytes that should
1895 be popped after the call. Returns the adjustment. */
1897 static int
1898 combine_pending_stack_adjustment_and_call (unadjusted_args_size,
1899 args_size,
1900 preferred_unit_stack_boundary)
1901 int unadjusted_args_size;
1902 struct args_size *args_size;
1903 int preferred_unit_stack_boundary;
1905 /* The number of bytes to pop so that the stack will be
1906 under-aligned by UNADJUSTED_ARGS_SIZE bytes. */
1907 HOST_WIDE_INT adjustment;
1908 /* The alignment of the stack after the arguments are pushed, if we
1909 just pushed the arguments without adjust the stack here. */
1910 HOST_WIDE_INT unadjusted_alignment;
1912 unadjusted_alignment
1913 = ((stack_pointer_delta + unadjusted_args_size)
1914 % preferred_unit_stack_boundary);
1916 /* We want to get rid of as many of the PENDING_STACK_ADJUST bytes
1917 as possible -- leaving just enough left to cancel out the
1918 UNADJUSTED_ALIGNMENT. In other words, we want to ensure that the
1919 PENDING_STACK_ADJUST is non-negative, and congruent to
1920 -UNADJUSTED_ALIGNMENT modulo the PREFERRED_UNIT_STACK_BOUNDARY. */
1922 /* Begin by trying to pop all the bytes. */
1923 unadjusted_alignment
1924 = (unadjusted_alignment
1925 - (pending_stack_adjust % preferred_unit_stack_boundary));
1926 adjustment = pending_stack_adjust;
1927 /* Push enough additional bytes that the stack will be aligned
1928 after the arguments are pushed. */
1929 if (preferred_unit_stack_boundary > 1)
1931 if (unadjusted_alignment > 0)
1932 adjustment -= preferred_unit_stack_boundary - unadjusted_alignment;
1933 else
1934 adjustment += unadjusted_alignment;
1937 /* Now, sets ARGS_SIZE->CONSTANT so that we pop the right number of
1938 bytes after the call. The right number is the entire
1939 PENDING_STACK_ADJUST less our ADJUSTMENT plus the amount required
1940 by the arguments in the first place. */
1941 args_size->constant
1942 = pending_stack_adjust - adjustment + unadjusted_args_size;
1944 return adjustment;
1947 /* Scan X expression if it does not dereference any argument slots
1948 we already clobbered by tail call arguments (as noted in stored_args_map
1949 bitmap).
1950 Return non-zero if X expression dereferences such argument slots,
1951 zero otherwise. */
1953 static int
1954 check_sibcall_argument_overlap_1 (x)
1955 rtx x;
1957 RTX_CODE code;
1958 int i, j;
1959 unsigned int k;
1960 const char *fmt;
1962 if (x == NULL_RTX)
1963 return 0;
1965 code = GET_CODE (x);
1967 if (code == MEM)
1969 if (XEXP (x, 0) == current_function_internal_arg_pointer)
1970 i = 0;
1971 else if (GET_CODE (XEXP (x, 0)) == PLUS
1972 && XEXP (XEXP (x, 0), 0) ==
1973 current_function_internal_arg_pointer
1974 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)
1975 i = INTVAL (XEXP (XEXP (x, 0), 1));
1976 else
1977 return 0;
1979 #ifdef ARGS_GROW_DOWNWARD
1980 i = -i - GET_MODE_SIZE (GET_MODE (x));
1981 #endif
1983 for (k = 0; k < GET_MODE_SIZE (GET_MODE (x)); k++)
1984 if (i + k < stored_args_map->n_bits
1985 && TEST_BIT (stored_args_map, i + k))
1986 return 1;
1988 return 0;
1991 /* Scan all subexpressions. */
1992 fmt = GET_RTX_FORMAT (code);
1993 for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
1995 if (*fmt == 'e')
1997 if (check_sibcall_argument_overlap_1 (XEXP (x, i)))
1998 return 1;
2000 else if (*fmt == 'E')
2002 for (j = 0; j < XVECLEN (x, i); j++)
2003 if (check_sibcall_argument_overlap_1 (XVECEXP (x, i, j)))
2004 return 1;
2007 return 0;
2010 /* Scan sequence after INSN if it does not dereference any argument slots
2011 we already clobbered by tail call arguments (as noted in stored_args_map
2012 bitmap). Add stack slots for ARG to stored_args_map bitmap afterwards.
2013 Return non-zero if sequence after INSN dereferences such argument slots,
2014 zero otherwise. */
2016 static int
2017 check_sibcall_argument_overlap (insn, arg)
2018 rtx insn;
2019 struct arg_data *arg;
2021 int low, high;
2023 if (insn == NULL_RTX)
2024 insn = get_insns ();
2025 else
2026 insn = NEXT_INSN (insn);
2028 for (; insn; insn = NEXT_INSN (insn))
2029 if (INSN_P (insn)
2030 && check_sibcall_argument_overlap_1 (PATTERN (insn)))
2031 break;
2033 #ifdef ARGS_GROW_DOWNWARD
2034 low = -arg->offset.constant - arg->size.constant;
2035 #else
2036 low = arg->offset.constant;
2037 #endif
2039 for (high = low + arg->size.constant; low < high; low++)
2040 SET_BIT (stored_args_map, low);
2041 return insn != NULL_RTX;
2044 /* Generate all the code for a function call
2045 and return an rtx for its value.
2046 Store the value in TARGET (specified as an rtx) if convenient.
2047 If the value is stored in TARGET then TARGET is returned.
2048 If IGNORE is nonzero, then we ignore the value of the function call. */
2051 expand_call (exp, target, ignore)
2052 tree exp;
2053 rtx target;
2054 int ignore;
2056 /* Nonzero if we are currently expanding a call. */
2057 static int currently_expanding_call = 0;
2059 /* List of actual parameters. */
2060 tree actparms = TREE_OPERAND (exp, 1);
2061 /* RTX for the function to be called. */
2062 rtx funexp;
2063 /* Sequence of insns to perform a tail recursive "call". */
2064 rtx tail_recursion_insns = NULL_RTX;
2065 /* Sequence of insns to perform a normal "call". */
2066 rtx normal_call_insns = NULL_RTX;
2067 /* Sequence of insns to perform a tail recursive "call". */
2068 rtx tail_call_insns = NULL_RTX;
2069 /* Data type of the function. */
2070 tree funtype;
2071 /* Declaration of the function being called,
2072 or 0 if the function is computed (not known by name). */
2073 tree fndecl = 0;
2074 rtx insn;
2075 int try_tail_call = 1;
2076 int try_tail_recursion = 1;
2077 int pass;
2079 /* Register in which non-BLKmode value will be returned,
2080 or 0 if no value or if value is BLKmode. */
2081 rtx valreg;
2082 /* Address where we should return a BLKmode value;
2083 0 if value not BLKmode. */
2084 rtx structure_value_addr = 0;
2085 /* Nonzero if that address is being passed by treating it as
2086 an extra, implicit first parameter. Otherwise,
2087 it is passed by being copied directly into struct_value_rtx. */
2088 int structure_value_addr_parm = 0;
2089 /* Size of aggregate value wanted, or zero if none wanted
2090 or if we are using the non-reentrant PCC calling convention
2091 or expecting the value in registers. */
2092 HOST_WIDE_INT struct_value_size = 0;
2093 /* Nonzero if called function returns an aggregate in memory PCC style,
2094 by returning the address of where to find it. */
2095 int pcc_struct_value = 0;
2097 /* Number of actual parameters in this call, including struct value addr. */
2098 int num_actuals;
2099 /* Number of named args. Args after this are anonymous ones
2100 and they must all go on the stack. */
2101 int n_named_args;
2103 /* Vector of information about each argument.
2104 Arguments are numbered in the order they will be pushed,
2105 not the order they are written. */
2106 struct arg_data *args;
2108 /* Total size in bytes of all the stack-parms scanned so far. */
2109 struct args_size args_size;
2110 struct args_size adjusted_args_size;
2111 /* Size of arguments before any adjustments (such as rounding). */
2112 int unadjusted_args_size;
2113 /* Data on reg parms scanned so far. */
2114 CUMULATIVE_ARGS args_so_far;
2115 /* Nonzero if a reg parm has been scanned. */
2116 int reg_parm_seen;
2117 /* Nonzero if this is an indirect function call. */
2119 /* Nonzero if we must avoid push-insns in the args for this call.
2120 If stack space is allocated for register parameters, but not by the
2121 caller, then it is preallocated in the fixed part of the stack frame.
2122 So the entire argument block must then be preallocated (i.e., we
2123 ignore PUSH_ROUNDING in that case). */
2125 int must_preallocate = !PUSH_ARGS;
2127 /* Size of the stack reserved for parameter registers. */
2128 int reg_parm_stack_space = 0;
2130 /* Address of space preallocated for stack parms
2131 (on machines that lack push insns), or 0 if space not preallocated. */
2132 rtx argblock = 0;
2134 /* Mask of ECF_ flags. */
2135 int flags = 0;
2136 /* Nonzero if this is a call to an inline function. */
2137 int is_integrable = 0;
2138 #ifdef REG_PARM_STACK_SPACE
2139 /* Define the boundary of the register parm stack space that needs to be
2140 save, if any. */
2141 int low_to_save = -1, high_to_save;
2142 rtx save_area = 0; /* Place that it is saved */
2143 #endif
2145 int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
2146 char *initial_stack_usage_map = stack_usage_map;
2147 int old_stack_arg_under_construction = 0;
2149 rtx old_stack_level = 0;
2150 int old_pending_adj = 0;
2151 int old_inhibit_defer_pop = inhibit_defer_pop;
2152 int old_stack_allocated;
2153 rtx call_fusage;
2154 register tree p = TREE_OPERAND (exp, 0);
2155 register int i;
2156 /* The alignment of the stack, in bits. */
2157 HOST_WIDE_INT preferred_stack_boundary;
2158 /* The alignment of the stack, in bytes. */
2159 HOST_WIDE_INT preferred_unit_stack_boundary;
2161 /* The value of the function call can be put in a hard register. But
2162 if -fcheck-memory-usage, code which invokes functions (and thus
2163 damages some hard registers) can be inserted before using the value.
2164 So, target is always a pseudo-register in that case. */
2165 if (current_function_check_memory_usage)
2166 target = 0;
2168 /* See if this is "nothrow" function call. */
2169 if (TREE_NOTHROW (exp))
2170 flags |= ECF_NOTHROW;
2172 /* See if we can find a DECL-node for the actual function.
2173 As a result, decide whether this is a call to an integrable function. */
2175 fndecl = get_callee_fndecl (exp);
2176 if (fndecl)
2178 if (!flag_no_inline
2179 && fndecl != current_function_decl
2180 && DECL_INLINE (fndecl)
2181 && DECL_SAVED_INSNS (fndecl)
2182 && DECL_SAVED_INSNS (fndecl)->inlinable)
2183 is_integrable = 1;
2184 else if (! TREE_ADDRESSABLE (fndecl))
2186 /* In case this function later becomes inlinable,
2187 record that there was already a non-inline call to it.
2189 Use abstraction instead of setting TREE_ADDRESSABLE
2190 directly. */
2191 if (DECL_INLINE (fndecl) && warn_inline && !flag_no_inline
2192 && optimize > 0)
2194 warning_with_decl (fndecl, "can't inline call to `%s'");
2195 warning ("called from here");
2197 mark_addressable (fndecl);
2200 flags |= flags_from_decl_or_type (fndecl);
2203 /* If we don't have specific function to call, see if we have a
2204 attributes set in the type. */
2205 else
2206 flags |= flags_from_decl_or_type (TREE_TYPE (TREE_TYPE (p)));
2208 /* Mark if the function returns with the stack pointer depressed. */
2209 if (TREE_CODE (TREE_TYPE (TREE_TYPE (p))) == FUNCTION_TYPE
2210 && TYPE_RETURNS_STACK_DEPRESSED (TREE_TYPE (TREE_TYPE (p))))
2212 flags |= ECF_SP_DEPRESSED;
2213 flags &= ~(ECF_PURE | ECF_CONST);
2216 #ifdef REG_PARM_STACK_SPACE
2217 #ifdef MAYBE_REG_PARM_STACK_SPACE
2218 reg_parm_stack_space = MAYBE_REG_PARM_STACK_SPACE;
2219 #else
2220 reg_parm_stack_space = REG_PARM_STACK_SPACE (fndecl);
2221 #endif
2222 #endif
2224 #ifndef OUTGOING_REG_PARM_STACK_SPACE
2225 if (reg_parm_stack_space > 0 && PUSH_ARGS)
2226 must_preallocate = 1;
2227 #endif
2229 /* Warn if this value is an aggregate type,
2230 regardless of which calling convention we are using for it. */
2231 if (warn_aggregate_return && AGGREGATE_TYPE_P (TREE_TYPE (exp)))
2232 warning ("function call has aggregate value");
2234 /* Set up a place to return a structure. */
2236 /* Cater to broken compilers. */
2237 if (aggregate_value_p (exp))
2239 /* This call returns a big structure. */
2240 flags &= ~(ECF_CONST | ECF_PURE);
2242 #ifdef PCC_STATIC_STRUCT_RETURN
2244 pcc_struct_value = 1;
2245 /* Easier than making that case work right. */
2246 if (is_integrable)
2248 /* In case this is a static function, note that it has been
2249 used. */
2250 if (! TREE_ADDRESSABLE (fndecl))
2251 mark_addressable (fndecl);
2252 is_integrable = 0;
2255 #else /* not PCC_STATIC_STRUCT_RETURN */
2257 struct_value_size = int_size_in_bytes (TREE_TYPE (exp));
2259 if (target && GET_CODE (target) == MEM)
2260 structure_value_addr = XEXP (target, 0);
2261 else
2263 rtx d;
2265 /* For variable-sized objects, we must be called with a target
2266 specified. If we were to allocate space on the stack here,
2267 we would have no way of knowing when to free it. */
2269 if (struct_value_size < 0)
2270 abort ();
2272 d = assign_temp (TREE_TYPE (exp), 1, 1, 1);
2273 mark_temp_addr_taken (d);
2274 structure_value_addr = XEXP (d, 0);
2275 target = 0;
2278 #endif /* not PCC_STATIC_STRUCT_RETURN */
2281 /* If called function is inline, try to integrate it. */
2283 if (is_integrable)
2285 rtx temp = try_to_integrate (fndecl, actparms, target,
2286 ignore, TREE_TYPE (exp),
2287 structure_value_addr);
2288 if (temp != (rtx) (HOST_WIDE_INT) - 1)
2289 return temp;
2292 /* Figure out the amount to which the stack should be aligned. */
2293 #ifdef PREFERRED_STACK_BOUNDARY
2294 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
2295 #else
2296 preferred_stack_boundary = STACK_BOUNDARY;
2297 #endif
2299 /* Operand 0 is a pointer-to-function; get the type of the function. */
2300 funtype = TREE_TYPE (TREE_OPERAND (exp, 0));
2301 if (! POINTER_TYPE_P (funtype))
2302 abort ();
2303 funtype = TREE_TYPE (funtype);
2305 /* See if this is a call to a function that can return more than once
2306 or a call to longjmp or malloc. */
2307 flags |= special_function_p (fndecl, flags);
2309 if (flags & ECF_MAY_BE_ALLOCA)
2310 current_function_calls_alloca = 1;
2312 /* If struct_value_rtx is 0, it means pass the address
2313 as if it were an extra parameter. */
2314 if (structure_value_addr && struct_value_rtx == 0)
2316 /* If structure_value_addr is a REG other than
2317 virtual_outgoing_args_rtx, we can use always use it. If it
2318 is not a REG, we must always copy it into a register.
2319 If it is virtual_outgoing_args_rtx, we must copy it to another
2320 register in some cases. */
2321 rtx temp = (GET_CODE (structure_value_addr) != REG
2322 || (ACCUMULATE_OUTGOING_ARGS
2323 && stack_arg_under_construction
2324 && structure_value_addr == virtual_outgoing_args_rtx)
2325 ? copy_addr_to_reg (structure_value_addr)
2326 : structure_value_addr);
2328 actparms
2329 = tree_cons (error_mark_node,
2330 make_tree (build_pointer_type (TREE_TYPE (funtype)),
2331 temp),
2332 actparms);
2333 structure_value_addr_parm = 1;
2336 /* Count the arguments and set NUM_ACTUALS. */
2337 for (p = actparms, num_actuals = 0; p; p = TREE_CHAIN (p))
2338 num_actuals++;
2340 /* Compute number of named args.
2341 Normally, don't include the last named arg if anonymous args follow.
2342 We do include the last named arg if STRICT_ARGUMENT_NAMING is nonzero.
2343 (If no anonymous args follow, the result of list_length is actually
2344 one too large. This is harmless.)
2346 If PRETEND_OUTGOING_VARARGS_NAMED is set and STRICT_ARGUMENT_NAMING is
2347 zero, this machine will be able to place unnamed args that were
2348 passed in registers into the stack. So treat all args as named.
2349 This allows the insns emitting for a specific argument list to be
2350 independent of the function declaration.
2352 If PRETEND_OUTGOING_VARARGS_NAMED is not set, we do not have any
2353 reliable way to pass unnamed args in registers, so we must force
2354 them into memory. */
2356 if ((STRICT_ARGUMENT_NAMING
2357 || ! PRETEND_OUTGOING_VARARGS_NAMED)
2358 && TYPE_ARG_TYPES (funtype) != 0)
2359 n_named_args
2360 = (list_length (TYPE_ARG_TYPES (funtype))
2361 /* Don't include the last named arg. */
2362 - (STRICT_ARGUMENT_NAMING ? 0 : 1)
2363 /* Count the struct value address, if it is passed as a parm. */
2364 + structure_value_addr_parm);
2365 else
2366 /* If we know nothing, treat all args as named. */
2367 n_named_args = num_actuals;
2369 /* Start updating where the next arg would go.
2371 On some machines (such as the PA) indirect calls have a different
2372 calling convention than normal calls. The last argument in
2373 INIT_CUMULATIVE_ARGS tells the backend if this is an indirect call
2374 or not. */
2375 INIT_CUMULATIVE_ARGS (args_so_far, funtype, NULL_RTX, (fndecl == 0));
2377 /* Make a vector to hold all the information about each arg. */
2378 args = (struct arg_data *) alloca (num_actuals * sizeof (struct arg_data));
2379 memset ((char *) args, 0, num_actuals * sizeof (struct arg_data));
2381 /* Build up entries inthe ARGS array, compute the size of the arguments
2382 into ARGS_SIZE, etc. */
2383 initialize_argument_information (num_actuals, args, &args_size,
2384 n_named_args, actparms, fndecl,
2385 &args_so_far, reg_parm_stack_space,
2386 &old_stack_level, &old_pending_adj,
2387 &must_preallocate, &flags);
2389 if (args_size.var)
2391 /* If this function requires a variable-sized argument list, don't
2392 try to make a cse'able block for this call. We may be able to
2393 do this eventually, but it is too complicated to keep track of
2394 what insns go in the cse'able block and which don't. */
2396 flags &= ~(ECF_CONST | ECF_PURE);
2397 must_preallocate = 1;
2400 /* Now make final decision about preallocating stack space. */
2401 must_preallocate = finalize_must_preallocate (must_preallocate,
2402 num_actuals, args,
2403 &args_size);
2405 /* If the structure value address will reference the stack pointer, we
2406 must stabilize it. We don't need to do this if we know that we are
2407 not going to adjust the stack pointer in processing this call. */
2409 if (structure_value_addr
2410 && (reg_mentioned_p (virtual_stack_dynamic_rtx, structure_value_addr)
2411 || reg_mentioned_p (virtual_outgoing_args_rtx,
2412 structure_value_addr))
2413 && (args_size.var
2414 || (!ACCUMULATE_OUTGOING_ARGS && args_size.constant)))
2415 structure_value_addr = copy_to_reg (structure_value_addr);
2417 /* Tail calls can make things harder to debug, and we're traditionally
2418 pushed these optimizations into -O2. Don't try if we're already
2419 expanding a call, as that means we're an argument. Don't try if
2420 there's cleanups, as we know there's code to follow the call.
2422 If rtx_equal_function_value_matters is false, that means we've
2423 finished with regular parsing. Which means that some of the
2424 machinery we use to generate tail-calls is no longer in place.
2425 This is most often true of sjlj-exceptions, which we couldn't
2426 tail-call to anyway. */
2428 if (currently_expanding_call++ != 0
2429 || !flag_optimize_sibling_calls
2430 || !rtx_equal_function_value_matters
2431 || any_pending_cleanups (1)
2432 || args_size.var)
2433 try_tail_call = try_tail_recursion = 0;
2435 /* Tail recursion fails, when we are not dealing with recursive calls. */
2436 if (!try_tail_recursion
2437 || TREE_CODE (TREE_OPERAND (exp, 0)) != ADDR_EXPR
2438 || TREE_OPERAND (TREE_OPERAND (exp, 0), 0) != current_function_decl)
2439 try_tail_recursion = 0;
2441 /* Rest of purposes for tail call optimizations to fail. */
2442 if (
2443 #ifdef HAVE_sibcall_epilogue
2444 !HAVE_sibcall_epilogue
2445 #else
2447 #endif
2448 || !try_tail_call
2449 /* Doing sibling call optimization needs some work, since
2450 structure_value_addr can be allocated on the stack.
2451 It does not seem worth the effort since few optimizable
2452 sibling calls will return a structure. */
2453 || structure_value_addr != NULL_RTX
2454 /* If the register holding the address is a callee saved
2455 register, then we lose. We have no way to prevent that,
2456 so we only allow calls to named functions. */
2457 /* ??? This could be done by having the insn constraints
2458 use a register class that is all call-clobbered. Any
2459 reload insns generated to fix things up would appear
2460 before the sibcall_epilogue. */
2461 || fndecl == NULL_TREE
2462 || (flags & (ECF_RETURNS_TWICE | ECF_LONGJMP))
2463 || TREE_THIS_VOLATILE (fndecl)
2464 || !FUNCTION_OK_FOR_SIBCALL (fndecl)
2465 /* If this function requires more stack slots than the current
2466 function, we cannot change it into a sibling call. */
2467 || args_size.constant > current_function_args_size
2468 /* If the callee pops its own arguments, then it must pop exactly
2469 the same number of arguments as the current function. */
2470 || RETURN_POPS_ARGS (fndecl, funtype, args_size.constant)
2471 != RETURN_POPS_ARGS (current_function_decl,
2472 TREE_TYPE (current_function_decl),
2473 current_function_args_size))
2474 try_tail_call = 0;
2476 if (try_tail_call || try_tail_recursion)
2478 int end, inc;
2479 actparms = NULL_TREE;
2480 /* Ok, we're going to give the tail call the old college try.
2481 This means we're going to evaluate the function arguments
2482 up to three times. There are two degrees of badness we can
2483 encounter, those that can be unsaved and those that can't.
2484 (See unsafe_for_reeval commentary for details.)
2486 Generate a new argument list. Pass safe arguments through
2487 unchanged. For the easy badness wrap them in UNSAVE_EXPRs.
2488 For hard badness, evaluate them now and put their resulting
2489 rtx in a temporary VAR_DECL.
2491 initialize_argument_information has ordered the array for the
2492 order to be pushed, and we must remember this when reconstructing
2493 the original argument orde. */
2495 if (PUSH_ARGS_REVERSED)
2497 inc = 1;
2498 i = 0;
2499 end = num_actuals;
2501 else
2503 inc = -1;
2504 i = num_actuals - 1;
2505 end = -1;
2508 for (; i != end; i += inc)
2510 switch (unsafe_for_reeval (args[i].tree_value))
2512 case 0: /* Safe. */
2513 break;
2515 case 1: /* Mildly unsafe. */
2516 args[i].tree_value = unsave_expr (args[i].tree_value);
2517 break;
2519 case 2: /* Wildly unsafe. */
2521 tree var = build_decl (VAR_DECL, NULL_TREE,
2522 TREE_TYPE (args[i].tree_value));
2523 DECL_RTL (var) = expand_expr (args[i].tree_value, NULL_RTX,
2524 VOIDmode, EXPAND_NORMAL);
2525 args[i].tree_value = var;
2527 break;
2529 default:
2530 abort ();
2532 /* We need to build actparms for optimize_tail_recursion. We can
2533 safely trash away TREE_PURPOSE, since it is unused by this
2534 function. */
2535 if (try_tail_recursion)
2536 actparms = tree_cons (NULL_TREE, args[i].tree_value, actparms);
2538 /* Expanding one of those dangerous arguments could have added
2539 cleanups, but otherwise give it a whirl. */
2540 if (any_pending_cleanups (1))
2541 try_tail_call = try_tail_recursion = 0;
2544 /* Generate a tail recursion sequence when calling ourselves. */
2546 if (try_tail_recursion)
2548 /* We want to emit any pending stack adjustments before the tail
2549 recursion "call". That way we know any adjustment after the tail
2550 recursion call can be ignored if we indeed use the tail recursion
2551 call expansion. */
2552 int save_pending_stack_adjust = pending_stack_adjust;
2553 int save_stack_pointer_delta = stack_pointer_delta;
2555 /* Emit any queued insns now; otherwise they would end up in
2556 only one of the alternates. */
2557 emit_queue ();
2559 /* Use a new sequence to hold any RTL we generate. We do not even
2560 know if we will use this RTL yet. The final decision can not be
2561 made until after RTL generation for the entire function is
2562 complete. */
2563 start_sequence ();
2564 /* If expanding any of the arguments creates cleanups, we can't
2565 do a tailcall. So, we'll need to pop the pending cleanups
2566 list. If, however, all goes well, and there are no cleanups
2567 then the call to expand_start_target_temps will have no
2568 effect. */
2569 expand_start_target_temps ();
2570 if (optimize_tail_recursion (actparms, get_last_insn ()))
2572 if (any_pending_cleanups (1))
2573 try_tail_call = try_tail_recursion = 0;
2574 else
2575 tail_recursion_insns = get_insns ();
2577 expand_end_target_temps ();
2578 end_sequence ();
2580 /* Restore the original pending stack adjustment for the sibling and
2581 normal call cases below. */
2582 pending_stack_adjust = save_pending_stack_adjust;
2583 stack_pointer_delta = save_stack_pointer_delta;
2586 if (profile_arc_flag && (flags & ECF_FORK_OR_EXEC))
2588 /* A fork duplicates the profile information, and an exec discards
2589 it. We can't rely on fork/exec to be paired. So write out the
2590 profile information we have gathered so far, and clear it. */
2591 /* ??? When Linux's __clone is called with CLONE_VM set, profiling
2592 is subject to race conditions, just as with multithreaded
2593 programs. */
2595 emit_library_call (gen_rtx_SYMBOL_REF (Pmode, "__bb_fork_func"), 0,
2596 VOIDmode, 0);
2599 /* Ensure current function's preferred stack boundary is at least
2600 what we need. We don't have to increase alignment for recursive
2601 functions. */
2602 if (cfun->preferred_stack_boundary < preferred_stack_boundary
2603 && fndecl != current_function_decl)
2604 cfun->preferred_stack_boundary = preferred_stack_boundary;
2606 preferred_unit_stack_boundary = preferred_stack_boundary / BITS_PER_UNIT;
2608 function_call_count++;
2610 /* We want to make two insn chains; one for a sibling call, the other
2611 for a normal call. We will select one of the two chains after
2612 initial RTL generation is complete. */
2613 for (pass = 0; pass < 2; pass++)
2615 int sibcall_failure = 0;
2616 /* We want to emit ay pending stack adjustments before the tail
2617 recursion "call". That way we know any adjustment after the tail
2618 recursion call can be ignored if we indeed use the tail recursion
2619 call expansion. */
2620 int save_pending_stack_adjust = 0;
2621 int save_stack_pointer_delta = 0;
2622 rtx insns;
2623 rtx before_call, next_arg_reg;
2625 if (pass == 0)
2627 if (! try_tail_call)
2628 continue;
2630 /* Emit any queued insns now; otherwise they would end up in
2631 only one of the alternates. */
2632 emit_queue ();
2634 /* State variables we need to save and restore between
2635 iterations. */
2636 save_pending_stack_adjust = pending_stack_adjust;
2637 save_stack_pointer_delta = stack_pointer_delta;
2639 if (pass)
2640 flags &= ~ECF_SIBCALL;
2641 else
2642 flags |= ECF_SIBCALL;
2644 /* Other state variables that we must reinitialize each time
2645 through the loop (that are not initialized by the loop itself). */
2646 argblock = 0;
2647 call_fusage = 0;
2649 /* Start a new sequence for the normal call case.
2651 From this point on, if the sibling call fails, we want to set
2652 sibcall_failure instead of continuing the loop. */
2653 start_sequence ();
2655 if (pass == 0)
2657 /* We know at this point that there are not currently any
2658 pending cleanups. If, however, in the process of evaluating
2659 the arguments we were to create some, we'll need to be
2660 able to get rid of them. */
2661 expand_start_target_temps ();
2664 /* Don't let pending stack adjusts add up to too much.
2665 Also, do all pending adjustments now if there is any chance
2666 this might be a call to alloca or if we are expanding a sibling
2667 call sequence. */
2668 if (pending_stack_adjust >= 32
2669 || (pending_stack_adjust > 0 && (flags & ECF_MAY_BE_ALLOCA))
2670 || pass == 0)
2671 do_pending_stack_adjust ();
2673 /* When calling a const function, we must pop the stack args right away,
2674 so that the pop is deleted or moved with the call. */
2675 if (flags & (ECF_CONST | ECF_PURE))
2676 NO_DEFER_POP;
2678 /* Push the temporary stack slot level so that we can free any
2679 temporaries we make. */
2680 push_temp_slots ();
2682 #ifdef FINAL_REG_PARM_STACK_SPACE
2683 reg_parm_stack_space = FINAL_REG_PARM_STACK_SPACE (args_size.constant,
2684 args_size.var);
2685 #endif
2686 /* Precompute any arguments as needed. */
2687 if (pass)
2688 precompute_arguments (flags, num_actuals, args);
2690 /* Now we are about to start emitting insns that can be deleted
2691 if a libcall is deleted. */
2692 if (flags & (ECF_CONST | ECF_PURE | ECF_MALLOC))
2693 start_sequence ();
2695 adjusted_args_size = args_size;
2696 /* Compute the actual size of the argument block required. The variable
2697 and constant sizes must be combined, the size may have to be rounded,
2698 and there may be a minimum required size. When generating a sibcall
2699 pattern, do not round up, since we'll be re-using whatever space our
2700 caller provided. */
2701 unadjusted_args_size
2702 = compute_argument_block_size (reg_parm_stack_space,
2703 &adjusted_args_size,
2704 (pass == 0 ? 0
2705 : preferred_stack_boundary));
2707 old_stack_allocated = stack_pointer_delta - pending_stack_adjust;
2709 /* The argument block when performing a sibling call is the
2710 incoming argument block. */
2711 if (pass == 0)
2713 argblock = virtual_incoming_args_rtx;
2714 stored_args_map = sbitmap_alloc (args_size.constant);
2715 sbitmap_zero (stored_args_map);
2718 /* If we have no actual push instructions, or shouldn't use them,
2719 make space for all args right now. */
2720 else if (adjusted_args_size.var != 0)
2722 if (old_stack_level == 0)
2724 emit_stack_save (SAVE_BLOCK, &old_stack_level, NULL_RTX);
2725 old_pending_adj = pending_stack_adjust;
2726 pending_stack_adjust = 0;
2727 /* stack_arg_under_construction says whether a stack arg is
2728 being constructed at the old stack level. Pushing the stack
2729 gets a clean outgoing argument block. */
2730 old_stack_arg_under_construction = stack_arg_under_construction;
2731 stack_arg_under_construction = 0;
2733 argblock = push_block (ARGS_SIZE_RTX (adjusted_args_size), 0, 0);
2735 else
2737 /* Note that we must go through the motions of allocating an argument
2738 block even if the size is zero because we may be storing args
2739 in the area reserved for register arguments, which may be part of
2740 the stack frame. */
2742 int needed = adjusted_args_size.constant;
2744 /* Store the maximum argument space used. It will be pushed by
2745 the prologue (if ACCUMULATE_OUTGOING_ARGS, or stack overflow
2746 checking). */
2748 if (needed > current_function_outgoing_args_size)
2749 current_function_outgoing_args_size = needed;
2751 if (must_preallocate)
2753 if (ACCUMULATE_OUTGOING_ARGS)
2755 /* Since the stack pointer will never be pushed, it is
2756 possible for the evaluation of a parm to clobber
2757 something we have already written to the stack.
2758 Since most function calls on RISC machines do not use
2759 the stack, this is uncommon, but must work correctly.
2761 Therefore, we save any area of the stack that was already
2762 written and that we are using. Here we set up to do this
2763 by making a new stack usage map from the old one. The
2764 actual save will be done by store_one_arg.
2766 Another approach might be to try to reorder the argument
2767 evaluations to avoid this conflicting stack usage. */
2769 #ifndef OUTGOING_REG_PARM_STACK_SPACE
2770 /* Since we will be writing into the entire argument area,
2771 the map must be allocated for its entire size, not just
2772 the part that is the responsibility of the caller. */
2773 needed += reg_parm_stack_space;
2774 #endif
2776 #ifdef ARGS_GROW_DOWNWARD
2777 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
2778 needed + 1);
2779 #else
2780 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
2781 needed);
2782 #endif
2783 stack_usage_map
2784 = (char *) alloca (highest_outgoing_arg_in_use);
2786 if (initial_highest_arg_in_use)
2787 memcpy (stack_usage_map, initial_stack_usage_map,
2788 initial_highest_arg_in_use);
2790 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
2791 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
2792 (highest_outgoing_arg_in_use
2793 - initial_highest_arg_in_use));
2794 needed = 0;
2796 /* The address of the outgoing argument list must not be
2797 copied to a register here, because argblock would be left
2798 pointing to the wrong place after the call to
2799 allocate_dynamic_stack_space below. */
2801 argblock = virtual_outgoing_args_rtx;
2803 else
2805 if (inhibit_defer_pop == 0)
2807 /* Try to reuse some or all of the pending_stack_adjust
2808 to get this space. */
2809 needed
2810 = (combine_pending_stack_adjustment_and_call
2811 (unadjusted_args_size,
2812 &adjusted_args_size,
2813 preferred_unit_stack_boundary));
2815 /* combine_pending_stack_adjustment_and_call computes
2816 an adjustment before the arguments are allocated.
2817 Account for them and see whether or not the stack
2818 needs to go up or down. */
2819 needed = unadjusted_args_size - needed;
2821 if (needed < 0)
2823 /* We're releasing stack space. */
2824 /* ??? We can avoid any adjustment at all if we're
2825 already aligned. FIXME. */
2826 pending_stack_adjust = -needed;
2827 do_pending_stack_adjust ();
2828 needed = 0;
2830 else
2831 /* We need to allocate space. We'll do that in
2832 push_block below. */
2833 pending_stack_adjust = 0;
2836 /* Special case this because overhead of `push_block' in
2837 this case is non-trivial. */
2838 if (needed == 0)
2839 argblock = virtual_outgoing_args_rtx;
2840 else
2841 argblock = push_block (GEN_INT (needed), 0, 0);
2843 /* We only really need to call `copy_to_reg' in the case
2844 where push insns are going to be used to pass ARGBLOCK
2845 to a function call in ARGS. In that case, the stack
2846 pointer changes value from the allocation point to the
2847 call point, and hence the value of
2848 VIRTUAL_OUTGOING_ARGS_RTX changes as well. But might
2849 as well always do it. */
2850 argblock = copy_to_reg (argblock);
2852 /* The save/restore code in store_one_arg handles all
2853 cases except one: a constructor call (including a C
2854 function returning a BLKmode struct) to initialize
2855 an argument. */
2856 if (stack_arg_under_construction)
2858 #ifndef OUTGOING_REG_PARM_STACK_SPACE
2859 rtx push_size = GEN_INT (reg_parm_stack_space
2860 + adjusted_args_size.constant);
2861 #else
2862 rtx push_size = GEN_INT (adjusted_args_size.constant);
2863 #endif
2864 if (old_stack_level == 0)
2866 emit_stack_save (SAVE_BLOCK, &old_stack_level,
2867 NULL_RTX);
2868 old_pending_adj = pending_stack_adjust;
2869 pending_stack_adjust = 0;
2870 /* stack_arg_under_construction says whether a stack
2871 arg is being constructed at the old stack level.
2872 Pushing the stack gets a clean outgoing argument
2873 block. */
2874 old_stack_arg_under_construction
2875 = stack_arg_under_construction;
2876 stack_arg_under_construction = 0;
2877 /* Make a new map for the new argument list. */
2878 stack_usage_map = (char *)
2879 alloca (highest_outgoing_arg_in_use);
2880 memset (stack_usage_map, 0, highest_outgoing_arg_in_use);
2881 highest_outgoing_arg_in_use = 0;
2883 allocate_dynamic_stack_space (push_size, NULL_RTX,
2884 BITS_PER_UNIT);
2886 /* If argument evaluation might modify the stack pointer,
2887 copy the address of the argument list to a register. */
2888 for (i = 0; i < num_actuals; i++)
2889 if (args[i].pass_on_stack)
2891 argblock = copy_addr_to_reg (argblock);
2892 break;
2898 compute_argument_addresses (args, argblock, num_actuals);
2900 #ifdef PREFERRED_STACK_BOUNDARY
2901 /* If we push args individually in reverse order, perform stack alignment
2902 before the first push (the last arg). */
2903 if (PUSH_ARGS_REVERSED && argblock == 0
2904 && adjusted_args_size.constant != unadjusted_args_size)
2906 /* When the stack adjustment is pending, we get better code
2907 by combining the adjustments. */
2908 if (pending_stack_adjust
2909 && ! (flags & (ECF_CONST | ECF_PURE))
2910 && ! inhibit_defer_pop)
2912 pending_stack_adjust
2913 = (combine_pending_stack_adjustment_and_call
2914 (unadjusted_args_size,
2915 &adjusted_args_size,
2916 preferred_unit_stack_boundary));
2917 do_pending_stack_adjust ();
2919 else if (argblock == 0)
2920 anti_adjust_stack (GEN_INT (adjusted_args_size.constant
2921 - unadjusted_args_size));
2923 /* Now that the stack is properly aligned, pops can't safely
2924 be deferred during the evaluation of the arguments. */
2925 NO_DEFER_POP;
2926 #endif
2928 /* Don't try to defer pops if preallocating, not even from the first arg,
2929 since ARGBLOCK probably refers to the SP. */
2930 if (argblock)
2931 NO_DEFER_POP;
2933 funexp = rtx_for_function_call (fndecl, exp);
2935 /* Figure out the register where the value, if any, will come back. */
2936 valreg = 0;
2937 if (TYPE_MODE (TREE_TYPE (exp)) != VOIDmode
2938 && ! structure_value_addr)
2940 if (pcc_struct_value)
2941 valreg = hard_function_value (build_pointer_type (TREE_TYPE (exp)),
2942 fndecl, (pass == 0));
2943 else
2944 valreg = hard_function_value (TREE_TYPE (exp), fndecl, (pass == 0));
2947 /* Precompute all register parameters. It isn't safe to compute anything
2948 once we have started filling any specific hard regs. */
2949 precompute_register_parameters (num_actuals, args, &reg_parm_seen);
2951 #ifdef REG_PARM_STACK_SPACE
2952 /* Save the fixed argument area if it's part of the caller's frame and
2953 is clobbered by argument setup for this call. */
2954 if (ACCUMULATE_OUTGOING_ARGS && pass)
2955 save_area = save_fixed_argument_area (reg_parm_stack_space, argblock,
2956 &low_to_save, &high_to_save);
2957 #endif
2959 /* Now store (and compute if necessary) all non-register parms.
2960 These come before register parms, since they can require block-moves,
2961 which could clobber the registers used for register parms.
2962 Parms which have partial registers are not stored here,
2963 but we do preallocate space here if they want that. */
2965 for (i = 0; i < num_actuals; i++)
2966 if (args[i].reg == 0 || args[i].pass_on_stack)
2968 rtx before_arg = get_last_insn ();
2970 if (store_one_arg (&args[i], argblock, flags,
2971 adjusted_args_size.var != 0,
2972 reg_parm_stack_space)
2973 || (pass == 0
2974 && check_sibcall_argument_overlap (before_arg,
2975 &args[i])))
2976 sibcall_failure = 1;
2979 /* If we have a parm that is passed in registers but not in memory
2980 and whose alignment does not permit a direct copy into registers,
2981 make a group of pseudos that correspond to each register that we
2982 will later fill. */
2983 if (STRICT_ALIGNMENT)
2984 store_unaligned_arguments_into_pseudos (args, num_actuals);
2986 /* Now store any partially-in-registers parm.
2987 This is the last place a block-move can happen. */
2988 if (reg_parm_seen)
2989 for (i = 0; i < num_actuals; i++)
2990 if (args[i].partial != 0 && ! args[i].pass_on_stack)
2992 rtx before_arg = get_last_insn ();
2994 if (store_one_arg (&args[i], argblock, flags,
2995 adjusted_args_size.var != 0,
2996 reg_parm_stack_space)
2997 || (pass == 0
2998 && check_sibcall_argument_overlap (before_arg,
2999 &args[i])))
3000 sibcall_failure = 1;
3003 #ifdef PREFERRED_STACK_BOUNDARY
3004 /* If we pushed args in forward order, perform stack alignment
3005 after pushing the last arg. */
3006 if (!PUSH_ARGS_REVERSED && argblock == 0)
3007 anti_adjust_stack (GEN_INT (adjusted_args_size.constant
3008 - unadjusted_args_size));
3009 #endif
3011 /* If register arguments require space on the stack and stack space
3012 was not preallocated, allocate stack space here for arguments
3013 passed in registers. */
3014 #ifdef OUTGOING_REG_PARM_STACK_SPACE
3015 if (!ACCUMULATE_OUTGOING_ARGS
3016 && must_preallocate == 0 && reg_parm_stack_space > 0)
3017 anti_adjust_stack (GEN_INT (reg_parm_stack_space));
3018 #endif
3020 /* Pass the function the address in which to return a
3021 structure value. */
3022 if (pass != 0 && structure_value_addr && ! structure_value_addr_parm)
3024 emit_move_insn (struct_value_rtx,
3025 force_reg (Pmode,
3026 force_operand (structure_value_addr,
3027 NULL_RTX)));
3029 /* Mark the memory for the aggregate as write-only. */
3030 if (current_function_check_memory_usage)
3031 emit_library_call (chkr_set_right_libfunc, LCT_CONST_MAKE_BLOCK,
3032 VOIDmode, 3,
3033 structure_value_addr, ptr_mode,
3034 GEN_INT (struct_value_size),
3035 TYPE_MODE (sizetype),
3036 GEN_INT (MEMORY_USE_WO),
3037 TYPE_MODE (integer_type_node));
3039 if (GET_CODE (struct_value_rtx) == REG)
3040 use_reg (&call_fusage, struct_value_rtx);
3043 funexp = prepare_call_address (funexp, fndecl, &call_fusage,
3044 reg_parm_seen);
3046 load_register_parameters (args, num_actuals, &call_fusage, flags);
3048 /* Perform postincrements before actually calling the function. */
3049 emit_queue ();
3051 /* Save a pointer to the last insn before the call, so that we can
3052 later safely search backwards to find the CALL_INSN. */
3053 before_call = get_last_insn ();
3055 /* Set up next argument register. For sibling calls on machines
3056 with register windows this should be the incoming register. */
3057 #ifdef FUNCTION_INCOMING_ARG
3058 if (pass == 0)
3059 next_arg_reg = FUNCTION_INCOMING_ARG (args_so_far, VOIDmode,
3060 void_type_node, 1);
3061 else
3062 #endif
3063 next_arg_reg = FUNCTION_ARG (args_so_far, VOIDmode,
3064 void_type_node, 1);
3066 /* All arguments and registers used for the call must be set up by
3067 now! */
3069 #ifdef PREFERRED_STACK_BOUNDARY
3070 /* Stack must be properly aligned now. */
3071 if (pass && stack_pointer_delta % preferred_unit_stack_boundary)
3072 abort ();
3073 #endif
3075 /* Generate the actual call instruction. */
3076 emit_call_1 (funexp, fndecl, funtype, unadjusted_args_size,
3077 adjusted_args_size.constant, struct_value_size,
3078 next_arg_reg, valreg, old_inhibit_defer_pop, call_fusage,
3079 flags);
3081 /* Verify that we've deallocated all the stack we used. */
3082 if (pass
3083 && old_stack_allocated != stack_pointer_delta - pending_stack_adjust)
3084 abort ();
3086 /* If call is cse'able, make appropriate pair of reg-notes around it.
3087 Test valreg so we don't crash; may safely ignore `const'
3088 if return type is void. Disable for PARALLEL return values, because
3089 we have no way to move such values into a pseudo register. */
3090 if (pass
3091 && (flags & (ECF_CONST | ECF_PURE))
3092 && valreg != 0 && GET_CODE (valreg) != PARALLEL)
3094 rtx note = 0;
3095 rtx temp = gen_reg_rtx (GET_MODE (valreg));
3096 rtx insns;
3098 /* Mark the return value as a pointer if needed. */
3099 if (TREE_CODE (TREE_TYPE (exp)) == POINTER_TYPE)
3100 mark_reg_pointer (temp, TYPE_ALIGN (TREE_TYPE (TREE_TYPE (exp))));
3102 /* Construct an "equal form" for the value which mentions all the
3103 arguments in order as well as the function name. */
3104 for (i = 0; i < num_actuals; i++)
3105 note = gen_rtx_EXPR_LIST (VOIDmode, args[i].initial_value, note);
3106 note = gen_rtx_EXPR_LIST (VOIDmode, funexp, note);
3108 insns = get_insns ();
3109 end_sequence ();
3111 if (flags & ECF_PURE)
3112 note = gen_rtx_EXPR_LIST (VOIDmode,
3113 gen_rtx_USE (VOIDmode,
3114 gen_rtx_MEM (BLKmode,
3115 gen_rtx_SCRATCH (VOIDmode))), note);
3117 emit_libcall_block (insns, temp, valreg, note);
3119 valreg = temp;
3121 else if (flags & (ECF_CONST | ECF_PURE))
3123 /* Otherwise, just write out the sequence without a note. */
3124 rtx insns = get_insns ();
3126 end_sequence ();
3127 emit_insns (insns);
3129 else if (flags & ECF_MALLOC)
3131 rtx temp = gen_reg_rtx (GET_MODE (valreg));
3132 rtx last, insns;
3134 /* The return value from a malloc-like function is a pointer. */
3135 if (TREE_CODE (TREE_TYPE (exp)) == POINTER_TYPE)
3136 mark_reg_pointer (temp, BIGGEST_ALIGNMENT);
3138 emit_move_insn (temp, valreg);
3140 /* The return value from a malloc-like function can not alias
3141 anything else. */
3142 last = get_last_insn ();
3143 REG_NOTES (last) =
3144 gen_rtx_EXPR_LIST (REG_NOALIAS, temp, REG_NOTES (last));
3146 /* Write out the sequence. */
3147 insns = get_insns ();
3148 end_sequence ();
3149 emit_insns (insns);
3150 valreg = temp;
3153 /* For calls to `setjmp', etc., inform flow.c it should complain
3154 if nonvolatile values are live. For functions that cannot return,
3155 inform flow that control does not fall through. */
3157 if ((flags & (ECF_RETURNS_TWICE | ECF_NORETURN | ECF_LONGJMP)) || pass == 0)
3159 /* The barrier or NOTE_INSN_SETJMP note must be emitted
3160 immediately after the CALL_INSN. Some ports emit more
3161 than just a CALL_INSN above, so we must search for it here. */
3163 rtx last = get_last_insn ();
3164 while (GET_CODE (last) != CALL_INSN)
3166 last = PREV_INSN (last);
3167 /* There was no CALL_INSN? */
3168 if (last == before_call)
3169 abort ();
3172 if (flags & ECF_RETURNS_TWICE)
3174 emit_note_after (NOTE_INSN_SETJMP, last);
3175 current_function_calls_setjmp = 1;
3177 else
3178 emit_barrier_after (last);
3181 if (flags & ECF_LONGJMP)
3182 current_function_calls_longjmp = 1;
3184 /* If this function is returning into a memory location marked as
3185 readonly, it means it is initializing that location. But we normally
3186 treat functions as not clobbering such locations, so we need to
3187 specify that this one does. */
3188 if (target != 0 && GET_CODE (target) == MEM
3189 && structure_value_addr != 0 && RTX_UNCHANGING_P (target))
3190 emit_insn (gen_rtx_CLOBBER (VOIDmode, target));
3192 /* If value type not void, return an rtx for the value. */
3194 /* If there are cleanups to be called, don't use a hard reg as target.
3195 We need to double check this and see if it matters anymore. */
3196 if (any_pending_cleanups (1))
3198 if (target && REG_P (target)
3199 && REGNO (target) < FIRST_PSEUDO_REGISTER)
3200 target = 0;
3201 sibcall_failure = 1;
3204 if (TYPE_MODE (TREE_TYPE (exp)) == VOIDmode
3205 || ignore)
3207 target = const0_rtx;
3209 else if (structure_value_addr)
3211 if (target == 0 || GET_CODE (target) != MEM)
3213 target
3214 = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (exp)),
3215 memory_address (TYPE_MODE (TREE_TYPE (exp)),
3216 structure_value_addr));
3217 set_mem_attributes (target, exp, 1);
3220 else if (pcc_struct_value)
3222 /* This is the special C++ case where we need to
3223 know what the true target was. We take care to
3224 never use this value more than once in one expression. */
3225 target = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (exp)),
3226 copy_to_reg (valreg));
3227 set_mem_attributes (target, exp, 1);
3229 /* Handle calls that return values in multiple non-contiguous locations.
3230 The Irix 6 ABI has examples of this. */
3231 else if (GET_CODE (valreg) == PARALLEL)
3233 int bytes = int_size_in_bytes (TREE_TYPE (exp));
3235 if (target == 0)
3237 target = assign_stack_temp (TYPE_MODE (TREE_TYPE (exp)),
3238 bytes, 0);
3239 MEM_SET_IN_STRUCT_P (target, AGGREGATE_TYPE_P (TREE_TYPE (exp)));
3240 preserve_temp_slots (target);
3243 if (! rtx_equal_p (target, valreg))
3244 emit_group_store (target, valreg, bytes,
3245 TYPE_ALIGN (TREE_TYPE (exp)));
3247 /* We can not support sibling calls for this case. */
3248 sibcall_failure = 1;
3250 else if (target
3251 && GET_MODE (target) == TYPE_MODE (TREE_TYPE (exp))
3252 && GET_MODE (target) == GET_MODE (valreg))
3254 /* TARGET and VALREG cannot be equal at this point because the
3255 latter would not have REG_FUNCTION_VALUE_P true, while the
3256 former would if it were referring to the same register.
3258 If they refer to the same register, this move will be a no-op,
3259 except when function inlining is being done. */
3260 emit_move_insn (target, valreg);
3262 else if (TYPE_MODE (TREE_TYPE (exp)) == BLKmode)
3264 target = copy_blkmode_from_reg (target, valreg, TREE_TYPE (exp));
3266 /* We can not support sibling calls for this case. */
3267 sibcall_failure = 1;
3269 else
3270 target = copy_to_reg (valreg);
3272 #ifdef PROMOTE_FUNCTION_RETURN
3273 /* If we promoted this return value, make the proper SUBREG. TARGET
3274 might be const0_rtx here, so be careful. */
3275 if (GET_CODE (target) == REG
3276 && TYPE_MODE (TREE_TYPE (exp)) != BLKmode
3277 && GET_MODE (target) != TYPE_MODE (TREE_TYPE (exp)))
3279 tree type = TREE_TYPE (exp);
3280 int unsignedp = TREE_UNSIGNED (type);
3282 /* If we don't promote as expected, something is wrong. */
3283 if (GET_MODE (target)
3284 != promote_mode (type, TYPE_MODE (type), &unsignedp, 1))
3285 abort ();
3287 target = gen_rtx_SUBREG (TYPE_MODE (type), target, 0);
3288 SUBREG_PROMOTED_VAR_P (target) = 1;
3289 SUBREG_PROMOTED_UNSIGNED_P (target) = unsignedp;
3291 #endif
3293 /* If size of args is variable or this was a constructor call for a stack
3294 argument, restore saved stack-pointer value. */
3296 if (old_stack_level && ! (flags & ECF_SP_DEPRESSED))
3298 emit_stack_restore (SAVE_BLOCK, old_stack_level, NULL_RTX);
3299 pending_stack_adjust = old_pending_adj;
3300 stack_arg_under_construction = old_stack_arg_under_construction;
3301 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
3302 stack_usage_map = initial_stack_usage_map;
3303 sibcall_failure = 1;
3305 else if (ACCUMULATE_OUTGOING_ARGS && pass)
3307 #ifdef REG_PARM_STACK_SPACE
3308 if (save_area)
3310 restore_fixed_argument_area (save_area, argblock,
3311 high_to_save, low_to_save);
3313 #endif
3315 /* If we saved any argument areas, restore them. */
3316 for (i = 0; i < num_actuals; i++)
3317 if (args[i].save_area)
3319 enum machine_mode save_mode = GET_MODE (args[i].save_area);
3320 rtx stack_area
3321 = gen_rtx_MEM (save_mode,
3322 memory_address (save_mode,
3323 XEXP (args[i].stack_slot, 0)));
3325 if (save_mode != BLKmode)
3326 emit_move_insn (stack_area, args[i].save_area);
3327 else
3328 emit_block_move (stack_area,
3329 validize_mem (args[i].save_area),
3330 GEN_INT (args[i].size.constant),
3331 PARM_BOUNDARY);
3334 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
3335 stack_usage_map = initial_stack_usage_map;
3338 /* If this was alloca, record the new stack level for nonlocal gotos.
3339 Check for the handler slots since we might not have a save area
3340 for non-local gotos. */
3342 if ((flags & ECF_MAY_BE_ALLOCA) && nonlocal_goto_handler_slots != 0)
3343 emit_stack_save (SAVE_NONLOCAL, &nonlocal_goto_stack_level, NULL_RTX);
3345 pop_temp_slots ();
3347 /* Free up storage we no longer need. */
3348 for (i = 0; i < num_actuals; ++i)
3349 if (args[i].aligned_regs)
3350 free (args[i].aligned_regs);
3352 if (pass == 0)
3354 /* Undo the fake expand_start_target_temps we did earlier. If
3355 there had been any cleanups created, we've already set
3356 sibcall_failure. */
3357 expand_end_target_temps ();
3360 insns = get_insns ();
3361 end_sequence ();
3363 if (pass == 0)
3365 tail_call_insns = insns;
3367 /* Restore the pending stack adjustment now that we have
3368 finished generating the sibling call sequence. */
3370 pending_stack_adjust = save_pending_stack_adjust;
3371 stack_pointer_delta = save_stack_pointer_delta;
3373 /* Prepare arg structure for next iteration. */
3374 for (i = 0; i < num_actuals; i++)
3376 args[i].value = 0;
3377 args[i].aligned_regs = 0;
3378 args[i].stack = 0;
3381 sbitmap_free (stored_args_map);
3383 else
3384 normal_call_insns = insns;
3386 /* If something prevents making this a sibling call,
3387 zero out the sequence. */
3388 if (sibcall_failure)
3389 tail_call_insns = NULL_RTX;
3392 /* The function optimize_sibling_and_tail_recursive_calls doesn't
3393 handle CALL_PLACEHOLDERs inside other CALL_PLACEHOLDERs. This
3394 can happen if the arguments to this function call an inline
3395 function who's expansion contains another CALL_PLACEHOLDER.
3397 If there are any C_Ps in any of these sequences, replace them
3398 with their normal call. */
3400 for (insn = normal_call_insns; insn; insn = NEXT_INSN (insn))
3401 if (GET_CODE (insn) == CALL_INSN
3402 && GET_CODE (PATTERN (insn)) == CALL_PLACEHOLDER)
3403 replace_call_placeholder (insn, sibcall_use_normal);
3405 for (insn = tail_call_insns; insn; insn = NEXT_INSN (insn))
3406 if (GET_CODE (insn) == CALL_INSN
3407 && GET_CODE (PATTERN (insn)) == CALL_PLACEHOLDER)
3408 replace_call_placeholder (insn, sibcall_use_normal);
3410 for (insn = tail_recursion_insns; insn; insn = NEXT_INSN (insn))
3411 if (GET_CODE (insn) == CALL_INSN
3412 && GET_CODE (PATTERN (insn)) == CALL_PLACEHOLDER)
3413 replace_call_placeholder (insn, sibcall_use_normal);
3415 /* If this was a potential tail recursion site, then emit a
3416 CALL_PLACEHOLDER with the normal and the tail recursion streams.
3417 One of them will be selected later. */
3418 if (tail_recursion_insns || tail_call_insns)
3420 /* The tail recursion label must be kept around. We could expose
3421 its use in the CALL_PLACEHOLDER, but that creates unwanted edges
3422 and makes determining true tail recursion sites difficult.
3424 So we set LABEL_PRESERVE_P here, then clear it when we select
3425 one of the call sequences after rtl generation is complete. */
3426 if (tail_recursion_insns)
3427 LABEL_PRESERVE_P (tail_recursion_label) = 1;
3428 emit_call_insn (gen_rtx_CALL_PLACEHOLDER (VOIDmode, normal_call_insns,
3429 tail_call_insns,
3430 tail_recursion_insns,
3431 tail_recursion_label));
3433 else
3434 emit_insns (normal_call_insns);
3436 currently_expanding_call--;
3438 /* If this function returns with the stack pointer depressed, ensure
3439 this block saves and restores the stack pointer, show it was
3440 changed, and adjust for any outgoing arg space. */
3441 if (flags & ECF_SP_DEPRESSED)
3443 clear_pending_stack_adjust ();
3444 emit_insn (gen_rtx (CLOBBER, VOIDmode, stack_pointer_rtx));
3445 emit_move_insn (virtual_stack_dynamic_rtx, stack_pointer_rtx);
3446 save_stack_pointer ();
3449 return target;
3452 /* Returns nonzero if FUN is the symbol for a library function which can
3453 not throw. */
3455 static int
3456 libfunc_nothrow (fun)
3457 rtx fun;
3459 if (fun == throw_libfunc
3460 || fun == rethrow_libfunc
3461 || fun == sjthrow_libfunc
3462 || fun == sjpopnthrow_libfunc)
3463 return 0;
3465 return 1;
3468 /* Output a library call to function FUN (a SYMBOL_REF rtx).
3469 The RETVAL parameter specifies whether return value needs to be saved, other
3470 parameters are documented in the emit_library_call function bellow. */
3471 static rtx
3472 emit_library_call_value_1 (retval, orgfun, value, fn_type, outmode, nargs, p)
3473 int retval;
3474 rtx orgfun;
3475 rtx value;
3476 enum libcall_type fn_type;
3477 enum machine_mode outmode;
3478 int nargs;
3479 va_list p;
3481 /* Total size in bytes of all the stack-parms scanned so far. */
3482 struct args_size args_size;
3483 /* Size of arguments before any adjustments (such as rounding). */
3484 struct args_size original_args_size;
3485 register int argnum;
3486 rtx fun;
3487 int inc;
3488 int count;
3489 struct args_size alignment_pad;
3490 rtx argblock = 0;
3491 CUMULATIVE_ARGS args_so_far;
3492 struct arg
3494 rtx value;
3495 enum machine_mode mode;
3496 rtx reg;
3497 int partial;
3498 struct args_size offset;
3499 struct args_size size;
3500 rtx save_area;
3502 struct arg *argvec;
3503 int old_inhibit_defer_pop = inhibit_defer_pop;
3504 rtx call_fusage = 0;
3505 rtx mem_value = 0;
3506 rtx valreg;
3507 int pcc_struct_value = 0;
3508 int struct_value_size = 0;
3509 int flags = 0;
3510 int reg_parm_stack_space = 0;
3511 int needed;
3513 #ifdef REG_PARM_STACK_SPACE
3514 /* Define the boundary of the register parm stack space that needs to be
3515 save, if any. */
3516 int low_to_save = -1, high_to_save = 0;
3517 rtx save_area = 0; /* Place that it is saved. */
3518 #endif
3520 /* Size of the stack reserved for parameter registers. */
3521 int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
3522 char *initial_stack_usage_map = stack_usage_map;
3524 #ifdef REG_PARM_STACK_SPACE
3525 #ifdef MAYBE_REG_PARM_STACK_SPACE
3526 reg_parm_stack_space = MAYBE_REG_PARM_STACK_SPACE;
3527 #else
3528 reg_parm_stack_space = REG_PARM_STACK_SPACE ((tree) 0);
3529 #endif
3530 #endif
3532 if (fn_type == LCT_CONST_MAKE_BLOCK)
3533 flags |= ECF_CONST;
3534 else if (fn_type == LCT_PURE_MAKE_BLOCK)
3535 flags |= ECF_PURE;
3536 fun = orgfun;
3538 if (libfunc_nothrow (fun))
3539 flags |= ECF_NOTHROW;
3541 #ifdef PREFERRED_STACK_BOUNDARY
3542 /* Ensure current function's preferred stack boundary is at least
3543 what we need. */
3544 if (cfun->preferred_stack_boundary < PREFERRED_STACK_BOUNDARY)
3545 cfun->preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
3546 #endif
3548 /* If this kind of value comes back in memory,
3549 decide where in memory it should come back. */
3550 if (outmode != VOIDmode && aggregate_value_p (type_for_mode (outmode, 0)))
3552 #ifdef PCC_STATIC_STRUCT_RETURN
3553 rtx pointer_reg
3554 = hard_function_value (build_pointer_type (type_for_mode (outmode, 0)),
3555 0, 0);
3556 mem_value = gen_rtx_MEM (outmode, pointer_reg);
3557 pcc_struct_value = 1;
3558 if (value == 0)
3559 value = gen_reg_rtx (outmode);
3560 #else /* not PCC_STATIC_STRUCT_RETURN */
3561 struct_value_size = GET_MODE_SIZE (outmode);
3562 if (value != 0 && GET_CODE (value) == MEM)
3563 mem_value = value;
3564 else
3565 mem_value = assign_stack_temp (outmode, GET_MODE_SIZE (outmode), 0);
3566 #endif
3568 /* This call returns a big structure. */
3569 flags &= ~(ECF_CONST | ECF_PURE);
3572 /* ??? Unfinished: must pass the memory address as an argument. */
3574 /* Copy all the libcall-arguments out of the varargs data
3575 and into a vector ARGVEC.
3577 Compute how to pass each argument. We only support a very small subset
3578 of the full argument passing conventions to limit complexity here since
3579 library functions shouldn't have many args. */
3581 argvec = (struct arg *) alloca ((nargs + 1) * sizeof (struct arg));
3582 memset ((char *) argvec, 0, (nargs + 1) * sizeof (struct arg));
3584 INIT_CUMULATIVE_ARGS (args_so_far, NULL_TREE, fun, 0);
3586 args_size.constant = 0;
3587 args_size.var = 0;
3589 count = 0;
3591 /* Now we are about to start emitting insns that can be deleted
3592 if a libcall is deleted. */
3593 if (flags & (ECF_CONST | ECF_PURE))
3594 start_sequence ();
3596 push_temp_slots ();
3598 /* If there's a structure value address to be passed,
3599 either pass it in the special place, or pass it as an extra argument. */
3600 if (mem_value && struct_value_rtx == 0 && ! pcc_struct_value)
3602 rtx addr = XEXP (mem_value, 0);
3603 nargs++;
3605 /* Make sure it is a reasonable operand for a move or push insn. */
3606 if (GET_CODE (addr) != REG && GET_CODE (addr) != MEM
3607 && ! (CONSTANT_P (addr) && LEGITIMATE_CONSTANT_P (addr)))
3608 addr = force_operand (addr, NULL_RTX);
3610 argvec[count].value = addr;
3611 argvec[count].mode = Pmode;
3612 argvec[count].partial = 0;
3614 argvec[count].reg = FUNCTION_ARG (args_so_far, Pmode, NULL_TREE, 1);
3615 #ifdef FUNCTION_ARG_PARTIAL_NREGS
3616 if (FUNCTION_ARG_PARTIAL_NREGS (args_so_far, Pmode, NULL_TREE, 1))
3617 abort ();
3618 #endif
3620 locate_and_pad_parm (Pmode, NULL_TREE,
3621 #ifdef STACK_PARMS_IN_REG_PARM_AREA
3623 #else
3624 argvec[count].reg != 0,
3625 #endif
3626 NULL_TREE, &args_size, &argvec[count].offset,
3627 &argvec[count].size, &alignment_pad);
3629 if (argvec[count].reg == 0 || argvec[count].partial != 0
3630 || reg_parm_stack_space > 0)
3631 args_size.constant += argvec[count].size.constant;
3633 FUNCTION_ARG_ADVANCE (args_so_far, Pmode, (tree) 0, 1);
3635 count++;
3638 for (; count < nargs; count++)
3640 rtx val = va_arg (p, rtx);
3641 enum machine_mode mode = va_arg (p, enum machine_mode);
3643 /* We cannot convert the arg value to the mode the library wants here;
3644 must do it earlier where we know the signedness of the arg. */
3645 if (mode == BLKmode
3646 || (GET_MODE (val) != mode && GET_MODE (val) != VOIDmode))
3647 abort ();
3649 /* On some machines, there's no way to pass a float to a library fcn.
3650 Pass it as a double instead. */
3651 #ifdef LIBGCC_NEEDS_DOUBLE
3652 if (LIBGCC_NEEDS_DOUBLE && mode == SFmode)
3653 val = convert_modes (DFmode, SFmode, val, 0), mode = DFmode;
3654 #endif
3656 /* There's no need to call protect_from_queue, because
3657 either emit_move_insn or emit_push_insn will do that. */
3659 /* Make sure it is a reasonable operand for a move or push insn. */
3660 if (GET_CODE (val) != REG && GET_CODE (val) != MEM
3661 && ! (CONSTANT_P (val) && LEGITIMATE_CONSTANT_P (val)))
3662 val = force_operand (val, NULL_RTX);
3664 #ifdef FUNCTION_ARG_PASS_BY_REFERENCE
3665 if (FUNCTION_ARG_PASS_BY_REFERENCE (args_so_far, mode, NULL_TREE, 1))
3667 /* We do not support FUNCTION_ARG_CALLEE_COPIES here since it can
3668 be viewed as just an efficiency improvement. */
3669 rtx slot = assign_stack_temp (mode, GET_MODE_SIZE (mode), 0);
3670 emit_move_insn (slot, val);
3671 val = force_operand (XEXP (slot, 0), NULL_RTX);
3672 mode = Pmode;
3674 #endif
3676 argvec[count].value = val;
3677 argvec[count].mode = mode;
3679 argvec[count].reg = FUNCTION_ARG (args_so_far, mode, NULL_TREE, 1);
3681 #ifdef FUNCTION_ARG_PARTIAL_NREGS
3682 argvec[count].partial
3683 = FUNCTION_ARG_PARTIAL_NREGS (args_so_far, mode, NULL_TREE, 1);
3684 #else
3685 argvec[count].partial = 0;
3686 #endif
3688 locate_and_pad_parm (mode, NULL_TREE,
3689 #ifdef STACK_PARMS_IN_REG_PARM_AREA
3691 #else
3692 argvec[count].reg != 0,
3693 #endif
3694 NULL_TREE, &args_size, &argvec[count].offset,
3695 &argvec[count].size, &alignment_pad);
3697 if (argvec[count].size.var)
3698 abort ();
3700 if (reg_parm_stack_space == 0 && argvec[count].partial)
3701 argvec[count].size.constant -= argvec[count].partial * UNITS_PER_WORD;
3703 if (argvec[count].reg == 0 || argvec[count].partial != 0
3704 || reg_parm_stack_space > 0)
3705 args_size.constant += argvec[count].size.constant;
3707 FUNCTION_ARG_ADVANCE (args_so_far, mode, (tree) 0, 1);
3710 #ifdef FINAL_REG_PARM_STACK_SPACE
3711 reg_parm_stack_space = FINAL_REG_PARM_STACK_SPACE (args_size.constant,
3712 args_size.var);
3713 #endif
3714 /* If this machine requires an external definition for library
3715 functions, write one out. */
3716 assemble_external_libcall (fun);
3718 original_args_size = args_size;
3719 #ifdef PREFERRED_STACK_BOUNDARY
3720 args_size.constant = (((args_size.constant
3721 + stack_pointer_delta
3722 + STACK_BYTES - 1)
3723 / STACK_BYTES
3724 * STACK_BYTES)
3725 - stack_pointer_delta);
3726 #endif
3728 args_size.constant = MAX (args_size.constant,
3729 reg_parm_stack_space);
3731 #ifndef OUTGOING_REG_PARM_STACK_SPACE
3732 args_size.constant -= reg_parm_stack_space;
3733 #endif
3735 if (args_size.constant > current_function_outgoing_args_size)
3736 current_function_outgoing_args_size = args_size.constant;
3738 if (ACCUMULATE_OUTGOING_ARGS)
3740 /* Since the stack pointer will never be pushed, it is possible for
3741 the evaluation of a parm to clobber something we have already
3742 written to the stack. Since most function calls on RISC machines
3743 do not use the stack, this is uncommon, but must work correctly.
3745 Therefore, we save any area of the stack that was already written
3746 and that we are using. Here we set up to do this by making a new
3747 stack usage map from the old one.
3749 Another approach might be to try to reorder the argument
3750 evaluations to avoid this conflicting stack usage. */
3752 needed = args_size.constant;
3754 #ifndef OUTGOING_REG_PARM_STACK_SPACE
3755 /* Since we will be writing into the entire argument area, the
3756 map must be allocated for its entire size, not just the part that
3757 is the responsibility of the caller. */
3758 needed += reg_parm_stack_space;
3759 #endif
3761 #ifdef ARGS_GROW_DOWNWARD
3762 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
3763 needed + 1);
3764 #else
3765 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
3766 needed);
3767 #endif
3768 stack_usage_map = (char *) alloca (highest_outgoing_arg_in_use);
3770 if (initial_highest_arg_in_use)
3771 memcpy (stack_usage_map, initial_stack_usage_map,
3772 initial_highest_arg_in_use);
3774 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
3775 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
3776 highest_outgoing_arg_in_use - initial_highest_arg_in_use);
3777 needed = 0;
3779 /* The address of the outgoing argument list must not be copied to a
3780 register here, because argblock would be left pointing to the
3781 wrong place after the call to allocate_dynamic_stack_space below. */
3783 argblock = virtual_outgoing_args_rtx;
3785 else
3787 if (!PUSH_ARGS)
3788 argblock = push_block (GEN_INT (args_size.constant), 0, 0);
3791 #ifdef PREFERRED_STACK_BOUNDARY
3792 /* If we push args individually in reverse order, perform stack alignment
3793 before the first push (the last arg). */
3794 if (argblock == 0 && PUSH_ARGS_REVERSED)
3795 anti_adjust_stack (GEN_INT (args_size.constant
3796 - original_args_size.constant));
3797 #endif
3799 if (PUSH_ARGS_REVERSED)
3801 inc = -1;
3802 argnum = nargs - 1;
3804 else
3806 inc = 1;
3807 argnum = 0;
3810 #ifdef REG_PARM_STACK_SPACE
3811 if (ACCUMULATE_OUTGOING_ARGS)
3813 /* The argument list is the property of the called routine and it
3814 may clobber it. If the fixed area has been used for previous
3815 parameters, we must save and restore it.
3817 Here we compute the boundary of the that needs to be saved, if any. */
3819 #ifdef ARGS_GROW_DOWNWARD
3820 for (count = 0; count < reg_parm_stack_space + 1; count++)
3821 #else
3822 for (count = 0; count < reg_parm_stack_space; count++)
3823 #endif
3825 if (count >= highest_outgoing_arg_in_use
3826 || stack_usage_map[count] == 0)
3827 continue;
3829 if (low_to_save == -1)
3830 low_to_save = count;
3832 high_to_save = count;
3835 if (low_to_save >= 0)
3837 int num_to_save = high_to_save - low_to_save + 1;
3838 enum machine_mode save_mode
3839 = mode_for_size (num_to_save * BITS_PER_UNIT, MODE_INT, 1);
3840 rtx stack_area;
3842 /* If we don't have the required alignment, must do this in BLKmode. */
3843 if ((low_to_save & (MIN (GET_MODE_SIZE (save_mode),
3844 BIGGEST_ALIGNMENT / UNITS_PER_WORD) - 1)))
3845 save_mode = BLKmode;
3847 #ifdef ARGS_GROW_DOWNWARD
3848 stack_area = gen_rtx_MEM (save_mode,
3849 memory_address (save_mode,
3850 plus_constant (argblock,
3851 -high_to_save)));
3852 #else
3853 stack_area = gen_rtx_MEM (save_mode,
3854 memory_address (save_mode,
3855 plus_constant (argblock,
3856 low_to_save)));
3857 #endif
3858 if (save_mode == BLKmode)
3860 save_area = assign_stack_temp (BLKmode, num_to_save, 0);
3861 emit_block_move (validize_mem (save_area), stack_area,
3862 GEN_INT (num_to_save), PARM_BOUNDARY);
3864 else
3866 save_area = gen_reg_rtx (save_mode);
3867 emit_move_insn (save_area, stack_area);
3871 #endif
3873 /* Push the args that need to be pushed. */
3875 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
3876 are to be pushed. */
3877 for (count = 0; count < nargs; count++, argnum += inc)
3879 register enum machine_mode mode = argvec[argnum].mode;
3880 register rtx val = argvec[argnum].value;
3881 rtx reg = argvec[argnum].reg;
3882 int partial = argvec[argnum].partial;
3883 int lower_bound = 0, upper_bound = 0, i;
3885 if (! (reg != 0 && partial == 0))
3887 if (ACCUMULATE_OUTGOING_ARGS)
3889 /* If this is being stored into a pre-allocated, fixed-size,
3890 stack area, save any previous data at that location. */
3892 #ifdef ARGS_GROW_DOWNWARD
3893 /* stack_slot is negative, but we want to index stack_usage_map
3894 with positive values. */
3895 upper_bound = -argvec[argnum].offset.constant + 1;
3896 lower_bound = upper_bound - argvec[argnum].size.constant;
3897 #else
3898 lower_bound = argvec[argnum].offset.constant;
3899 upper_bound = lower_bound + argvec[argnum].size.constant;
3900 #endif
3902 for (i = lower_bound; i < upper_bound; i++)
3903 if (stack_usage_map[i]
3904 /* Don't store things in the fixed argument area at this
3905 point; it has already been saved. */
3906 && i > reg_parm_stack_space)
3907 break;
3909 if (i != upper_bound)
3911 /* We need to make a save area. See what mode we can make
3912 it. */
3913 enum machine_mode save_mode
3914 = mode_for_size (argvec[argnum].size.constant
3915 * BITS_PER_UNIT,
3916 MODE_INT, 1);
3917 rtx stack_area
3918 = gen_rtx_MEM
3919 (save_mode,
3920 memory_address
3921 (save_mode,
3922 plus_constant (argblock,
3923 argvec[argnum].offset.constant)));
3924 argvec[argnum].save_area = gen_reg_rtx (save_mode);
3926 emit_move_insn (argvec[argnum].save_area, stack_area);
3930 emit_push_insn (val, mode, NULL_TREE, NULL_RTX, 0, partial, reg, 0,
3931 argblock, GEN_INT (argvec[argnum].offset.constant),
3932 reg_parm_stack_space, ARGS_SIZE_RTX (alignment_pad));
3934 /* Now mark the segment we just used. */
3935 if (ACCUMULATE_OUTGOING_ARGS)
3936 for (i = lower_bound; i < upper_bound; i++)
3937 stack_usage_map[i] = 1;
3939 NO_DEFER_POP;
3943 #ifdef PREFERRED_STACK_BOUNDARY
3944 /* If we pushed args in forward order, perform stack alignment
3945 after pushing the last arg. */
3946 if (argblock == 0 && !PUSH_ARGS_REVERSED)
3947 anti_adjust_stack (GEN_INT (args_size.constant
3948 - original_args_size.constant));
3949 #endif
3951 if (PUSH_ARGS_REVERSED)
3952 argnum = nargs - 1;
3953 else
3954 argnum = 0;
3956 fun = prepare_call_address (fun, NULL_TREE, &call_fusage, 0);
3958 /* Now load any reg parms into their regs. */
3960 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
3961 are to be pushed. */
3962 for (count = 0; count < nargs; count++, argnum += inc)
3964 register rtx val = argvec[argnum].value;
3965 rtx reg = argvec[argnum].reg;
3966 int partial = argvec[argnum].partial;
3968 /* Handle calls that pass values in multiple non-contiguous
3969 locations. The PA64 has examples of this for library calls. */
3970 if (reg != 0 && GET_CODE (reg) == PARALLEL)
3971 emit_group_load (reg, val,
3972 GET_MODE_SIZE (GET_MODE (val)),
3973 GET_MODE_ALIGNMENT (GET_MODE (val)));
3974 else if (reg != 0 && partial == 0)
3975 emit_move_insn (reg, val);
3977 NO_DEFER_POP;
3980 /* Any regs containing parms remain in use through the call. */
3981 for (count = 0; count < nargs; count++)
3983 rtx reg = argvec[count].reg;
3984 if (reg != 0 && GET_CODE (reg) == PARALLEL)
3985 use_group_regs (&call_fusage, reg);
3986 else if (reg != 0)
3987 use_reg (&call_fusage, reg);
3990 /* Pass the function the address in which to return a structure value. */
3991 if (mem_value != 0 && struct_value_rtx != 0 && ! pcc_struct_value)
3993 emit_move_insn (struct_value_rtx,
3994 force_reg (Pmode,
3995 force_operand (XEXP (mem_value, 0),
3996 NULL_RTX)));
3997 if (GET_CODE (struct_value_rtx) == REG)
3998 use_reg (&call_fusage, struct_value_rtx);
4001 /* Don't allow popping to be deferred, since then
4002 cse'ing of library calls could delete a call and leave the pop. */
4003 NO_DEFER_POP;
4004 valreg = (mem_value == 0 && outmode != VOIDmode
4005 ? hard_libcall_value (outmode) : NULL_RTX);
4007 #ifdef PREFERRED_STACK_BOUNDARY
4008 /* Stack must be properly aligned now. */
4009 if (stack_pointer_delta & (PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT - 1))
4010 abort ();
4011 #endif
4013 /* We pass the old value of inhibit_defer_pop + 1 to emit_call_1, which
4014 will set inhibit_defer_pop to that value. */
4015 /* The return type is needed to decide how many bytes the function pops.
4016 Signedness plays no role in that, so for simplicity, we pretend it's
4017 always signed. We also assume that the list of arguments passed has
4018 no impact, so we pretend it is unknown. */
4020 emit_call_1 (fun,
4021 get_identifier (XSTR (orgfun, 0)),
4022 build_function_type (outmode == VOIDmode ? void_type_node
4023 : type_for_mode (outmode, 0), NULL_TREE),
4024 original_args_size.constant, args_size.constant,
4025 struct_value_size,
4026 FUNCTION_ARG (args_so_far, VOIDmode, void_type_node, 1),
4027 valreg,
4028 old_inhibit_defer_pop + 1, call_fusage, flags);
4030 /* Now restore inhibit_defer_pop to its actual original value. */
4031 OK_DEFER_POP;
4033 /* If call is cse'able, make appropriate pair of reg-notes around it.
4034 Test valreg so we don't crash; may safely ignore `const'
4035 if return type is void. Disable for PARALLEL return values, because
4036 we have no way to move such values into a pseudo register. */
4037 if ((flags & (ECF_CONST | ECF_PURE))
4038 && valreg != 0 && GET_CODE (valreg) != PARALLEL)
4040 rtx note = 0;
4041 rtx temp = gen_reg_rtx (GET_MODE (valreg));
4042 rtx insns;
4043 int i;
4045 /* Construct an "equal form" for the value which mentions all the
4046 arguments in order as well as the function name. */
4047 for (i = 0; i < nargs; i++)
4048 note = gen_rtx_EXPR_LIST (VOIDmode, argvec[i].value, note);
4049 note = gen_rtx_EXPR_LIST (VOIDmode, fun, note);
4051 insns = get_insns ();
4052 end_sequence ();
4054 if (flags & ECF_PURE)
4055 note = gen_rtx_EXPR_LIST (VOIDmode,
4056 gen_rtx_USE (VOIDmode,
4057 gen_rtx_MEM (BLKmode,
4058 gen_rtx_SCRATCH (VOIDmode))), note);
4060 emit_libcall_block (insns, temp, valreg, note);
4062 valreg = temp;
4064 else if (flags & (ECF_CONST | ECF_PURE))
4066 /* Otherwise, just write out the sequence without a note. */
4067 rtx insns = get_insns ();
4069 end_sequence ();
4070 emit_insns (insns);
4072 pop_temp_slots ();
4074 /* Copy the value to the right place. */
4075 if (outmode != VOIDmode && retval)
4077 if (mem_value)
4079 if (value == 0)
4080 value = mem_value;
4081 if (value != mem_value)
4082 emit_move_insn (value, mem_value);
4084 else if (value != 0)
4085 emit_move_insn (value, hard_libcall_value (outmode));
4086 else
4087 value = hard_libcall_value (outmode);
4090 if (ACCUMULATE_OUTGOING_ARGS)
4092 #ifdef REG_PARM_STACK_SPACE
4093 if (save_area)
4095 enum machine_mode save_mode = GET_MODE (save_area);
4096 #ifdef ARGS_GROW_DOWNWARD
4097 rtx stack_area
4098 = gen_rtx_MEM (save_mode,
4099 memory_address (save_mode,
4100 plus_constant (argblock,
4101 - high_to_save)));
4102 #else
4103 rtx stack_area
4104 = gen_rtx_MEM (save_mode,
4105 memory_address (save_mode,
4106 plus_constant (argblock, low_to_save)));
4107 #endif
4108 if (save_mode != BLKmode)
4109 emit_move_insn (stack_area, save_area);
4110 else
4111 emit_block_move (stack_area, validize_mem (save_area),
4112 GEN_INT (high_to_save - low_to_save + 1),
4113 PARM_BOUNDARY);
4115 #endif
4117 /* If we saved any argument areas, restore them. */
4118 for (count = 0; count < nargs; count++)
4119 if (argvec[count].save_area)
4121 enum machine_mode save_mode = GET_MODE (argvec[count].save_area);
4122 rtx stack_area
4123 = gen_rtx_MEM (save_mode,
4124 memory_address
4125 (save_mode,
4126 plus_constant (argblock,
4127 argvec[count].offset.constant)));
4129 emit_move_insn (stack_area, argvec[count].save_area);
4132 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
4133 stack_usage_map = initial_stack_usage_map;
4136 return value;
4140 /* Output a library call to function FUN (a SYMBOL_REF rtx)
4141 (emitting the queue unless NO_QUEUE is nonzero),
4142 for a value of mode OUTMODE,
4143 with NARGS different arguments, passed as alternating rtx values
4144 and machine_modes to convert them to.
4145 The rtx values should have been passed through protect_from_queue already.
4147 FN_TYPE will is zero for `normal' calls, one for `const' calls, wich
4148 which will be enclosed in REG_LIBCALL/REG_RETVAL notes and two for `pure'
4149 calls, that are handled like `const' calls with extra
4150 (use (memory (scratch)). */
4152 void
4153 emit_library_call VPARAMS((rtx orgfun, enum libcall_type fn_type,
4154 enum machine_mode outmode, int nargs, ...))
4156 #ifndef ANSI_PROTOTYPES
4157 rtx orgfun;
4158 int fn_type;
4159 enum machine_mode outmode;
4160 int nargs;
4161 #endif
4162 va_list p;
4164 VA_START (p, nargs);
4166 #ifndef ANSI_PROTOTYPES
4167 orgfun = va_arg (p, rtx);
4168 fn_type = va_arg (p, int);
4169 outmode = va_arg (p, enum machine_mode);
4170 nargs = va_arg (p, int);
4171 #endif
4173 emit_library_call_value_1 (0, orgfun, NULL_RTX, fn_type, outmode, nargs, p);
4175 va_end (p);
4178 /* Like emit_library_call except that an extra argument, VALUE,
4179 comes second and says where to store the result.
4180 (If VALUE is zero, this function chooses a convenient way
4181 to return the value.
4183 This function returns an rtx for where the value is to be found.
4184 If VALUE is nonzero, VALUE is returned. */
4187 emit_library_call_value VPARAMS((rtx orgfun, rtx value,
4188 enum libcall_type fn_type,
4189 enum machine_mode outmode, int nargs, ...))
4191 #ifndef ANSI_PROTOTYPES
4192 rtx orgfun;
4193 rtx value;
4194 int fn_type;
4195 enum machine_mode outmode;
4196 int nargs;
4197 #endif
4198 va_list p;
4200 VA_START (p, nargs);
4202 #ifndef ANSI_PROTOTYPES
4203 orgfun = va_arg (p, rtx);
4204 value = va_arg (p, rtx);
4205 fn_type = va_arg (p, int);
4206 outmode = va_arg (p, enum machine_mode);
4207 nargs = va_arg (p, int);
4208 #endif
4210 value = emit_library_call_value_1 (1, orgfun, value, fn_type, outmode, nargs, p);
4212 va_end (p);
4214 return value;
4217 #if 0
4218 /* Return an rtx which represents a suitable home on the stack
4219 given TYPE, the type of the argument looking for a home.
4220 This is called only for BLKmode arguments.
4222 SIZE is the size needed for this target.
4223 ARGS_ADDR is the address of the bottom of the argument block for this call.
4224 OFFSET describes this parameter's offset into ARGS_ADDR. It is meaningless
4225 if this machine uses push insns. */
4227 static rtx
4228 target_for_arg (type, size, args_addr, offset)
4229 tree type;
4230 rtx size;
4231 rtx args_addr;
4232 struct args_size offset;
4234 rtx target;
4235 rtx offset_rtx = ARGS_SIZE_RTX (offset);
4237 /* We do not call memory_address if possible,
4238 because we want to address as close to the stack
4239 as possible. For non-variable sized arguments,
4240 this will be stack-pointer relative addressing. */
4241 if (GET_CODE (offset_rtx) == CONST_INT)
4242 target = plus_constant (args_addr, INTVAL (offset_rtx));
4243 else
4245 /* I have no idea how to guarantee that this
4246 will work in the presence of register parameters. */
4247 target = gen_rtx_PLUS (Pmode, args_addr, offset_rtx);
4248 target = memory_address (QImode, target);
4251 return gen_rtx_MEM (BLKmode, target);
4253 #endif
4255 /* Store a single argument for a function call
4256 into the register or memory area where it must be passed.
4257 *ARG describes the argument value and where to pass it.
4259 ARGBLOCK is the address of the stack-block for all the arguments,
4260 or 0 on a machine where arguments are pushed individually.
4262 MAY_BE_ALLOCA nonzero says this could be a call to `alloca'
4263 so must be careful about how the stack is used.
4265 VARIABLE_SIZE nonzero says that this was a variable-sized outgoing
4266 argument stack. This is used if ACCUMULATE_OUTGOING_ARGS to indicate
4267 that we need not worry about saving and restoring the stack.
4269 FNDECL is the declaration of the function we are calling.
4271 Return non-zero if this arg should cause sibcall failure,
4272 zero otherwise. */
4274 static int
4275 store_one_arg (arg, argblock, flags, variable_size, reg_parm_stack_space)
4276 struct arg_data *arg;
4277 rtx argblock;
4278 int flags;
4279 int variable_size ATTRIBUTE_UNUSED;
4280 int reg_parm_stack_space;
4282 register tree pval = arg->tree_value;
4283 rtx reg = 0;
4284 int partial = 0;
4285 int used = 0;
4286 int i, lower_bound = 0, upper_bound = 0;
4287 int sibcall_failure = 0;
4289 if (TREE_CODE (pval) == ERROR_MARK)
4290 return 1;
4292 /* Push a new temporary level for any temporaries we make for
4293 this argument. */
4294 push_temp_slots ();
4296 if (ACCUMULATE_OUTGOING_ARGS && !(flags & ECF_SIBCALL))
4298 /* If this is being stored into a pre-allocated, fixed-size, stack area,
4299 save any previous data at that location. */
4300 if (argblock && ! variable_size && arg->stack)
4302 #ifdef ARGS_GROW_DOWNWARD
4303 /* stack_slot is negative, but we want to index stack_usage_map
4304 with positive values. */
4305 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
4306 upper_bound = -INTVAL (XEXP (XEXP (arg->stack_slot, 0), 1)) + 1;
4307 else
4308 upper_bound = 0;
4310 lower_bound = upper_bound - arg->size.constant;
4311 #else
4312 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
4313 lower_bound = INTVAL (XEXP (XEXP (arg->stack_slot, 0), 1));
4314 else
4315 lower_bound = 0;
4317 upper_bound = lower_bound + arg->size.constant;
4318 #endif
4320 for (i = lower_bound; i < upper_bound; i++)
4321 if (stack_usage_map[i]
4322 /* Don't store things in the fixed argument area at this point;
4323 it has already been saved. */
4324 && i > reg_parm_stack_space)
4325 break;
4327 if (i != upper_bound)
4329 /* We need to make a save area. See what mode we can make it. */
4330 enum machine_mode save_mode
4331 = mode_for_size (arg->size.constant * BITS_PER_UNIT, MODE_INT, 1);
4332 rtx stack_area
4333 = gen_rtx_MEM (save_mode,
4334 memory_address (save_mode,
4335 XEXP (arg->stack_slot, 0)));
4337 if (save_mode == BLKmode)
4339 arg->save_area = assign_stack_temp (BLKmode,
4340 arg->size.constant, 0);
4341 MEM_SET_IN_STRUCT_P (arg->save_area,
4342 AGGREGATE_TYPE_P (TREE_TYPE
4343 (arg->tree_value)));
4344 preserve_temp_slots (arg->save_area);
4345 emit_block_move (validize_mem (arg->save_area), stack_area,
4346 GEN_INT (arg->size.constant),
4347 PARM_BOUNDARY);
4349 else
4351 arg->save_area = gen_reg_rtx (save_mode);
4352 emit_move_insn (arg->save_area, stack_area);
4356 /* Now that we have saved any slots that will be overwritten by this
4357 store, mark all slots this store will use. We must do this before
4358 we actually expand the argument since the expansion itself may
4359 trigger library calls which might need to use the same stack slot. */
4360 if (argblock && ! variable_size && arg->stack)
4361 for (i = lower_bound; i < upper_bound; i++)
4362 stack_usage_map[i] = 1;
4365 /* If this isn't going to be placed on both the stack and in registers,
4366 set up the register and number of words. */
4367 if (! arg->pass_on_stack)
4368 reg = arg->reg, partial = arg->partial;
4370 if (reg != 0 && partial == 0)
4371 /* Being passed entirely in a register. We shouldn't be called in
4372 this case. */
4373 abort ();
4375 /* If this arg needs special alignment, don't load the registers
4376 here. */
4377 if (arg->n_aligned_regs != 0)
4378 reg = 0;
4380 /* If this is being passed partially in a register, we can't evaluate
4381 it directly into its stack slot. Otherwise, we can. */
4382 if (arg->value == 0)
4384 /* stack_arg_under_construction is nonzero if a function argument is
4385 being evaluated directly into the outgoing argument list and
4386 expand_call must take special action to preserve the argument list
4387 if it is called recursively.
4389 For scalar function arguments stack_usage_map is sufficient to
4390 determine which stack slots must be saved and restored. Scalar
4391 arguments in general have pass_on_stack == 0.
4393 If this argument is initialized by a function which takes the
4394 address of the argument (a C++ constructor or a C function
4395 returning a BLKmode structure), then stack_usage_map is
4396 insufficient and expand_call must push the stack around the
4397 function call. Such arguments have pass_on_stack == 1.
4399 Note that it is always safe to set stack_arg_under_construction,
4400 but this generates suboptimal code if set when not needed. */
4402 if (arg->pass_on_stack)
4403 stack_arg_under_construction++;
4405 arg->value = expand_expr (pval,
4406 (partial
4407 || TYPE_MODE (TREE_TYPE (pval)) != arg->mode)
4408 ? NULL_RTX : arg->stack,
4409 VOIDmode, 0);
4411 /* If we are promoting object (or for any other reason) the mode
4412 doesn't agree, convert the mode. */
4414 if (arg->mode != TYPE_MODE (TREE_TYPE (pval)))
4415 arg->value = convert_modes (arg->mode, TYPE_MODE (TREE_TYPE (pval)),
4416 arg->value, arg->unsignedp);
4418 if (arg->pass_on_stack)
4419 stack_arg_under_construction--;
4422 /* Don't allow anything left on stack from computation
4423 of argument to alloca. */
4424 if (flags & ECF_MAY_BE_ALLOCA)
4425 do_pending_stack_adjust ();
4427 if (arg->value == arg->stack)
4429 /* If the value is already in the stack slot, we are done. */
4430 if (current_function_check_memory_usage && GET_CODE (arg->stack) == MEM)
4432 emit_library_call (chkr_set_right_libfunc, LCT_CONST_MAKE_BLOCK,
4433 VOIDmode, 3, XEXP (arg->stack, 0), Pmode,
4434 ARGS_SIZE_RTX (arg->size),
4435 TYPE_MODE (sizetype),
4436 GEN_INT (MEMORY_USE_RW),
4437 TYPE_MODE (integer_type_node));
4440 else if (arg->mode != BLKmode)
4442 register int size;
4444 /* Argument is a scalar, not entirely passed in registers.
4445 (If part is passed in registers, arg->partial says how much
4446 and emit_push_insn will take care of putting it there.)
4448 Push it, and if its size is less than the
4449 amount of space allocated to it,
4450 also bump stack pointer by the additional space.
4451 Note that in C the default argument promotions
4452 will prevent such mismatches. */
4454 size = GET_MODE_SIZE (arg->mode);
4455 /* Compute how much space the push instruction will push.
4456 On many machines, pushing a byte will advance the stack
4457 pointer by a halfword. */
4458 #ifdef PUSH_ROUNDING
4459 size = PUSH_ROUNDING (size);
4460 #endif
4461 used = size;
4463 /* Compute how much space the argument should get:
4464 round up to a multiple of the alignment for arguments. */
4465 if (none != FUNCTION_ARG_PADDING (arg->mode, TREE_TYPE (pval)))
4466 used = (((size + PARM_BOUNDARY / BITS_PER_UNIT - 1)
4467 / (PARM_BOUNDARY / BITS_PER_UNIT))
4468 * (PARM_BOUNDARY / BITS_PER_UNIT));
4470 /* This isn't already where we want it on the stack, so put it there.
4471 This can either be done with push or copy insns. */
4472 emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval), NULL_RTX, 0,
4473 partial, reg, used - size, argblock,
4474 ARGS_SIZE_RTX (arg->offset), reg_parm_stack_space,
4475 ARGS_SIZE_RTX (arg->alignment_pad));
4477 else
4479 /* BLKmode, at least partly to be pushed. */
4481 register int excess;
4482 rtx size_rtx;
4484 /* Pushing a nonscalar.
4485 If part is passed in registers, PARTIAL says how much
4486 and emit_push_insn will take care of putting it there. */
4488 /* Round its size up to a multiple
4489 of the allocation unit for arguments. */
4491 if (arg->size.var != 0)
4493 excess = 0;
4494 size_rtx = ARGS_SIZE_RTX (arg->size);
4496 else
4498 /* PUSH_ROUNDING has no effect on us, because
4499 emit_push_insn for BLKmode is careful to avoid it. */
4500 excess = (arg->size.constant - int_size_in_bytes (TREE_TYPE (pval))
4501 + partial * UNITS_PER_WORD);
4502 size_rtx = expr_size (pval);
4505 if ((flags & ECF_SIBCALL) && GET_CODE (arg->value) == MEM)
4507 /* emit_push_insn might not work properly if arg->value and
4508 argblock + arg->offset areas overlap. */
4509 rtx x = arg->value;
4510 int i = 0;
4512 if (XEXP (x, 0) == current_function_internal_arg_pointer
4513 || (GET_CODE (XEXP (x, 0)) == PLUS
4514 && XEXP (XEXP (x, 0), 0) ==
4515 current_function_internal_arg_pointer
4516 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT))
4518 if (XEXP (x, 0) != current_function_internal_arg_pointer)
4519 i = INTVAL (XEXP (XEXP (x, 0), 1));
4521 /* expand_call should ensure this */
4522 if (arg->offset.var || GET_CODE (size_rtx) != CONST_INT)
4523 abort ();
4525 if (arg->offset.constant > i)
4527 if (arg->offset.constant < i + INTVAL (size_rtx))
4528 sibcall_failure = 1;
4530 else if (arg->offset.constant < i)
4532 if (i < arg->offset.constant + INTVAL (size_rtx))
4533 sibcall_failure = 1;
4538 emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval), size_rtx,
4539 TYPE_ALIGN (TREE_TYPE (pval)), partial, reg, excess,
4540 argblock, ARGS_SIZE_RTX (arg->offset),
4541 reg_parm_stack_space,
4542 ARGS_SIZE_RTX (arg->alignment_pad));
4545 /* Unless this is a partially-in-register argument, the argument is now
4546 in the stack.
4548 ??? Note that this can change arg->value from arg->stack to
4549 arg->stack_slot and it matters when they are not the same.
4550 It isn't totally clear that this is correct in all cases. */
4551 if (partial == 0)
4552 arg->value = arg->stack_slot;
4554 /* Once we have pushed something, pops can't safely
4555 be deferred during the rest of the arguments. */
4556 NO_DEFER_POP;
4558 /* ANSI doesn't require a sequence point here,
4559 but PCC has one, so this will avoid some problems. */
4560 emit_queue ();
4562 /* Free any temporary slots made in processing this argument. Show
4563 that we might have taken the address of something and pushed that
4564 as an operand. */
4565 preserve_temp_slots (NULL_RTX);
4566 free_temp_slots ();
4567 pop_temp_slots ();
4569 return sibcall_failure;