gcc/calls.c
1 /* Convert function calls to rtl insns, for GNU C compiler.
2 Copyright (C) 1989-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "predict.h"
29 #include "memmodel.h"
30 #include "tm_p.h"
31 #include "stringpool.h"
32 #include "expmed.h"
33 #include "optabs.h"
34 #include "emit-rtl.h"
35 #include "cgraph.h"
36 #include "diagnostic-core.h"
37 #include "fold-const.h"
38 #include "stor-layout.h"
39 #include "varasm.h"
40 #include "internal-fn.h"
41 #include "dojump.h"
42 #include "explow.h"
43 #include "calls.h"
44 #include "expr.h"
45 #include "output.h"
46 #include "langhooks.h"
47 #include "except.h"
48 #include "dbgcnt.h"
49 #include "rtl-iter.h"
50 #include "tree-vrp.h"
51 #include "tree-ssanames.h"
52 #include "tree-ssa-strlen.h"
53 #include "intl.h"
54 #include "stringpool.h"
55 #include "attribs.h"
56 #include "builtins.h"
57 #include "gimple-fold.h"
59 /* Like PREFERRED_STACK_BOUNDARY but in units of bytes, not bits. */
60 #define STACK_BYTES (PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT)
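/* Editorial illustration (not part of the original source): STACK_BYTES is
   the preferred stack boundary expressed in bytes.  For instance, on a
   target where PREFERRED_STACK_BOUNDARY is 128 and BITS_PER_UNIT is 8,
   STACK_BYTES is 16, so a 20-byte argument block is padded to 32 bytes by
   the usual rounding, e.g.

     size = ROUND_UP (size, STACK_BYTES);   /* hypothetical use */

   The actual call sites that perform this rounding vary; ROUND_UP is the
   generic rounding macro from system.h.  */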
62 /* Data structure and subroutines used within expand_call. */
64 struct arg_data
66 /* Tree node for this argument. */
67 tree tree_value;
68 /* Mode for value; TYPE_MODE unless promoted. */
69 machine_mode mode;
70 /* Current RTL value for argument, or 0 if it isn't precomputed. */
71 rtx value;
72 /* Initially-computed RTL value for argument; only for const functions. */
73 rtx initial_value;
74 /* Register to pass this argument in, 0 if passed on stack, or a
75 PARALLEL if the arg is to be copied into multiple non-contiguous
76 registers. */
77 rtx reg;
78 /* Register to pass this argument in when generating tail call sequence.
79 This is not the same register as for normal calls on machines with
80 register windows. */
81 rtx tail_call_reg;
82 /* If REG is a PARALLEL, this is a copy of VALUE pulled into the correct
83 form for emit_group_move. */
84 rtx parallel_value;
85 /* If value is passed in neither reg nor stack, this field holds a number
86 of a special slot to be used. */
87 rtx special_slot;
88 /* For pointer bounds, holds the index of the parm the bounds are bound to.
89 -1 if there is no such pointer. */
90 int pointer_arg;
91 /* If pointer_arg refers to a structure, then pointer_offset holds an offset
92 of a pointer in this structure. */
93 int pointer_offset;
94 /* If REG was promoted from the actual mode of the argument expression,
95 indicates whether the promotion is sign- or zero-extended. */
96 int unsignedp;
97 /* Number of bytes to put in registers. 0 means put the whole arg
98 in registers. Also 0 if not passed in registers. */
99 int partial;
100 /* Nonzero if argument must be passed on stack.
101 Note that some arguments may be passed on the stack
102 even though pass_on_stack is zero, just because FUNCTION_ARG says so.
103 pass_on_stack identifies arguments that *cannot* go in registers. */
104 int pass_on_stack;
105 /* Some fields packaged up for locate_and_pad_parm. */
106 struct locate_and_pad_arg_data locate;
107 /* Location on the stack at which parameter should be stored. The store
108 has already been done if STACK == VALUE. */
109 rtx stack;
110 /* Location on the stack of the start of this argument slot. This can
111 differ from STACK if this arg pads downward. This location is known
112 to be aligned to TARGET_FUNCTION_ARG_BOUNDARY. */
113 rtx stack_slot;
114 /* Place that this stack area has been saved, if needed. */
115 rtx save_area;
116 /* If an argument's alignment does not permit direct copying into registers,
117 copy in smaller-sized pieces into pseudos. These are stored in a
118 block pointed to by this field. The next field says how many
119 word-sized pseudos we made. */
120 rtx *aligned_regs;
121 int n_aligned_regs;
124 /* A vector of one char per byte of stack space. A byte is nonzero if
125 the corresponding stack location has been used.
126 This vector is used to prevent a function call within an argument from
127 clobbering any stack already set up. */
128 static char *stack_usage_map;
130 /* Size of STACK_USAGE_MAP. */
131 static unsigned int highest_outgoing_arg_in_use;
133 /* Assume that any stack location at this byte index is used,
134 without checking the contents of stack_usage_map. */
135 static unsigned HOST_WIDE_INT stack_usage_watermark = HOST_WIDE_INT_M1U;
137 /* A bitmap of virtual-incoming stack space. Bit is set if the corresponding
138 stack location's tail call argument has been already stored into the stack.
139 This bitmap is used to prevent sibling call optimization if function tries
140 to use parent's incoming argument slots when they have been already
141 overwritten with tail call arguments. */
142 static sbitmap stored_args_map;
144 /* Assume that any virtual-incoming location at this byte index has been
145 stored, without checking the contents of stored_args_map. */
146 static unsigned HOST_WIDE_INT stored_args_watermark;
148 /* stack_arg_under_construction is nonzero when an argument may be
149 initialized with a constructor call (including a C function that
150 returns a BLKmode struct) and expand_call must take special action
151 to make sure the object being constructed does not overlap the
152 argument list for the constructor call. */
153 static int stack_arg_under_construction;
155 static void precompute_register_parameters (int, struct arg_data *, int *);
156 static int store_one_arg (struct arg_data *, rtx, int, int, int);
157 static void store_unaligned_arguments_into_pseudos (struct arg_data *, int);
158 static int finalize_must_preallocate (int, int, struct arg_data *,
159 struct args_size *);
160 static void precompute_arguments (int, struct arg_data *);
161 static void compute_argument_addresses (struct arg_data *, rtx, int);
162 static rtx rtx_for_function_call (tree, tree);
163 static void load_register_parameters (struct arg_data *, int, rtx *, int,
164 int, int *);
165 static int special_function_p (const_tree, int);
166 static int check_sibcall_argument_overlap_1 (rtx);
167 static int check_sibcall_argument_overlap (rtx_insn *, struct arg_data *, int);
169 static tree split_complex_types (tree);
171 #ifdef REG_PARM_STACK_SPACE
172 static rtx save_fixed_argument_area (int, rtx, int *, int *);
173 static void restore_fixed_argument_area (rtx, rtx, int, int);
174 #endif
176 /* Return true if bytes [LOWER_BOUND, UPPER_BOUND) of the outgoing
177 stack region might already be in use. */
179 static bool
180 stack_region_maybe_used_p (poly_uint64 lower_bound, poly_uint64 upper_bound,
181 unsigned int reg_parm_stack_space)
183 unsigned HOST_WIDE_INT const_lower, const_upper;
184 const_lower = constant_lower_bound (lower_bound);
185 if (!upper_bound.is_constant (&const_upper))
186 const_upper = HOST_WIDE_INT_M1U;
188 if (const_upper > stack_usage_watermark)
189 return true;
191 /* Don't worry about things in the fixed argument area;
192 it has already been saved. */
193 const_lower = MAX (const_lower, reg_parm_stack_space);
194 const_upper = MIN (const_upper, highest_outgoing_arg_in_use);
195 for (unsigned HOST_WIDE_INT i = const_lower; i < const_upper; ++i)
196 if (stack_usage_map[i])
197 return true;
198 return false;
201 /* Record that bytes [LOWER_BOUND, UPPER_BOUND) of the outgoing
202 stack region are now in use. */
204 static void
205 mark_stack_region_used (poly_uint64 lower_bound, poly_uint64 upper_bound)
207 unsigned HOST_WIDE_INT const_lower, const_upper;
208 const_lower = constant_lower_bound (lower_bound);
209 if (upper_bound.is_constant (&const_upper))
210 for (unsigned HOST_WIDE_INT i = const_lower; i < const_upper; ++i)
211 stack_usage_map[i] = 1;
212 else
213 stack_usage_watermark = MIN (stack_usage_watermark, const_lower);
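/* Editorial sketch (not in the original source): the two helpers above are
   intended as a check-then-record pair.  A caller about to store an
   argument into bytes [LOWER, UPPER) of the outgoing area first asks
   whether the region might already be live, deals with any overlap, and
   then records its own use:

     if (stack_region_maybe_used_p (lower, upper, reg_parm_stack_space))
       ... save the region or otherwise avoid clobbering it ...
     mark_stack_region_used (lower, upper);

   store_one_arg and the fixed-argument-area code later in this file
   follow this pattern.  */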
216 /* Force FUNEXP into a form suitable for the address of a CALL,
217 and return that as an rtx. Also load the static chain register
218 if FNDECL is a nested function.
220 CALL_FUSAGE points to a variable holding the prospective
221 CALL_INSN_FUNCTION_USAGE information. */
223 rtx
224 prepare_call_address (tree fndecl_or_type, rtx funexp, rtx static_chain_value,
225 rtx *call_fusage, int reg_parm_seen, int flags)
227 /* Make a valid memory address and copy constants through pseudo-regs,
228 but not for a constant address if -fno-function-cse. */
229 if (GET_CODE (funexp) != SYMBOL_REF)
231 /* If it's an indirect call by descriptor, generate code to perform
232 runtime identification of the pointer and load the descriptor. */
233 if ((flags & ECF_BY_DESCRIPTOR) && !flag_trampolines)
235 const int bit_val = targetm.calls.custom_function_descriptors;
236 rtx call_lab = gen_label_rtx ();
238 gcc_assert (fndecl_or_type && TYPE_P (fndecl_or_type));
239 fndecl_or_type
240 = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL, NULL_TREE,
241 fndecl_or_type);
242 DECL_STATIC_CHAIN (fndecl_or_type) = 1;
243 rtx chain = targetm.calls.static_chain (fndecl_or_type, false);
245 if (GET_MODE (funexp) != Pmode)
246 funexp = convert_memory_address (Pmode, funexp);
248 /* Avoid long live ranges around function calls. */
249 funexp = copy_to_mode_reg (Pmode, funexp);
251 if (REG_P (chain))
252 emit_insn (gen_rtx_CLOBBER (VOIDmode, chain));
254 /* Emit the runtime identification pattern. */
255 rtx mask = gen_rtx_AND (Pmode, funexp, GEN_INT (bit_val));
256 emit_cmp_and_jump_insns (mask, const0_rtx, EQ, NULL_RTX, Pmode, 1,
257 call_lab);
259 /* Statically predict the branch to very likely taken. */
260 rtx_insn *insn = get_last_insn ();
261 if (JUMP_P (insn))
262 predict_insn_def (insn, PRED_BUILTIN_EXPECT, TAKEN);
264 /* Load the descriptor. */
265 rtx mem = gen_rtx_MEM (ptr_mode,
266 plus_constant (Pmode, funexp, - bit_val));
267 MEM_NOTRAP_P (mem) = 1;
268 mem = convert_memory_address (Pmode, mem);
269 emit_move_insn (chain, mem);
271 mem = gen_rtx_MEM (ptr_mode,
272 plus_constant (Pmode, funexp,
273 POINTER_SIZE / BITS_PER_UNIT
274 - bit_val));
275 MEM_NOTRAP_P (mem) = 1;
276 mem = convert_memory_address (Pmode, mem);
277 emit_move_insn (funexp, mem);
279 emit_label (call_lab);
281 if (REG_P (chain))
283 use_reg (call_fusage, chain);
284 STATIC_CHAIN_REG_P (chain) = 1;
287 /* Make sure we're not going to be overwritten below. */
288 gcc_assert (!static_chain_value);
291 /* If we are using registers for parameters, force the
292 function address into a register now. */
293 funexp = ((reg_parm_seen
294 && targetm.small_register_classes_for_mode_p (FUNCTION_MODE))
295 ? force_not_mem (memory_address (FUNCTION_MODE, funexp))
296 : memory_address (FUNCTION_MODE, funexp));
298 else
300 /* funexp could be a SYMBOL_REF that represents a function pointer which is
301 of ptr_mode. In this case, it should be converted into address mode
302 to be a valid address for memory rtx pattern. See PR 64971. */
303 if (GET_MODE (funexp) != Pmode)
304 funexp = convert_memory_address (Pmode, funexp);
306 if (!(flags & ECF_SIBCALL))
308 if (!NO_FUNCTION_CSE && optimize && ! flag_no_function_cse)
309 funexp = force_reg (Pmode, funexp);
313 if (static_chain_value != 0
314 && (TREE_CODE (fndecl_or_type) != FUNCTION_DECL
315 || DECL_STATIC_CHAIN (fndecl_or_type)))
317 rtx chain;
319 chain = targetm.calls.static_chain (fndecl_or_type, false);
320 static_chain_value = convert_memory_address (Pmode, static_chain_value);
322 emit_move_insn (chain, static_chain_value);
323 if (REG_P (chain))
325 use_reg (call_fusage, chain);
326 STATIC_CHAIN_REG_P (chain) = 1;
330 return funexp;
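/* Editorial note (not in the original source): expand_call, later in this
   file, uses this roughly as

     funexp = rtx_for_function_call (fndecl, addr);
     funexp = prepare_call_address (fndecl ? fndecl : fntype, funexp,
                                    static_chain_value, &call_fusage,
                                    reg_parm_seen, flags);

   before handing FUNEXP to emit_call_1 below.  The sketch is approximate;
   the argument names follow expand_call.  */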
333 /* Generate instructions to call function FUNEXP,
334 and optionally pop the results.
335 The CALL_INSN is the first insn generated.
337 FNDECL is the declaration node of the function. This is given to the
338 hook TARGET_RETURN_POPS_ARGS to determine whether this function pops
339 its own args.
341 FUNTYPE is the data type of the function. This is given to the hook
342 TARGET_RETURN_POPS_ARGS to determine whether this function pops its
343 own args. We used to allow an identifier for library functions, but
344 that doesn't work when the return type is an aggregate type and the
345 calling convention says that the pointer to this aggregate is to be
346 popped by the callee.
348 STACK_SIZE is the number of bytes of arguments on the stack,
349 ROUNDED_STACK_SIZE is that number rounded up to
350 PREFERRED_STACK_BOUNDARY; zero if the size is variable. This is
351 both to put into the call insn and to generate explicit popping
352 code if necessary.
354 STRUCT_VALUE_SIZE is the number of bytes wanted in a structure value.
355 It is zero if this call doesn't want a structure value.
357 NEXT_ARG_REG is the rtx that results from executing
358 targetm.calls.function_arg (&args_so_far, VOIDmode, void_type_node, true)
359 just after all the args have had their registers assigned.
360 This could be whatever you like, but normally it is the first
361 arg-register beyond those used for args in this call,
362 or 0 if all the arg-registers are used in this call.
363 It is passed on to `gen_call' so you can put this info in the call insn.
365 VALREG is a hard register in which a value is returned,
366 or 0 if the call does not return a value.
368 OLD_INHIBIT_DEFER_POP is the value that `inhibit_defer_pop' had before
369 the args to this call were processed.
370 We restore `inhibit_defer_pop' to that value.
372 CALL_FUSAGE is either empty or an EXPR_LIST of USE expressions that
373 denote registers used by the called function. */
375 static void
376 emit_call_1 (rtx funexp, tree fntree ATTRIBUTE_UNUSED, tree fndecl ATTRIBUTE_UNUSED,
377 tree funtype ATTRIBUTE_UNUSED,
378 poly_int64 stack_size ATTRIBUTE_UNUSED,
379 poly_int64 rounded_stack_size,
380 poly_int64 struct_value_size ATTRIBUTE_UNUSED,
381 rtx next_arg_reg ATTRIBUTE_UNUSED, rtx valreg,
382 int old_inhibit_defer_pop, rtx call_fusage, int ecf_flags,
383 cumulative_args_t args_so_far ATTRIBUTE_UNUSED)
385 rtx rounded_stack_size_rtx = gen_int_mode (rounded_stack_size, Pmode);
386 rtx call, funmem, pat;
387 int already_popped = 0;
388 poly_int64 n_popped = 0;
390 /* Sibling call patterns never pop arguments (no sibcall(_value)_pop
391 patterns exist). Any popping that the callee does on return will
392 be from our caller's frame rather than ours. */
393 if (!(ecf_flags & ECF_SIBCALL))
395 n_popped += targetm.calls.return_pops_args (fndecl, funtype, stack_size);
397 #ifdef CALL_POPS_ARGS
398 n_popped += CALL_POPS_ARGS (*get_cumulative_args (args_so_far));
399 #endif
402 /* Ensure address is valid. SYMBOL_REF is already valid, so no need,
403 and we don't want to load it into a register as an optimization,
404 because prepare_call_address already did it if it should be done. */
405 if (GET_CODE (funexp) != SYMBOL_REF)
406 funexp = memory_address (FUNCTION_MODE, funexp);
408 funmem = gen_rtx_MEM (FUNCTION_MODE, funexp);
409 if (fndecl && TREE_CODE (fndecl) == FUNCTION_DECL)
411 tree t = fndecl;
413 /* Although a built-in FUNCTION_DECL and its non-__builtin
414 counterpart compare equal and get a shared mem_attrs, they
415 produce different dump output in compare-debug compilations,
416 if an entry gets garbage collected in one compilation, then
417 adds a different (but equivalent) entry, while the other
418 doesn't run the garbage collector at the same spot and then
419 shares the mem_attr with the equivalent entry. */
420 if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL)
422 tree t2 = builtin_decl_explicit (DECL_FUNCTION_CODE (t));
423 if (t2)
424 t = t2;
427 set_mem_expr (funmem, t);
429 else if (fntree)
430 set_mem_expr (funmem, build_simple_mem_ref (CALL_EXPR_FN (fntree)));
432 if (ecf_flags & ECF_SIBCALL)
434 if (valreg)
435 pat = targetm.gen_sibcall_value (valreg, funmem,
436 rounded_stack_size_rtx,
437 next_arg_reg, NULL_RTX);
438 else
439 pat = targetm.gen_sibcall (funmem, rounded_stack_size_rtx,
440 next_arg_reg,
441 gen_int_mode (struct_value_size, Pmode));
443 /* If the target has "call" or "call_value" insns, then prefer them
444 if no arguments are actually popped. If the target does not have
445 "call" or "call_value" insns, then we must use the popping versions
446 even if the call has no arguments to pop. */
447 else if (maybe_ne (n_popped, 0)
448 || !(valreg
449 ? targetm.have_call_value ()
450 : targetm.have_call ()))
452 rtx n_pop = gen_int_mode (n_popped, Pmode);
454 /* If this subroutine pops its own args, record that in the call insn
455 if possible, for the sake of frame pointer elimination. */
457 if (valreg)
458 pat = targetm.gen_call_value_pop (valreg, funmem,
459 rounded_stack_size_rtx,
460 next_arg_reg, n_pop);
461 else
462 pat = targetm.gen_call_pop (funmem, rounded_stack_size_rtx,
463 next_arg_reg, n_pop);
465 already_popped = 1;
467 else
469 if (valreg)
470 pat = targetm.gen_call_value (valreg, funmem, rounded_stack_size_rtx,
471 next_arg_reg, NULL_RTX);
472 else
473 pat = targetm.gen_call (funmem, rounded_stack_size_rtx, next_arg_reg,
474 gen_int_mode (struct_value_size, Pmode));
476 emit_insn (pat);
478 /* Find the call we just emitted. */
479 rtx_call_insn *call_insn = last_call_insn ();
481 /* Some targets create a fresh MEM instead of reusing the one provided
482 above. Set its MEM_EXPR. */
483 call = get_call_rtx_from (call_insn);
484 if (call
485 && MEM_EXPR (XEXP (call, 0)) == NULL_TREE
486 && MEM_EXPR (funmem) != NULL_TREE)
487 set_mem_expr (XEXP (call, 0), MEM_EXPR (funmem));
489 /* Put the register usage information there. */
490 add_function_usage_to (call_insn, call_fusage);
492 /* If this is a const call, then set the insn's unchanging bit. */
493 if (ecf_flags & ECF_CONST)
494 RTL_CONST_CALL_P (call_insn) = 1;
496 /* If this is a pure call, then set the insn's unchanging bit. */
497 if (ecf_flags & ECF_PURE)
498 RTL_PURE_CALL_P (call_insn) = 1;
500 /* If this is a const call, then set the insn's unchanging bit. */
501 if (ecf_flags & ECF_LOOPING_CONST_OR_PURE)
502 RTL_LOOPING_CONST_OR_PURE_CALL_P (call_insn) = 1;
504 /* Create a nothrow REG_EH_REGION note, if needed. */
505 make_reg_eh_region_note (call_insn, ecf_flags, 0);
507 if (ecf_flags & ECF_NORETURN)
508 add_reg_note (call_insn, REG_NORETURN, const0_rtx);
510 if (ecf_flags & ECF_RETURNS_TWICE)
512 add_reg_note (call_insn, REG_SETJMP, const0_rtx);
513 cfun->calls_setjmp = 1;
516 SIBLING_CALL_P (call_insn) = ((ecf_flags & ECF_SIBCALL) != 0);
518 /* Restore this now, so that we do defer pops for this call's args
519 if the context of the call as a whole permits. */
520 inhibit_defer_pop = old_inhibit_defer_pop;
522 if (maybe_ne (n_popped, 0))
524 if (!already_popped)
525 CALL_INSN_FUNCTION_USAGE (call_insn)
526 = gen_rtx_EXPR_LIST (VOIDmode,
527 gen_rtx_CLOBBER (VOIDmode, stack_pointer_rtx),
528 CALL_INSN_FUNCTION_USAGE (call_insn));
529 rounded_stack_size -= n_popped;
530 rounded_stack_size_rtx = gen_int_mode (rounded_stack_size, Pmode);
531 stack_pointer_delta -= n_popped;
533 add_args_size_note (call_insn, stack_pointer_delta);
535 /* If popping is needed, stack realign must use DRAP. */
536 if (SUPPORTS_STACK_ALIGNMENT)
537 crtl->need_drap = true;
539 /* For noreturn calls when not accumulating outgoing args force
540 REG_ARGS_SIZE note to prevent crossjumping of calls with different
541 args sizes. */
542 else if (!ACCUMULATE_OUTGOING_ARGS && (ecf_flags & ECF_NORETURN) != 0)
543 add_args_size_note (call_insn, stack_pointer_delta);
545 if (!ACCUMULATE_OUTGOING_ARGS)
547 /* If returning from the subroutine does not automatically pop the args,
548 we need an instruction to pop them sooner or later.
549 Perhaps do it now; perhaps just record how much space to pop later.
551 If returning from the subroutine does pop the args, indicate that the
552 stack pointer will be changed. */
554 if (maybe_ne (rounded_stack_size, 0))
556 if (ecf_flags & ECF_NORETURN)
557 /* Just pretend we did the pop. */
558 stack_pointer_delta -= rounded_stack_size;
559 else if (flag_defer_pop && inhibit_defer_pop == 0
560 && ! (ecf_flags & (ECF_CONST | ECF_PURE)))
561 pending_stack_adjust += rounded_stack_size;
562 else
563 adjust_stack (rounded_stack_size_rtx);
566 /* When we accumulate outgoing args, we must avoid any stack manipulations.
567 Restore the stack pointer to its original value now. Usually
568 ACCUMULATE_OUTGOING_ARGS targets don't get here, but there are exceptions.
569 On i386 ACCUMULATE_OUTGOING_ARGS can be enabled on demand, and
570 popping variants of functions exist as well.
572 ??? We may optimize similar to defer_pop above, but it is
573 probably not worthwhile.
575 ??? It will be worthwhile to enable combine_stack_adjustments even for
576 such machines. */
577 else if (maybe_ne (n_popped, 0))
578 anti_adjust_stack (gen_int_mode (n_popped, Pmode));
581 /* Determine if the function identified by FNDECL is one with
582 special properties we wish to know about. Modify FLAGS accordingly.
584 For example, if the function might return more than one time (setjmp), then
585 set ECF_RETURNS_TWICE.
587 Set ECF_MAY_BE_ALLOCA for any memory allocation function that might allocate
588 space from the stack such as alloca. */
590 static int
591 special_function_p (const_tree fndecl, int flags)
593 tree name_decl = DECL_NAME (fndecl);
595 if (fndecl && name_decl
596 && IDENTIFIER_LENGTH (name_decl) <= 11
597 /* Exclude functions not at the file scope, or not `extern',
598 since they are not the magic functions we would otherwise
599 think they are.
600 FIXME: this should be handled with attributes, not with this
601 hacky imitation of DECL_ASSEMBLER_NAME. It's (also) wrong
602 because you can declare fork() inside a function if you
603 wish. */
604 && (DECL_CONTEXT (fndecl) == NULL_TREE
605 || TREE_CODE (DECL_CONTEXT (fndecl)) == TRANSLATION_UNIT_DECL)
606 && TREE_PUBLIC (fndecl))
608 const char *name = IDENTIFIER_POINTER (name_decl);
609 const char *tname = name;
611 /* We assume that alloca will always be called by name. It
612 makes no sense to pass it as a pointer-to-function to
613 anything that does not understand its behavior. */
614 if (IDENTIFIER_LENGTH (name_decl) == 6
615 && name[0] == 'a'
616 && ! strcmp (name, "alloca"))
617 flags |= ECF_MAY_BE_ALLOCA;
619 /* Disregard prefix _ or __. */
620 if (name[0] == '_')
622 if (name[1] == '_')
623 tname += 2;
624 else
625 tname += 1;
628 /* ECF_RETURNS_TWICE is safe even for -ffreestanding. */
629 if (! strcmp (tname, "setjmp")
630 || ! strcmp (tname, "sigsetjmp")
631 || ! strcmp (name, "savectx")
632 || ! strcmp (name, "vfork")
633 || ! strcmp (name, "getcontext"))
634 flags |= ECF_RETURNS_TWICE;
637 if (DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL
638 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (fndecl)))
639 flags |= ECF_MAY_BE_ALLOCA;
641 return flags;
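/* Editorial example (not in the original source): with the heuristics
   above, a file-scope declaration such as

     extern pid_t vfork (void);

   gets ECF_RETURNS_TWICE at its call sites, and a call to a function the
   user happened to name "alloca" (length 6, extern, file scope) gets
   ECF_MAY_BE_ALLOCA, in addition to the builtin alloca variants handled
   at the end of the function.  */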
644 /* Similar to special_function_p; return a set of ERF_ flags for the
645 function FNDECL. */
646 static int
647 decl_return_flags (tree fndecl)
649 tree attr;
650 tree type = TREE_TYPE (fndecl);
651 if (!type)
652 return 0;
654 attr = lookup_attribute ("fn spec", TYPE_ATTRIBUTES (type));
655 if (!attr)
656 return 0;
658 attr = TREE_VALUE (TREE_VALUE (attr));
659 if (!attr || TREE_STRING_LENGTH (attr) < 1)
660 return 0;
662 switch (TREE_STRING_POINTER (attr)[0])
664 case '1':
665 case '2':
666 case '3':
667 case '4':
668 return ERF_RETURNS_ARG | (TREE_STRING_POINTER (attr)[0] - '1');
670 case 'm':
671 return ERF_NOALIAS;
673 case '.':
674 default:
675 return 0;
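/* Editorial example (not in the original source): the "fn spec" attribute
   string decoded above encodes how the return value relates to the
   arguments.  A spec beginning with '1' (used, for example, for builtins
   known to return their first argument such as memcpy) yields
   ERF_RETURNS_ARG | 0, a leading 'm' (malloc-like result) yields
   ERF_NOALIAS, and '.' or anything else yields 0.  */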
679 /* Return nonzero when FNDECL represents a call to setjmp. */
681 int
682 setjmp_call_p (const_tree fndecl)
684 if (DECL_IS_RETURNS_TWICE (fndecl))
685 return ECF_RETURNS_TWICE;
686 return special_function_p (fndecl, 0) & ECF_RETURNS_TWICE;
690 /* Return true if STMT may be an alloca call. */
692 bool
693 gimple_maybe_alloca_call_p (const gimple *stmt)
695 tree fndecl;
697 if (!is_gimple_call (stmt))
698 return false;
700 fndecl = gimple_call_fndecl (stmt);
701 if (fndecl && (special_function_p (fndecl, 0) & ECF_MAY_BE_ALLOCA))
702 return true;
704 return false;
707 /* Return true if STMT is a builtin alloca call. */
709 bool
710 gimple_alloca_call_p (const gimple *stmt)
712 tree fndecl;
714 if (!is_gimple_call (stmt))
715 return false;
717 fndecl = gimple_call_fndecl (stmt);
718 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
719 switch (DECL_FUNCTION_CODE (fndecl))
721 CASE_BUILT_IN_ALLOCA:
722 return gimple_call_num_args (stmt) > 0;
723 default:
724 break;
727 return false;
730 /* Return true when exp contains a builtin alloca call. */
732 bool
733 alloca_call_p (const_tree exp)
735 tree fndecl;
736 if (TREE_CODE (exp) == CALL_EXPR
737 && (fndecl = get_callee_fndecl (exp))
738 && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
739 switch (DECL_FUNCTION_CODE (fndecl))
741 CASE_BUILT_IN_ALLOCA:
742 return true;
743 default:
744 break;
747 return false;
750 /* Return TRUE if FNDECL is either a TM builtin or a TM cloned
751 function. Return FALSE otherwise. */
753 static bool
754 is_tm_builtin (const_tree fndecl)
756 if (fndecl == NULL)
757 return false;
759 if (decl_is_tm_clone (fndecl))
760 return true;
762 if (DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
764 switch (DECL_FUNCTION_CODE (fndecl))
766 case BUILT_IN_TM_COMMIT:
767 case BUILT_IN_TM_COMMIT_EH:
768 case BUILT_IN_TM_ABORT:
769 case BUILT_IN_TM_IRREVOCABLE:
770 case BUILT_IN_TM_GETTMCLONE_IRR:
771 case BUILT_IN_TM_MEMCPY:
772 case BUILT_IN_TM_MEMMOVE:
773 case BUILT_IN_TM_MEMSET:
774 CASE_BUILT_IN_TM_STORE (1):
775 CASE_BUILT_IN_TM_STORE (2):
776 CASE_BUILT_IN_TM_STORE (4):
777 CASE_BUILT_IN_TM_STORE (8):
778 CASE_BUILT_IN_TM_STORE (FLOAT):
779 CASE_BUILT_IN_TM_STORE (DOUBLE):
780 CASE_BUILT_IN_TM_STORE (LDOUBLE):
781 CASE_BUILT_IN_TM_STORE (M64):
782 CASE_BUILT_IN_TM_STORE (M128):
783 CASE_BUILT_IN_TM_STORE (M256):
784 CASE_BUILT_IN_TM_LOAD (1):
785 CASE_BUILT_IN_TM_LOAD (2):
786 CASE_BUILT_IN_TM_LOAD (4):
787 CASE_BUILT_IN_TM_LOAD (8):
788 CASE_BUILT_IN_TM_LOAD (FLOAT):
789 CASE_BUILT_IN_TM_LOAD (DOUBLE):
790 CASE_BUILT_IN_TM_LOAD (LDOUBLE):
791 CASE_BUILT_IN_TM_LOAD (M64):
792 CASE_BUILT_IN_TM_LOAD (M128):
793 CASE_BUILT_IN_TM_LOAD (M256):
794 case BUILT_IN_TM_LOG:
795 case BUILT_IN_TM_LOG_1:
796 case BUILT_IN_TM_LOG_2:
797 case BUILT_IN_TM_LOG_4:
798 case BUILT_IN_TM_LOG_8:
799 case BUILT_IN_TM_LOG_FLOAT:
800 case BUILT_IN_TM_LOG_DOUBLE:
801 case BUILT_IN_TM_LOG_LDOUBLE:
802 case BUILT_IN_TM_LOG_M64:
803 case BUILT_IN_TM_LOG_M128:
804 case BUILT_IN_TM_LOG_M256:
805 return true;
806 default:
807 break;
810 return false;
813 /* Detect flags (function attributes) from the function decl or type node. */
815 int
816 flags_from_decl_or_type (const_tree exp)
818 int flags = 0;
820 if (DECL_P (exp))
822 /* The function exp may have the `malloc' attribute. */
823 if (DECL_IS_MALLOC (exp))
824 flags |= ECF_MALLOC;
826 /* The function exp may have the `returns_twice' attribute. */
827 if (DECL_IS_RETURNS_TWICE (exp))
828 flags |= ECF_RETURNS_TWICE;
830 /* Process the pure and const attributes. */
831 if (TREE_READONLY (exp))
832 flags |= ECF_CONST;
833 if (DECL_PURE_P (exp))
834 flags |= ECF_PURE;
835 if (DECL_LOOPING_CONST_OR_PURE_P (exp))
836 flags |= ECF_LOOPING_CONST_OR_PURE;
838 if (DECL_IS_NOVOPS (exp))
839 flags |= ECF_NOVOPS;
840 if (lookup_attribute ("leaf", DECL_ATTRIBUTES (exp)))
841 flags |= ECF_LEAF;
842 if (lookup_attribute ("cold", DECL_ATTRIBUTES (exp)))
843 flags |= ECF_COLD;
845 if (TREE_NOTHROW (exp))
846 flags |= ECF_NOTHROW;
848 if (flag_tm)
850 if (is_tm_builtin (exp))
851 flags |= ECF_TM_BUILTIN;
852 else if ((flags & (ECF_CONST|ECF_NOVOPS)) != 0
853 || lookup_attribute ("transaction_pure",
854 TYPE_ATTRIBUTES (TREE_TYPE (exp))))
855 flags |= ECF_TM_PURE;
858 flags = special_function_p (exp, flags);
860 else if (TYPE_P (exp))
862 if (TYPE_READONLY (exp))
863 flags |= ECF_CONST;
865 if (flag_tm
866 && ((flags & ECF_CONST) != 0
867 || lookup_attribute ("transaction_pure", TYPE_ATTRIBUTES (exp))))
868 flags |= ECF_TM_PURE;
870 else
871 gcc_unreachable ();
873 if (TREE_THIS_VOLATILE (exp))
875 flags |= ECF_NORETURN;
876 if (flags & (ECF_CONST|ECF_PURE))
877 flags |= ECF_LOOPING_CONST_OR_PURE;
880 return flags;
883 /* Detect flags from a CALL_EXPR. */
885 int
886 call_expr_flags (const_tree t)
888 int flags;
889 tree decl = get_callee_fndecl (t);
891 if (decl)
892 flags = flags_from_decl_or_type (decl);
893 else if (CALL_EXPR_FN (t) == NULL_TREE)
894 flags = internal_fn_flags (CALL_EXPR_IFN (t));
895 else
897 tree type = TREE_TYPE (CALL_EXPR_FN (t));
898 if (type && TREE_CODE (type) == POINTER_TYPE)
899 flags = flags_from_decl_or_type (TREE_TYPE (type));
900 else
901 flags = 0;
902 if (CALL_EXPR_BY_DESCRIPTOR (t))
903 flags |= ECF_BY_DESCRIPTOR;
906 return flags;
909 /* Return true if TYPE should be passed by invisible reference. */
911 bool
912 pass_by_reference (CUMULATIVE_ARGS *ca, machine_mode mode,
913 tree type, bool named_arg)
915 if (type)
917 /* If this type contains non-trivial constructors, then it is
918 forbidden for the middle-end to create any new copies. */
919 if (TREE_ADDRESSABLE (type))
920 return true;
922 /* GCC post 3.4 passes *all* variable sized types by reference. */
923 if (!TYPE_SIZE (type) || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
924 return true;
926 /* If a record type should be passed the same as its first (and only)
927 member, use the type and mode of that member. */
928 if (TREE_CODE (type) == RECORD_TYPE && TYPE_TRANSPARENT_AGGR (type))
930 type = TREE_TYPE (first_field (type));
931 mode = TYPE_MODE (type);
935 return targetm.calls.pass_by_reference (pack_cumulative_args (ca), mode,
936 type, named_arg);
939 /* Return true if TYPE, which is passed by reference, should be callee
940 copied instead of caller copied. */
942 bool
943 reference_callee_copied (CUMULATIVE_ARGS *ca, machine_mode mode,
944 tree type, bool named_arg)
946 if (type && TREE_ADDRESSABLE (type))
947 return false;
948 return targetm.calls.callee_copies (pack_cumulative_args (ca), mode, type,
949 named_arg);
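/* Editorial note (not in the original source): for C++ class types that
   are non-trivial for the purposes of calls, the front end marks the type
   TREE_ADDRESSABLE, so pass_by_reference above answers true regardless of
   the target hook and reference_callee_copied answers false (the caller
   owns the copy).  Variable-sized types are likewise always passed by
   reference; see also the MAY_TAILCALL note in the comment before
   initialize_argument_information further down.  */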
953 /* Precompute all register parameters as described by ARGS, storing values
954 into fields within the ARGS array.
956 NUM_ACTUALS indicates the total number elements in the ARGS array.
958 Set REG_PARM_SEEN if we encounter a register parameter. */
960 static void
961 precompute_register_parameters (int num_actuals, struct arg_data *args,
962 int *reg_parm_seen)
964 int i;
966 *reg_parm_seen = 0;
968 for (i = 0; i < num_actuals; i++)
969 if (args[i].reg != 0 && ! args[i].pass_on_stack)
971 *reg_parm_seen = 1;
973 if (args[i].value == 0)
975 push_temp_slots ();
976 args[i].value = expand_normal (args[i].tree_value);
977 preserve_temp_slots (args[i].value);
978 pop_temp_slots ();
981 /* If we are to promote the function arg to a wider mode,
982 do it now. */
984 if (args[i].mode != TYPE_MODE (TREE_TYPE (args[i].tree_value)))
985 args[i].value
986 = convert_modes (args[i].mode,
987 TYPE_MODE (TREE_TYPE (args[i].tree_value)),
988 args[i].value, args[i].unsignedp);
990 /* If the value is a non-legitimate constant, force it into a
991 pseudo now. TLS symbols sometimes need a call to resolve. */
992 if (CONSTANT_P (args[i].value)
993 && !targetm.legitimate_constant_p (args[i].mode, args[i].value))
994 args[i].value = force_reg (args[i].mode, args[i].value);
996 /* If we're going to have to load the value by parts, pull the
997 parts into pseudos. The part extraction process can involve
998 non-trivial computation. */
999 if (GET_CODE (args[i].reg) == PARALLEL)
1001 tree type = TREE_TYPE (args[i].tree_value);
1002 args[i].parallel_value
1003 = emit_group_load_into_temps (args[i].reg, args[i].value,
1004 type, int_size_in_bytes (type));
1007 /* If the value is expensive, and we are inside an appropriately
1008 short loop, put the value into a pseudo and then put the pseudo
1009 into the hard reg.
1011 For small register classes, also do this if this call uses
1012 register parameters. This is to avoid reload conflicts while
1013 loading the parameters registers. */
1015 else if ((! (REG_P (args[i].value)
1016 || (GET_CODE (args[i].value) == SUBREG
1017 && REG_P (SUBREG_REG (args[i].value)))))
1018 && args[i].mode != BLKmode
1019 && (set_src_cost (args[i].value, args[i].mode,
1020 optimize_insn_for_speed_p ())
1021 > COSTS_N_INSNS (1))
1022 && ((*reg_parm_seen
1023 && targetm.small_register_classes_for_mode_p (args[i].mode))
1024 || optimize))
1025 args[i].value = copy_to_mode_reg (args[i].mode, args[i].value);
1029 #ifdef REG_PARM_STACK_SPACE
1031 /* The argument list is the property of the called routine and it
1032 may clobber it. If the fixed area has been used for previous
1033 parameters, we must save and restore it. */
1035 static rtx
1036 save_fixed_argument_area (int reg_parm_stack_space, rtx argblock, int *low_to_save, int *high_to_save)
1038 unsigned int low;
1039 unsigned int high;
1041 /* Compute the boundary of the area that needs to be saved, if any. */
1042 high = reg_parm_stack_space;
1043 if (ARGS_GROW_DOWNWARD)
1044 high += 1;
1046 if (high > highest_outgoing_arg_in_use)
1047 high = highest_outgoing_arg_in_use;
1049 for (low = 0; low < high; low++)
1050 if (stack_usage_map[low] != 0 || low >= stack_usage_watermark)
1052 int num_to_save;
1053 machine_mode save_mode;
1054 int delta;
1055 rtx addr;
1056 rtx stack_area;
1057 rtx save_area;
1059 while (stack_usage_map[--high] == 0)
1062 *low_to_save = low;
1063 *high_to_save = high;
1065 num_to_save = high - low + 1;
1067 /* If we don't have the required alignment, must do this
1068 in BLKmode. */
1069 scalar_int_mode imode;
1070 if (int_mode_for_size (num_to_save * BITS_PER_UNIT, 1).exists (&imode)
1071 && (low & (MIN (GET_MODE_SIZE (imode),
1072 BIGGEST_ALIGNMENT / UNITS_PER_WORD) - 1)) == 0)
1073 save_mode = imode;
1074 else
1075 save_mode = BLKmode;
1077 if (ARGS_GROW_DOWNWARD)
1078 delta = -high;
1079 else
1080 delta = low;
1082 addr = plus_constant (Pmode, argblock, delta);
1083 stack_area = gen_rtx_MEM (save_mode, memory_address (save_mode, addr));
1085 set_mem_align (stack_area, PARM_BOUNDARY);
1086 if (save_mode == BLKmode)
1088 save_area = assign_stack_temp (BLKmode, num_to_save);
1089 emit_block_move (validize_mem (save_area), stack_area,
1090 GEN_INT (num_to_save), BLOCK_OP_CALL_PARM);
1092 else
1094 save_area = gen_reg_rtx (save_mode);
1095 emit_move_insn (save_area, stack_area);
1098 return save_area;
1101 return NULL_RTX;
1104 static void
1105 restore_fixed_argument_area (rtx save_area, rtx argblock, int high_to_save, int low_to_save)
1107 machine_mode save_mode = GET_MODE (save_area);
1108 int delta;
1109 rtx addr, stack_area;
1111 if (ARGS_GROW_DOWNWARD)
1112 delta = -high_to_save;
1113 else
1114 delta = low_to_save;
1116 addr = plus_constant (Pmode, argblock, delta);
1117 stack_area = gen_rtx_MEM (save_mode, memory_address (save_mode, addr));
1118 set_mem_align (stack_area, PARM_BOUNDARY);
1120 if (save_mode != BLKmode)
1121 emit_move_insn (stack_area, save_area);
1122 else
1123 emit_block_move (stack_area, validize_mem (save_area),
1124 GEN_INT (high_to_save - low_to_save + 1),
1125 BLOCK_OP_CALL_PARM);
1127 #endif /* REG_PARM_STACK_SPACE */
1129 /* If any elements in ARGS refer to parameters that are to be passed in
1130 registers, but not in memory, and whose alignment does not permit a
1131 direct copy into registers, copy the values into a group of pseudos
1132 which we will later copy into the appropriate hard registers.
1134 Pseudos for each unaligned argument will be stored into the array
1135 args[argnum].aligned_regs. The caller is responsible for deallocating
1136 the aligned_regs array if it is nonzero. */
1138 static void
1139 store_unaligned_arguments_into_pseudos (struct arg_data *args, int num_actuals)
1141 int i, j;
1143 for (i = 0; i < num_actuals; i++)
1144 if (args[i].reg != 0 && ! args[i].pass_on_stack
1145 && GET_CODE (args[i].reg) != PARALLEL
1146 && args[i].mode == BLKmode
1147 && MEM_P (args[i].value)
1148 && (MEM_ALIGN (args[i].value)
1149 < (unsigned int) MIN (BIGGEST_ALIGNMENT, BITS_PER_WORD)))
1151 int bytes = int_size_in_bytes (TREE_TYPE (args[i].tree_value));
1152 int endian_correction = 0;
1154 if (args[i].partial)
1156 gcc_assert (args[i].partial % UNITS_PER_WORD == 0);
1157 args[i].n_aligned_regs = args[i].partial / UNITS_PER_WORD;
1159 else
1161 args[i].n_aligned_regs
1162 = (bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
1165 args[i].aligned_regs = XNEWVEC (rtx, args[i].n_aligned_regs);
1167 /* Structures smaller than a word are normally aligned to the
1168 least significant byte. On a BYTES_BIG_ENDIAN machine,
1169 this means we must skip the empty high order bytes when
1170 calculating the bit offset. */
1171 if (bytes < UNITS_PER_WORD
1172 #ifdef BLOCK_REG_PADDING
1173 && (BLOCK_REG_PADDING (args[i].mode,
1174 TREE_TYPE (args[i].tree_value), 1)
1175 == PAD_DOWNWARD)
1176 #else
1177 && BYTES_BIG_ENDIAN
1178 #endif
1180 endian_correction = BITS_PER_WORD - bytes * BITS_PER_UNIT;
1182 for (j = 0; j < args[i].n_aligned_regs; j++)
1184 rtx reg = gen_reg_rtx (word_mode);
1185 rtx word = operand_subword_force (args[i].value, j, BLKmode);
1186 int bitsize = MIN (bytes * BITS_PER_UNIT, BITS_PER_WORD);
1188 args[i].aligned_regs[j] = reg;
1189 word = extract_bit_field (word, bitsize, 0, 1, NULL_RTX,
1190 word_mode, word_mode, false, NULL);
1192 /* There is no need to restrict this code to loading items
1193 in TYPE_ALIGN sized hunks. The bitfield instructions can
1194 load up entire word sized registers efficiently.
1196 ??? This may not be needed anymore.
1197 We used to emit a clobber here but that doesn't let later
1198 passes optimize the instructions we emit. By storing 0 into
1199 the register later passes know the first AND to zero out the
1200 bitfield being set in the register is unnecessary. The store
1201 of 0 will be deleted as will at least the first AND. */
1203 emit_move_insn (reg, const0_rtx);
1205 bytes -= bitsize / BITS_PER_UNIT;
1206 store_bit_field (reg, bitsize, endian_correction, 0, 0,
1207 word_mode, word, false);
1212 /* The limit set by -Walloc-size-larger-than=. */
1213 static GTY(()) tree alloc_object_size_limit;
1215 /* Initialize ALLOC_OBJECT_SIZE_LIMIT based on the -Walloc-size-larger-than=
1216 setting if the option is specified, or to the maximum object size if it
1217 is not. Return the initialized value. */
1219 static tree
1220 alloc_max_size (void)
1222 if (alloc_object_size_limit)
1223 return alloc_object_size_limit;
1225 alloc_object_size_limit
1226 = build_int_cst (size_type_node, warn_alloc_size_limit);
1228 return alloc_object_size_limit;
1231 /* Return true when EXP's range can be determined and set RANGE[] to it
1232 after adjusting it if necessary to make EXP represent a valid size
1233 of an object, or a valid size argument to an allocation function declared
1234 with attribute alloc_size (whose argument may be signed), or to a string
1235 manipulation function like memset. When ALLOW_ZERO is true, allow
1236 returning a range of [0, 0] for a size in an anti-range [1, N] where
1237 N > PTRDIFF_MAX. A zero range is a (nearly) invalid argument to
1238 allocation functions like malloc but it is a valid argument to
1239 functions like memset. */
1241 bool
1242 get_size_range (tree exp, tree range[2], bool allow_zero /* = false */)
1244 if (tree_fits_uhwi_p (exp))
1246 /* EXP is a constant. */
1247 range[0] = range[1] = exp;
1248 return true;
1251 tree exptype = TREE_TYPE (exp);
1252 bool integral = INTEGRAL_TYPE_P (exptype);
1254 wide_int min, max;
1255 enum value_range_type range_type;
1257 if (integral)
1258 range_type = determine_value_range (exp, &min, &max);
1259 else
1260 range_type = VR_VARYING;
1262 if (range_type == VR_VARYING)
1264 if (integral)
1266 /* Use the full range of the type of the expression when
1267 no value range information is available. */
1268 range[0] = TYPE_MIN_VALUE (exptype);
1269 range[1] = TYPE_MAX_VALUE (exptype);
1270 return true;
1273 range[0] = NULL_TREE;
1274 range[1] = NULL_TREE;
1275 return false;
1278 unsigned expprec = TYPE_PRECISION (exptype);
1280 bool signed_p = !TYPE_UNSIGNED (exptype);
1282 if (range_type == VR_ANTI_RANGE)
1284 if (signed_p)
1286 if (wi::les_p (max, 0))
1288 /* EXP is not in a strictly negative range. That means
1289 it must be in some (not necessarily strictly) positive
1290 range which includes zero. Since in signed to unsigned
1291 conversions negative values end up converted to large
1292 positive values, and otherwise they are not valid sizes,
1293 the resulting range is in both cases [0, TYPE_MAX]. */
1294 min = wi::zero (expprec);
1295 max = wi::to_wide (TYPE_MAX_VALUE (exptype));
1297 else if (wi::les_p (min - 1, 0))
1299 /* EXP is not in a negative-positive range. That means EXP
1300 is either negative, or greater than max. Since negative
1301 sizes are invalid make the range [MAX + 1, TYPE_MAX]. */
1302 min = max + 1;
1303 max = wi::to_wide (TYPE_MAX_VALUE (exptype));
1305 else
1307 max = min - 1;
1308 min = wi::zero (expprec);
1311 else if (wi::eq_p (0, min - 1))
1313 /* EXP is unsigned and not in the range [1, MAX]. That means
1314 it's either zero or greater than MAX. Even though 0 would
1315 normally be detected by -Walloc-zero, unless ALLOW_ZERO
1316 is true, set the range to [MAX, TYPE_MAX] so that when MAX
1317 is greater than the limit the whole range is diagnosed. */
1318 if (allow_zero)
1319 min = max = wi::zero (expprec);
1320 else
1322 min = max + 1;
1323 max = wi::to_wide (TYPE_MAX_VALUE (exptype));
1326 else
1328 max = min - 1;
1329 min = wi::zero (expprec);
1333 range[0] = wide_int_to_tree (exptype, min);
1334 range[1] = wide_int_to_tree (exptype, max);
1336 return true;
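/* Editorial sketch (not in the original source): callers typically use
   get_size_range to turn a size operand into a [low, high] pair of trees
   and then compare the bounds against the maximum object size, e.g.

     tree range[2];
     if (get_size_range (size_arg, range)
         && tree_int_cst_lt (maxobjsize, range[0]))
       warning_at (loc, OPT_Walloc_size_larger_than_, ...);

   (size_arg, maxobjsize and loc are placeholders here.)
   maybe_warn_alloc_args_overflow and maybe_warn_nonstring_arg below do
   essentially this.  */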
1339 /* Diagnose a call EXP to function FN decorated with attribute alloc_size
1340 whose argument numbers given by IDX with values given by ARGS exceed
1341 the maximum object size or cause an unsigned overflow (wrapping) when
1342 multiplied. When ARGS[0] is null the function does nothing. ARGS[1]
1343 may be null for functions like malloc, and non-null for those like
1344 calloc that are decorated with a two-argument attribute alloc_size. */
1346 void
1347 maybe_warn_alloc_args_overflow (tree fn, tree exp, tree args[2], int idx[2])
1349 /* The range each of the (up to) two arguments is known to be in. */
1350 tree argrange[2][2] = { { NULL_TREE, NULL_TREE }, { NULL_TREE, NULL_TREE } };
1352 /* Maximum object size set by -Walloc-size-larger-than= or SIZE_MAX / 2. */
1353 tree maxobjsize = alloc_max_size ();
1355 location_t loc = EXPR_LOCATION (exp);
1357 bool warned = false;
1359 /* Validate each argument individually. */
1360 for (unsigned i = 0; i != 2 && args[i]; ++i)
1362 if (TREE_CODE (args[i]) == INTEGER_CST)
1364 argrange[i][0] = args[i];
1365 argrange[i][1] = args[i];
1367 if (tree_int_cst_lt (args[i], integer_zero_node))
1369 warned = warning_at (loc, OPT_Walloc_size_larger_than_,
1370 "%Kargument %i value %qE is negative",
1371 exp, idx[i] + 1, args[i]);
1373 else if (integer_zerop (args[i]))
1375 /* Avoid issuing -Walloc-zero for allocation functions other
1376 than __builtin_alloca that are declared with attribute
1377 returns_nonnull because there's no portability risk. This
1378 avoids warning for such calls to libiberty's xmalloc and
1379 friends.
1380 Also avoid issuing the warning for calls to function named
1381 "alloca". */
1382 if ((DECL_FUNCTION_CODE (fn) == BUILT_IN_ALLOCA
1383 && IDENTIFIER_LENGTH (DECL_NAME (fn)) != 6)
1384 || (DECL_FUNCTION_CODE (fn) != BUILT_IN_ALLOCA
1385 && !lookup_attribute ("returns_nonnull",
1386 TYPE_ATTRIBUTES (TREE_TYPE (fn)))))
1387 warned = warning_at (loc, OPT_Walloc_zero,
1388 "%Kargument %i value is zero",
1389 exp, idx[i] + 1);
1391 else if (tree_int_cst_lt (maxobjsize, args[i]))
1393 /* G++ emits calls to ::operator new[](SIZE_MAX) in C++98
1394 mode and with -fno-exceptions as a way to indicate array
1395 size overflow. There's no good way to detect C++98 here
1396 so avoid diagnosing these calls for all C++ modes. */
1397 if (i == 0
1398 && !args[1]
1399 && lang_GNU_CXX ()
1400 && DECL_IS_OPERATOR_NEW (fn)
1401 && integer_all_onesp (args[i]))
1402 continue;
1404 warned = warning_at (loc, OPT_Walloc_size_larger_than_,
1405 "%Kargument %i value %qE exceeds "
1406 "maximum object size %E",
1407 exp, idx[i] + 1, args[i], maxobjsize);
1410 else if (TREE_CODE (args[i]) == SSA_NAME
1411 && get_size_range (args[i], argrange[i]))
1413 /* Verify that the argument's range is not negative (including
1414 upper bound of zero). */
1415 if (tree_int_cst_lt (argrange[i][0], integer_zero_node)
1416 && tree_int_cst_le (argrange[i][1], integer_zero_node))
1418 warned = warning_at (loc, OPT_Walloc_size_larger_than_,
1419 "%Kargument %i range [%E, %E] is negative",
1420 exp, idx[i] + 1,
1421 argrange[i][0], argrange[i][1]);
1423 else if (tree_int_cst_lt (maxobjsize, argrange[i][0]))
1425 warned = warning_at (loc, OPT_Walloc_size_larger_than_,
1426 "%Kargument %i range [%E, %E] exceeds "
1427 "maximum object size %E",
1428 exp, idx[i] + 1,
1429 argrange[i][0], argrange[i][1],
1430 maxobjsize);
1435 if (!argrange[0])
1436 return;
1438 /* For a two-argument alloc_size, validate the product of the two
1439 arguments if both of their values or ranges are known. */
1440 if (!warned && tree_fits_uhwi_p (argrange[0][0])
1441 && argrange[1][0] && tree_fits_uhwi_p (argrange[1][0])
1442 && !integer_onep (argrange[0][0])
1443 && !integer_onep (argrange[1][0]))
1445 /* Check for overflow in the product of a function decorated with
1446 attribute alloc_size (X, Y). */
1447 unsigned szprec = TYPE_PRECISION (size_type_node);
1448 wide_int x = wi::to_wide (argrange[0][0], szprec);
1449 wide_int y = wi::to_wide (argrange[1][0], szprec);
1451 wi::overflow_type vflow;
1452 wide_int prod = wi::umul (x, y, &vflow);
1454 if (vflow)
1455 warned = warning_at (loc, OPT_Walloc_size_larger_than_,
1456 "%Kproduct %<%E * %E%> of arguments %i and %i "
1457 "exceeds %<SIZE_MAX%>",
1458 exp, argrange[0][0], argrange[1][0],
1459 idx[0] + 1, idx[1] + 1);
1460 else if (wi::ltu_p (wi::to_wide (maxobjsize, szprec), prod))
1461 warned = warning_at (loc, OPT_Walloc_size_larger_than_,
1462 "%Kproduct %<%E * %E%> of arguments %i and %i "
1463 "exceeds maximum object size %E",
1464 exp, argrange[0][0], argrange[1][0],
1465 idx[0] + 1, idx[1] + 1,
1466 maxobjsize);
1468 if (warned)
1470 /* Print the full range of each of the two arguments to make
1471 it clear when it is, in fact, in a range and not constant. */
1472 if (argrange[0][0] != argrange [0][1])
1473 inform (loc, "argument %i in the range [%E, %E]",
1474 idx[0] + 1, argrange[0][0], argrange[0][1]);
1475 if (argrange[1][0] != argrange [1][1])
1476 inform (loc, "argument %i in the range [%E, %E]",
1477 idx[1] + 1, argrange[1][0], argrange[1][1]);
1481 if (warned)
1483 location_t fnloc = DECL_SOURCE_LOCATION (fn);
1485 if (DECL_IS_BUILTIN (fn))
1486 inform (loc,
1487 "in a call to built-in allocation function %qD", fn);
1488 else
1489 inform (fnloc,
1490 "in a call to allocation function %qD declared here", fn);
1494 /* If EXPR refers to a character array or pointer declared attribute
1495 nonstring return a decl for that array or pointer and set *REF to
1496 the referenced enclosing object or pointer. Otherwise returns
1497 null. */
1499 tree
1500 get_attr_nonstring_decl (tree expr, tree *ref)
1502 tree decl = expr;
1503 if (TREE_CODE (decl) == SSA_NAME)
1505 gimple *def = SSA_NAME_DEF_STMT (decl);
1507 if (is_gimple_assign (def))
1509 tree_code code = gimple_assign_rhs_code (def);
1510 if (code == ADDR_EXPR
1511 || code == COMPONENT_REF
1512 || code == VAR_DECL)
1513 decl = gimple_assign_rhs1 (def);
1515 else if (tree var = SSA_NAME_VAR (decl))
1516 decl = var;
1519 if (TREE_CODE (decl) == ADDR_EXPR)
1520 decl = TREE_OPERAND (decl, 0);
1522 if (ref)
1523 *ref = decl;
1525 if (TREE_CODE (decl) == ARRAY_REF)
1526 decl = TREE_OPERAND (decl, 0);
1527 else if (TREE_CODE (decl) == COMPONENT_REF)
1528 decl = TREE_OPERAND (decl, 1);
1529 else if (TREE_CODE (decl) == MEM_REF)
1530 return get_attr_nonstring_decl (TREE_OPERAND (decl, 0), ref);
1532 if (DECL_P (decl)
1533 && lookup_attribute ("nonstring", DECL_ATTRIBUTES (decl)))
1534 return decl;
1536 return NULL_TREE;
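/* Editorial example (not in the original source): the attribute looked up
   above is written in user code as

     char serial[8] __attribute__ ((nonstring));

   Passing SERIAL where a nul-terminated string is expected is what
   maybe_warn_nonstring_arg below diagnoses, unless the call supplies an
   explicit bound no larger than the array.  */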
1539 /* Warn about passing a non-string array/pointer to a function that
1540 expects a nul-terminated string argument. */
1542 void
1543 maybe_warn_nonstring_arg (tree fndecl, tree exp)
1545 if (!fndecl || DECL_BUILT_IN_CLASS (fndecl) != BUILT_IN_NORMAL)
1546 return;
1548 if (TREE_NO_WARNING (exp))
1549 return;
1551 unsigned nargs = call_expr_nargs (exp);
1553 /* The bound argument to a bounded string function like strncpy. */
1554 tree bound = NULL_TREE;
1556 /* The range of lengths of a string argument to one of the comparison
1557 functions. If the length is less than the bound it is used instead. */
1558 tree lenrng[2] = { NULL_TREE, NULL_TREE };
1560 /* It's safe to call "bounded" string functions with a non-string
1561 argument since the functions provide an explicit bound for this
1562 purpose. The exception is strncat where the bound may refer to
1563 either the destination or the source. */
1564 int fncode = DECL_FUNCTION_CODE (fndecl);
1565 switch (fncode)
1567 case BUILT_IN_STRCMP:
1568 case BUILT_IN_STRNCMP:
1569 case BUILT_IN_STRNCASECMP:
1571 /* For these, if one argument refers to one or more of a set
1572 of string constants or arrays of known size, determine
1573 the range of their known or possible lengths and use it
1574 conservatively as the bound for the unbounded function,
1575 and to adjust the range of the bound of the bounded ones. */
1576 for (unsigned argno = 0; argno < nargs && !*lenrng; argno ++)
1578 tree arg = CALL_EXPR_ARG (exp, argno);
1579 if (!get_attr_nonstring_decl (arg))
1580 get_range_strlen (arg, lenrng);
1583 /* Fall through. */
1585 case BUILT_IN_STRNCAT:
1586 case BUILT_IN_STPNCPY:
1587 case BUILT_IN_STRNCPY:
1588 if (2 < nargs)
1589 bound = CALL_EXPR_ARG (exp, 2);
1590 break;
1592 case BUILT_IN_STRNDUP:
1593 if (1 < nargs)
1594 bound = CALL_EXPR_ARG (exp, 1);
1595 break;
1597 case BUILT_IN_STRNLEN:
1599 tree arg = CALL_EXPR_ARG (exp, 0);
1600 if (!get_attr_nonstring_decl (arg))
1601 get_range_strlen (arg, lenrng);
1603 if (1 < nargs)
1604 bound = CALL_EXPR_ARG (exp, 1);
1605 break;
1608 default:
1609 break;
1612 /* Determine the range of the bound argument (if specified). */
1613 tree bndrng[2] = { NULL_TREE, NULL_TREE };
1614 if (bound)
1616 STRIP_NOPS (bound);
1617 get_size_range (bound, bndrng);
1620 location_t loc = EXPR_LOCATION (exp);
1622 if (bndrng[0])
1624 /* Diagnose excessive bound prior to the adjustment below and
1625 regardless of attribute nonstring. */
1626 tree maxobjsize = max_object_size ();
1627 if (tree_int_cst_lt (maxobjsize, bndrng[0]))
1629 if (tree_int_cst_equal (bndrng[0], bndrng[1]))
1630 warning_at (loc, OPT_Wstringop_overflow_,
1631 "%K%qD specified bound %E "
1632 "exceeds maximum object size %E",
1633 exp, fndecl, bndrng[0], maxobjsize);
1634 else
1635 warning_at (loc, OPT_Wstringop_overflow_,
1636 "%K%qD specified bound [%E, %E] "
1637 "exceeds maximum object size %E",
1638 exp, fndecl, bndrng[0], bndrng[1], maxobjsize);
1639 return;
1643 if (*lenrng)
1645 /* Add one for the nul. */
1646 lenrng[0] = const_binop (PLUS_EXPR, TREE_TYPE (lenrng[0]),
1647 lenrng[0], size_one_node);
1648 lenrng[1] = const_binop (PLUS_EXPR, TREE_TYPE (lenrng[1]),
1649 lenrng[1], size_one_node);
1651 if (!bndrng[0])
1653 /* Conservatively use the upper bound of the lengths for
1654 both the lower and the upper bound of the operation. */
1655 bndrng[0] = lenrng[1];
1656 bndrng[1] = lenrng[1];
1657 bound = void_type_node;
1659 else
1661 /* Replace the bound on the operation with the upper bound
1662 of the length of the string if the latter is smaller. */
1663 if (tree_int_cst_lt (lenrng[1], bndrng[0]))
1664 bndrng[0] = lenrng[1];
1665 else if (tree_int_cst_lt (lenrng[1], bndrng[1]))
1666 bndrng[1] = lenrng[1];
1670 /* Iterate over the built-in function's formal arguments and check
1671 each const char* against the actual argument. If the actual
1672 argument is declared attribute non-string issue a warning unless
1673 the argument's maximum length is bounded. */
1674 function_args_iterator it;
1675 function_args_iter_init (&it, TREE_TYPE (fndecl));
1677 for (unsigned argno = 0; ; ++argno, function_args_iter_next (&it))
1679 /* Avoid iterating past the declared argument in a call
1680 to a function declared without a prototype. */
1681 if (argno >= nargs)
1682 break;
1684 tree argtype = function_args_iter_cond (&it);
1685 if (!argtype)
1686 break;
1688 if (TREE_CODE (argtype) != POINTER_TYPE)
1689 continue;
1691 argtype = TREE_TYPE (argtype);
1693 if (TREE_CODE (argtype) != INTEGER_TYPE
1694 || !TYPE_READONLY (argtype))
1695 continue;
1697 argtype = TYPE_MAIN_VARIANT (argtype);
1698 if (argtype != char_type_node)
1699 continue;
1701 tree callarg = CALL_EXPR_ARG (exp, argno);
1702 if (TREE_CODE (callarg) == ADDR_EXPR)
1703 callarg = TREE_OPERAND (callarg, 0);
1705 /* See if the destination is declared with attribute "nonstring". */
1706 tree decl = get_attr_nonstring_decl (callarg);
1707 if (!decl)
1708 continue;
1710 /* The maximum number of array elements accessed. */
1711 offset_int wibnd = 0;
1713 if (argno && fncode == BUILT_IN_STRNCAT)
1715 /* See if the bound in strncat is derived from the length
1716 of the strlen of the destination (as it's expected to be).
1717 If so, reset BOUND and FNCODE to trigger a warning. */
1718 tree dstarg = CALL_EXPR_ARG (exp, 0);
1719 if (is_strlen_related_p (dstarg, bound))
1721 /* The bound applies to the destination, not to the source,
1722 so reset these to trigger a warning without mentioning
1723 the bound. */
1724 bound = NULL;
1725 fncode = 0;
1727 else if (bndrng[1])
1728 /* Use the upper bound of the range for strncat. */
1729 wibnd = wi::to_offset (bndrng[1]);
1731 else if (bndrng[0])
1732 /* Use the lower bound of the range for functions other than
1733 strncat. */
1734 wibnd = wi::to_offset (bndrng[0]);
1736 /* Determine the size of the argument array if it is one. */
1737 offset_int asize = wibnd;
1738 bool known_size = false;
1739 tree type = TREE_TYPE (decl);
1741 /* Determine the array size. For arrays of unknown bound and
1742 pointers reset BOUND to trigger the appropriate warning. */
1743 if (TREE_CODE (type) == ARRAY_TYPE)
1745 if (tree arrbnd = TYPE_DOMAIN (type))
1747 if ((arrbnd = TYPE_MAX_VALUE (arrbnd)))
1749 asize = wi::to_offset (arrbnd) + 1;
1750 known_size = true;
1753 else if (bound == void_type_node)
1754 bound = NULL_TREE;
1756 else if (bound == void_type_node)
1757 bound = NULL_TREE;
1759 /* In a call to strncat with a bound in a range whose lower but
1760 not upper bound is less than the array size, reset ASIZE to
1761 be the same as the bound and the other variable to trigger
1762 the appropriate warning below. */
1763 if (fncode == BUILT_IN_STRNCAT
1764 && bndrng[0] != bndrng[1]
1765 && wi::ltu_p (wi::to_offset (bndrng[0]), asize)
1766 && (!known_size
1767 || wi::ltu_p (asize, wibnd)))
1769 asize = wibnd;
1770 bound = NULL_TREE;
1771 fncode = 0;
1774 bool warned = false;
1776 if (wi::ltu_p (asize, wibnd))
1778 if (bndrng[0] == bndrng[1])
1779 warned = warning_at (loc, OPT_Wstringop_overflow_,
1780 "%qD argument %i declared attribute "
1781 "%<nonstring%> is smaller than the specified "
1782 "bound %wu",
1783 fndecl, argno + 1, wibnd.to_uhwi ());
1784 else if (wi::ltu_p (asize, wi::to_offset (bndrng[0])))
1785 warned = warning_at (loc, OPT_Wstringop_overflow_,
1786 "%qD argument %i declared attribute "
1787 "%<nonstring%> is smaller than "
1788 "the specified bound [%E, %E]",
1789 fndecl, argno + 1, bndrng[0], bndrng[1]);
1790 else
1791 warned = warning_at (loc, OPT_Wstringop_overflow_,
1792 "%qD argument %i declared attribute "
1793 "%<nonstring%> may be smaller than "
1794 "the specified bound [%E, %E]",
1795 fndecl, argno + 1, bndrng[0], bndrng[1]);
1797 else if (fncode == BUILT_IN_STRNCAT)
1798 ; /* Avoid warning for calls to strncat() when the bound
1799 is equal to the size of the non-string argument. */
1800 else if (!bound)
1801 warned = warning_at (loc, OPT_Wstringop_overflow_,
1802 "%qD argument %i declared attribute %<nonstring%>",
1803 fndecl, argno + 1);
1805 if (warned)
1806 inform (DECL_SOURCE_LOCATION (decl),
1807 "argument %qD declared here", decl);
1811 /* Issue an error if CALL_EXPR was flagged as requiring
1812 tail-call optimization. */
1814 static void
1815 maybe_complain_about_tail_call (tree call_expr, const char *reason)
1817 gcc_assert (TREE_CODE (call_expr) == CALL_EXPR);
1818 if (!CALL_EXPR_MUST_TAIL_CALL (call_expr))
1819 return;
1821 error_at (EXPR_LOCATION (call_expr), "cannot tail-call: %s", reason);
1824 /* Fill in ARGS_SIZE and ARGS array based on the parameters found in
1825 CALL_EXPR EXP.
1827 NUM_ACTUALS is the total number of parameters.
1829 N_NAMED_ARGS is the total number of named arguments.
1831 STRUCT_VALUE_ADDR_VALUE is the implicit argument for a struct return
1832 value, or null.
1834 FNDECL is the tree code for the target of this call (if known)
1836 ARGS_SO_FAR holds state needed by the target to know where to place
1837 the next argument.
1839 REG_PARM_STACK_SPACE is the number of bytes of stack space reserved
1840 for arguments which are passed in registers.
1842 OLD_STACK_LEVEL is a pointer to an rtx which holds the old stack level
1843 and may be modified by this routine.
1845 OLD_PENDING_ADJ, MUST_PREALLOCATE and FLAGS are pointers to integer
1846 flags which may be modified by this routine.
1848 MAY_TAILCALL is cleared if we encounter an invisible pass-by-reference
1849 that requires allocation of stack space.
1851 CALL_FROM_THUNK_P is true if this call is the jump from a thunk to
1852 the thunked-to function. */
1854 static void
1855 initialize_argument_information (int num_actuals ATTRIBUTE_UNUSED,
1856 struct arg_data *args,
1857 struct args_size *args_size,
1858 int n_named_args ATTRIBUTE_UNUSED,
1859 tree exp, tree struct_value_addr_value,
1860 tree fndecl, tree fntype,
1861 cumulative_args_t args_so_far,
1862 int reg_parm_stack_space,
1863 rtx *old_stack_level,
1864 poly_int64_pod *old_pending_adj,
1865 int *must_preallocate, int *ecf_flags,
1866 bool *may_tailcall, bool call_from_thunk_p)
1868 CUMULATIVE_ARGS *args_so_far_pnt = get_cumulative_args (args_so_far);
1869 location_t loc = EXPR_LOCATION (exp);
1871 /* Count arg position in order args appear. */
1872 int argpos;
1874 int i;
1876 args_size->constant = 0;
1877 args_size->var = 0;
1879 bitmap_obstack_initialize (NULL);
1881 /* In this loop, we consider args in the order they are written.
1882 We fill up ARGS from the back. */
1884 i = num_actuals - 1;
1886 int j = i;
1887 call_expr_arg_iterator iter;
1888 tree arg;
1889 bitmap slots = NULL;
1891 if (struct_value_addr_value)
1893 args[j].tree_value = struct_value_addr_value;
1894 j--;
1896 argpos = 0;
1897 FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
1899 tree argtype = TREE_TYPE (arg);
1901 if (targetm.calls.split_complex_arg
1902 && argtype
1903 && TREE_CODE (argtype) == COMPLEX_TYPE
1904 && targetm.calls.split_complex_arg (argtype))
1906 tree subtype = TREE_TYPE (argtype);
1907 args[j].tree_value = build1 (REALPART_EXPR, subtype, arg);
1908 j--;
1909 args[j].tree_value = build1 (IMAGPART_EXPR, subtype, arg);
1911 else
1912 args[j].tree_value = arg;
1913 j--;
1914 argpos++;
1917 if (slots)
1918 BITMAP_FREE (slots);
1921 bitmap_obstack_release (NULL);
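/* Editorial note: when the target's split_complex_arg hook accepts the
   argument's type, a single complex actual (e.g. a "_Complex double")
   occupies two consecutive ARGS slots, one holding a REALPART_EXPR and
   the other an IMAGPART_EXPR of the original argument, as set up in the
   loop above.  */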
1923 /* Extract attribute alloc_size and if set, store the indices of
1924 the corresponding arguments in ALLOC_IDX, and then the actual
1925 argument(s) at those indices in ALLOC_ARGS. */
1926 int alloc_idx[2] = { -1, -1 };
1927 if (tree alloc_size
1928 = (fndecl ? lookup_attribute ("alloc_size",
1929 TYPE_ATTRIBUTES (TREE_TYPE (fndecl)))
1930 : NULL_TREE))
1932 tree args = TREE_VALUE (alloc_size);
1933 alloc_idx[0] = TREE_INT_CST_LOW (TREE_VALUE (args)) - 1;
1934 if (TREE_CHAIN (args))
1935 alloc_idx[1] = TREE_INT_CST_LOW (TREE_VALUE (TREE_CHAIN (args))) - 1;
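/* Editorial illustration (assumed declaration, not from this file): for

     void *my_alloc (size_t n, size_t sz)
       __attribute__ ((alloc_size (1, 2)));

   the attribute operands are 1-based, so ALLOC_IDX becomes {0, 1} and
   the actual arguments at those positions are collected below in
   ALLOC_ARGS for maybe_warn_alloc_args_overflow.  */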
1938 /* Array for up to the two attribute alloc_size arguments. */
1939 tree alloc_args[] = { NULL_TREE, NULL_TREE };
1941 /* I counts args in order (to be) pushed; ARGPOS counts in order written. */
1942 for (argpos = 0; argpos < num_actuals; i--, argpos++)
1944 tree type = TREE_TYPE (args[i].tree_value);
1945 int unsignedp;
1946 machine_mode mode;
1948 /* Replace erroneous argument with constant zero. */
1949 if (type == error_mark_node || !COMPLETE_TYPE_P (type))
1950 args[i].tree_value = integer_zero_node, type = integer_type_node;
1952 /* If TYPE is a transparent union or record, pass things the way
1953 we would pass the first field of the union or record. We have
1954 already verified that the modes are the same. */
1955 if ((TREE_CODE (type) == UNION_TYPE || TREE_CODE (type) == RECORD_TYPE)
1956 && TYPE_TRANSPARENT_AGGR (type))
1957 type = TREE_TYPE (first_field (type));
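/* Editorial illustration (assumed user code): given

     typedef union { int *p; const int *q; } uptr
       __attribute__ ((transparent_union));

   an argument of type uptr is passed exactly as its first member (an
   "int *") would be, which is what the first_field substitution above
   implements.  */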
1959 /* Decide where to pass this arg.
1961 args[i].reg is nonzero if all or part is passed in registers.
1963 args[i].partial is nonzero if part but not all is passed in registers,
1964 and the exact value says how many bytes are passed in registers.
1966 args[i].pass_on_stack is nonzero if the argument must at least be
1967 computed on the stack. It may then be loaded back into registers
1968 if args[i].reg is nonzero.
1970 These decisions are driven by the FUNCTION_... macros and must agree
1971 with those made by function.c. */
1973 /* See if this argument should be passed by invisible reference. */
1974 if (pass_by_reference (args_so_far_pnt, TYPE_MODE (type),
1975 type, argpos < n_named_args))
1977 bool callee_copies;
1978 tree base = NULL_TREE;
1980 callee_copies
1981 = reference_callee_copied (args_so_far_pnt, TYPE_MODE (type),
1982 type, argpos < n_named_args);
1984 /* If we're compiling a thunk, pass through invisible references
1985 instead of making a copy. */
1986 if (call_from_thunk_p
1987 || (callee_copies
1988 && !TREE_ADDRESSABLE (type)
1989 && (base = get_base_address (args[i].tree_value))
1990 && TREE_CODE (base) != SSA_NAME
1991 && (!DECL_P (base) || MEM_P (DECL_RTL (base)))))
1993 /* We may have turned the parameter value into an SSA name.
1994 Go back to the original parameter so we can take the
1995 address. */
1996 if (TREE_CODE (args[i].tree_value) == SSA_NAME)
1998 gcc_assert (SSA_NAME_IS_DEFAULT_DEF (args[i].tree_value));
1999 args[i].tree_value = SSA_NAME_VAR (args[i].tree_value);
2000 gcc_assert (TREE_CODE (args[i].tree_value) == PARM_DECL);
2002 /* Argument setup code may have copied the value to register. We
2003 revert that optimization now because the tail call code must
2004 use the original location. */
2005 if (TREE_CODE (args[i].tree_value) == PARM_DECL
2006 && !MEM_P (DECL_RTL (args[i].tree_value))
2007 && DECL_INCOMING_RTL (args[i].tree_value)
2008 && MEM_P (DECL_INCOMING_RTL (args[i].tree_value)))
2009 set_decl_rtl (args[i].tree_value,
2010 DECL_INCOMING_RTL (args[i].tree_value));
2012 mark_addressable (args[i].tree_value);
2014 /* We can't use sibcalls if a callee-copied argument is
2015 stored in the current function's frame. */
2016 if (!call_from_thunk_p && DECL_P (base) && !TREE_STATIC (base))
2018 *may_tailcall = false;
2019 maybe_complain_about_tail_call (exp,
2020 "a callee-copied argument is"
2021 " stored in the current"
2022 " function's frame");
2025 args[i].tree_value = build_fold_addr_expr_loc (loc,
2026 args[i].tree_value);
2027 type = TREE_TYPE (args[i].tree_value);
2029 if (*ecf_flags & ECF_CONST)
2030 *ecf_flags &= ~(ECF_CONST | ECF_LOOPING_CONST_OR_PURE);
2032 else
2034 /* We make a copy of the object and pass the address to the
2035 function being called. */
2036 rtx copy;
2038 if (!COMPLETE_TYPE_P (type)
2039 || TREE_CODE (TYPE_SIZE_UNIT (type)) != INTEGER_CST
2040 || (flag_stack_check == GENERIC_STACK_CHECK
2041 && compare_tree_int (TYPE_SIZE_UNIT (type),
2042 STACK_CHECK_MAX_VAR_SIZE) > 0))
2044 /* This is a variable-sized object. Make space on the stack
2045 for it. */
2046 rtx size_rtx = expr_size (args[i].tree_value);
2048 if (*old_stack_level == 0)
2050 emit_stack_save (SAVE_BLOCK, old_stack_level);
2051 *old_pending_adj = pending_stack_adjust;
2052 pending_stack_adjust = 0;
2055 /* We can pass TRUE as the 4th argument because we just
2056 saved the stack pointer and will restore it right after
2057 the call. */
2058 copy = allocate_dynamic_stack_space (size_rtx,
2059 TYPE_ALIGN (type),
2060 TYPE_ALIGN (type),
2061 max_int_size_in_bytes
2062 (type),
2063 true);
2064 copy = gen_rtx_MEM (BLKmode, copy);
2065 set_mem_attributes (copy, type, 1);
2067 else
2068 copy = assign_temp (type, 1, 0);
2070 store_expr (args[i].tree_value, copy, 0, false, false);
2072 /* Just change the const function to pure and then let
2073 the next test clear the pure based on
2074 callee_copies. */
2075 if (*ecf_flags & ECF_CONST)
2077 *ecf_flags &= ~ECF_CONST;
2078 *ecf_flags |= ECF_PURE;
2081 if (!callee_copies && *ecf_flags & ECF_PURE)
2082 *ecf_flags &= ~(ECF_PURE | ECF_LOOPING_CONST_OR_PURE);
2084 args[i].tree_value
2085 = build_fold_addr_expr_loc (loc, make_tree (type, copy));
2086 type = TREE_TYPE (args[i].tree_value);
2087 *may_tailcall = false;
2088 maybe_complain_about_tail_call (exp,
2089 "argument must be passed"
2090 " by copying");
2094 unsignedp = TYPE_UNSIGNED (type);
2095 mode = promote_function_mode (type, TYPE_MODE (type), &unsignedp,
2096 fndecl ? TREE_TYPE (fndecl) : fntype, 0);
2098 args[i].unsignedp = unsignedp;
2099 args[i].mode = mode;
2101 targetm.calls.warn_parameter_passing_abi (args_so_far, type);
2103 args[i].reg = targetm.calls.function_arg (args_so_far, mode, type,
2104 argpos < n_named_args);
2106 if (args[i].reg && CONST_INT_P (args[i].reg))
2108 args[i].special_slot = args[i].reg;
2109 args[i].reg = NULL;
2112 /* If this is a sibling call and the machine has register windows, the
2113 register window has to be unwound before calling the routine, so
2114 arguments have to go into the incoming registers. */
2115 if (targetm.calls.function_incoming_arg != targetm.calls.function_arg)
2116 args[i].tail_call_reg
2117 = targetm.calls.function_incoming_arg (args_so_far, mode, type,
2118 argpos < n_named_args);
2119 else
2120 args[i].tail_call_reg = args[i].reg;
2122 if (args[i].reg)
2123 args[i].partial
2124 = targetm.calls.arg_partial_bytes (args_so_far, mode, type,
2125 argpos < n_named_args);
2127 args[i].pass_on_stack = targetm.calls.must_pass_in_stack (mode, type);
2129 /* If FUNCTION_ARG returned a (parallel [(expr_list (nil) ...) ...]),
2130 it means that we are to pass this arg in the register(s) designated
2131 by the PARALLEL, but also to pass it in the stack. */
2132 if (args[i].reg && GET_CODE (args[i].reg) == PARALLEL
2133 && XEXP (XVECEXP (args[i].reg, 0, 0), 0) == 0)
2134 args[i].pass_on_stack = 1;
2136 /* If this is an addressable type, we must preallocate the stack
2137 since we must evaluate the object into its final location.
2139 If this is to be passed in both registers and the stack, it is simpler
2140 to preallocate. */
2141 if (TREE_ADDRESSABLE (type)
2142 || (args[i].pass_on_stack && args[i].reg != 0))
2143 *must_preallocate = 1;
2145 /* Compute the stack-size of this argument. */
2146 if (args[i].reg == 0 || args[i].partial != 0
2147 || reg_parm_stack_space > 0
2148 || args[i].pass_on_stack)
2149 locate_and_pad_parm (mode, type,
2150 #ifdef STACK_PARMS_IN_REG_PARM_AREA
2151 1,
2152 #else
2153 args[i].reg != 0,
2154 #endif
2155 reg_parm_stack_space,
2156 args[i].pass_on_stack ? 0 : args[i].partial,
2157 fndecl, args_size, &args[i].locate);
2158 #ifdef BLOCK_REG_PADDING
2159 else
2160 /* The argument is passed entirely in registers. See at which
2161 end it should be padded. */
2162 args[i].locate.where_pad =
2163 BLOCK_REG_PADDING (mode, type,
2164 int_size_in_bytes (type) <= UNITS_PER_WORD);
2165 #endif
2167 /* Update ARGS_SIZE, the total stack space for args so far. */
2169 args_size->constant += args[i].locate.size.constant;
2170 if (args[i].locate.size.var)
2171 ADD_PARM_SIZE (*args_size, args[i].locate.size.var);
2173 /* Increment ARGS_SO_FAR, which has info about which arg-registers
2174 have been used, etc. */
2176 targetm.calls.function_arg_advance (args_so_far, TYPE_MODE (type),
2177 type, argpos < n_named_args);
2179 /* Store argument values for functions decorated with attribute
2180 alloc_size. */
2181 if (argpos == alloc_idx[0])
2182 alloc_args[0] = args[i].tree_value;
2183 else if (argpos == alloc_idx[1])
2184 alloc_args[1] = args[i].tree_value;
2187 if (alloc_args[0])
2189 /* Check the arguments of functions decorated with attribute
2190 alloc_size. */
2191 maybe_warn_alloc_args_overflow (fndecl, exp, alloc_args, alloc_idx);
2194 /* Detect passing non-string arguments to functions expecting
2195 nul-terminated strings. */
2196 maybe_warn_nonstring_arg (fndecl, exp);
2199 /* Update ARGS_SIZE to contain the total size for the argument block.
2200 Return the original constant component of the argument block's size.
2202 REG_PARM_STACK_SPACE holds the number of bytes of stack space reserved
2203 for arguments passed in registers. */
2205 static poly_int64
2206 compute_argument_block_size (int reg_parm_stack_space,
2207 struct args_size *args_size,
2208 tree fndecl ATTRIBUTE_UNUSED,
2209 tree fntype ATTRIBUTE_UNUSED,
2210 int preferred_stack_boundary ATTRIBUTE_UNUSED)
2212 poly_int64 unadjusted_args_size = args_size->constant;
2214 /* For accumulate outgoing args mode we don't need to align, since the frame
2215 will be already aligned. Align to STACK_BOUNDARY in order to prevent
2216 backends from generating misaligned frame sizes. */
2217 if (ACCUMULATE_OUTGOING_ARGS && preferred_stack_boundary > STACK_BOUNDARY)
2218 preferred_stack_boundary = STACK_BOUNDARY;
2220 /* Compute the actual size of the argument block required. The variable
2221 and constant sizes must be combined, the size may have to be rounded,
2222 and there may be a minimum required size. */
2224 if (args_size->var)
2226 args_size->var = ARGS_SIZE_TREE (*args_size);
2227 args_size->constant = 0;
2229 preferred_stack_boundary /= BITS_PER_UNIT;
2230 if (preferred_stack_boundary > 1)
2232 /* We don't handle this case yet. To handle it correctly we have
2233 to add the delta, round and subtract the delta.
2234 Currently no machine description requires this support. */
2235 gcc_assert (multiple_p (stack_pointer_delta,
2236 preferred_stack_boundary));
2237 args_size->var = round_up (args_size->var, preferred_stack_boundary);
2240 if (reg_parm_stack_space > 0)
2242 args_size->var
2243 = size_binop (MAX_EXPR, args_size->var,
2244 ssize_int (reg_parm_stack_space));
2246 /* The area corresponding to register parameters is not to count in
2247 the size of the block we need. So make the adjustment. */
2248 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? fntype : TREE_TYPE (fndecl))))
2249 args_size->var
2250 = size_binop (MINUS_EXPR, args_size->var,
2251 ssize_int (reg_parm_stack_space));
2254 else
2256 preferred_stack_boundary /= BITS_PER_UNIT;
2257 if (preferred_stack_boundary < 1)
2258 preferred_stack_boundary = 1;
2259 args_size->constant = (aligned_upper_bound (args_size->constant
2260 + stack_pointer_delta,
2261 preferred_stack_boundary)
2262 - stack_pointer_delta);
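/* Editorial worked example (constant sizes only): with
   args_size->constant == 20, stack_pointer_delta == 0 and a preferred
   boundary of 16 bytes, aligned_upper_bound (20, 16) yields 32, so the
   argument block is padded from 20 to 32 bytes and the stack pointer
   stays aligned across the call.  */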
2264 args_size->constant = upper_bound (args_size->constant,
2265 reg_parm_stack_space);
2267 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? fntype : TREE_TYPE (fndecl))))
2268 args_size->constant -= reg_parm_stack_space;
2270 return unadjusted_args_size;
2273 /* Precompute parameters as needed for a function call.
2275 FLAGS is mask of ECF_* constants.
2277 NUM_ACTUALS is the number of arguments.
2279 ARGS is an array containing information for each argument; this
2280 routine fills in the INITIAL_VALUE and VALUE fields for each
2281 precomputed argument. */
2283 static void
2284 precompute_arguments (int num_actuals, struct arg_data *args)
2286 int i;
2288 /* If this is a libcall, then precompute all arguments so that we do not
2289 get extraneous instructions emitted as part of the libcall sequence. */
2291 /* If we preallocated the stack space, and some arguments must be passed
2292 on the stack, then we must precompute any parameter which contains a
2293 function call which will store arguments on the stack.
2294 Otherwise, evaluating the parameter may clobber previous parameters
2295 which have already been stored into the stack. (we have code to avoid
2296 such a case by saving the outgoing stack arguments, but it results in
2297 worse code) */
2298 if (!ACCUMULATE_OUTGOING_ARGS)
2299 return;
2301 for (i = 0; i < num_actuals; i++)
2303 tree type;
2304 machine_mode mode;
2306 if (TREE_CODE (args[i].tree_value) != CALL_EXPR)
2307 continue;
2309 /* If this is an addressable type, we cannot pre-evaluate it. */
2310 type = TREE_TYPE (args[i].tree_value);
2311 gcc_assert (!TREE_ADDRESSABLE (type));
2313 args[i].initial_value = args[i].value
2314 = expand_normal (args[i].tree_value);
2316 mode = TYPE_MODE (type);
2317 if (mode != args[i].mode)
2319 int unsignedp = args[i].unsignedp;
2320 args[i].value
2321 = convert_modes (args[i].mode, mode,
2322 args[i].value, args[i].unsignedp);
2324 /* CSE will replace this only if it contains args[i].value
2325 pseudo, so convert it down to the declared mode using
2326 a SUBREG. */
2327 if (REG_P (args[i].value)
2328 && GET_MODE_CLASS (args[i].mode) == MODE_INT
2329 && promote_mode (type, mode, &unsignedp) != args[i].mode)
2331 args[i].initial_value
2332 = gen_lowpart_SUBREG (mode, args[i].value);
2333 SUBREG_PROMOTED_VAR_P (args[i].initial_value) = 1;
2334 SUBREG_PROMOTED_SET (args[i].initial_value, args[i].unsignedp);
2340 /* Given the current state of MUST_PREALLOCATE and information about
2341 arguments to a function call in NUM_ACTUALS, ARGS and ARGS_SIZE,
2342 compute and return the final value for MUST_PREALLOCATE. */
2344 static int
2345 finalize_must_preallocate (int must_preallocate, int num_actuals,
2346 struct arg_data *args, struct args_size *args_size)
2348 /* See if we have or want to preallocate stack space.
2350 If we would have to push a partially-in-regs parm
2351 before other stack parms, preallocate stack space instead.
2353 If the size of some parm is not a multiple of the required stack
2354 alignment, we must preallocate.
2356 If the total size of arguments that would otherwise create a copy in
2357 a temporary (such as a CALL) is more than half the total argument list
2358 size, preallocation is faster.
2360 Another reason to preallocate is if we have a machine (like the m88k)
2361 where stack alignment is required to be maintained between every
2362 pair of insns, not just when the call is made. However, we assume here
2363 that such machines either do not have push insns (and hence preallocation
2364 would occur anyway) or the problem is taken care of with
2365 PUSH_ROUNDING. */
2367 if (! must_preallocate)
2369 int partial_seen = 0;
2370 poly_int64 copy_to_evaluate_size = 0;
2371 int i;
2373 for (i = 0; i < num_actuals && ! must_preallocate; i++)
2375 if (args[i].partial > 0 && ! args[i].pass_on_stack)
2376 partial_seen = 1;
2377 else if (partial_seen && args[i].reg == 0)
2378 must_preallocate = 1;
2380 if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode
2381 && (TREE_CODE (args[i].tree_value) == CALL_EXPR
2382 || TREE_CODE (args[i].tree_value) == TARGET_EXPR
2383 || TREE_CODE (args[i].tree_value) == COND_EXPR
2384 || TREE_ADDRESSABLE (TREE_TYPE (args[i].tree_value))))
2385 copy_to_evaluate_size
2386 += int_size_in_bytes (TREE_TYPE (args[i].tree_value));
2389 if (maybe_ne (args_size->constant, 0)
2390 && maybe_ge (copy_to_evaluate_size * 2, args_size->constant))
2391 must_preallocate = 1;
2393 return must_preallocate;
2396 /* If we preallocated stack space, compute the address of each argument
2397 and store it into the ARGS array.
2399 We need not ensure it is a valid memory address here; it will be
2400 validized when it is used.
2402 ARGBLOCK is an rtx for the address of the outgoing arguments. */
2404 static void
2405 compute_argument_addresses (struct arg_data *args, rtx argblock, int num_actuals)
2407 if (argblock)
2409 rtx arg_reg = argblock;
2410 int i;
2411 poly_int64 arg_offset = 0;
2413 if (GET_CODE (argblock) == PLUS)
2415 arg_reg = XEXP (argblock, 0);
2416 arg_offset = rtx_to_poly_int64 (XEXP (argblock, 1));
2419 for (i = 0; i < num_actuals; i++)
2421 rtx offset = ARGS_SIZE_RTX (args[i].locate.offset);
2422 rtx slot_offset = ARGS_SIZE_RTX (args[i].locate.slot_offset);
2423 rtx addr;
2424 unsigned int align, boundary;
2425 poly_uint64 units_on_stack = 0;
2426 machine_mode partial_mode = VOIDmode;
2428 /* Skip this parm if it will not be passed on the stack. */
2429 if (! args[i].pass_on_stack
2430 && args[i].reg != 0
2431 && args[i].partial == 0)
2432 continue;
2434 if (TYPE_EMPTY_P (TREE_TYPE (args[i].tree_value)))
2435 continue;
2437 addr = simplify_gen_binary (PLUS, Pmode, arg_reg, offset);
2438 addr = plus_constant (Pmode, addr, arg_offset);
2440 if (args[i].partial != 0)
2442 /* Only part of the parameter is being passed on the stack.
2443 Generate a simple memory reference of the correct size. */
2444 units_on_stack = args[i].locate.size.constant;
2445 poly_uint64 bits_on_stack = units_on_stack * BITS_PER_UNIT;
2446 partial_mode = int_mode_for_size (bits_on_stack, 1).else_blk ();
2447 args[i].stack = gen_rtx_MEM (partial_mode, addr);
2448 set_mem_size (args[i].stack, units_on_stack);
2450 else
2452 args[i].stack = gen_rtx_MEM (args[i].mode, addr);
2453 set_mem_attributes (args[i].stack,
2454 TREE_TYPE (args[i].tree_value), 1);
2456 align = BITS_PER_UNIT;
2457 boundary = args[i].locate.boundary;
2458 poly_int64 offset_val;
2459 if (args[i].locate.where_pad != PAD_DOWNWARD)
2460 align = boundary;
2461 else if (poly_int_rtx_p (offset, &offset_val))
2463 align = least_bit_hwi (boundary);
2464 unsigned int offset_align
2465 = known_alignment (offset_val) * BITS_PER_UNIT;
2466 if (offset_align != 0)
2467 align = MIN (align, offset_align);
2469 set_mem_align (args[i].stack, align);
2471 addr = simplify_gen_binary (PLUS, Pmode, arg_reg, slot_offset);
2472 addr = plus_constant (Pmode, addr, arg_offset);
2474 if (args[i].partial != 0)
2476 /* Only part of the parameter is being passed on the stack.
2477 Generate a simple memory reference of the correct size.
2478 */
2479 args[i].stack_slot = gen_rtx_MEM (partial_mode, addr);
2480 set_mem_size (args[i].stack_slot, units_on_stack);
2482 else
2484 args[i].stack_slot = gen_rtx_MEM (args[i].mode, addr);
2485 set_mem_attributes (args[i].stack_slot,
2486 TREE_TYPE (args[i].tree_value), 1);
2488 set_mem_align (args[i].stack_slot, args[i].locate.boundary);
2490 /* Function incoming arguments may overlap with sibling call
2491 outgoing arguments and we cannot allow reordering of reads
2492 from function arguments with stores to outgoing arguments
2493 of sibling calls. */
2494 set_mem_alias_set (args[i].stack, 0);
2495 set_mem_alias_set (args[i].stack_slot, 0);
2500 /* Given a FNDECL and EXP, return an rtx suitable for use as a target address
2501 in a call instruction.
2503 FNDECL is the tree node for the target function. For an indirect call
2504 FNDECL will be NULL_TREE.
2506 ADDR is the operand 0 of CALL_EXPR for this call. */
2508 static rtx
2509 rtx_for_function_call (tree fndecl, tree addr)
2511 rtx funexp;
2513 /* Get the function to call, in the form of RTL. */
2514 if (fndecl)
2516 if (!TREE_USED (fndecl) && fndecl != current_function_decl)
2517 TREE_USED (fndecl) = 1;
2519 /* Get a SYMBOL_REF rtx for the function address. */
2520 funexp = XEXP (DECL_RTL (fndecl), 0);
2522 else
2523 /* Generate an rtx (probably a pseudo-register) for the address. */
2525 push_temp_slots ();
2526 funexp = expand_normal (addr);
2527 pop_temp_slots (); /* FUNEXP can't be BLKmode. */
2529 return funexp;
2532 /* Return the static chain for this function, if any. */
2535 rtx_for_static_chain (const_tree fndecl_or_type, bool incoming_p)
2537 if (DECL_P (fndecl_or_type) && !DECL_STATIC_CHAIN (fndecl_or_type))
2538 return NULL;
2540 return targetm.calls.static_chain (fndecl_or_type, incoming_p);
2543 /* Internal state for internal_arg_pointer_based_exp and its helpers. */
2544 static struct
2546 /* Last insn that has been scanned by internal_arg_pointer_based_exp_scan,
2547 or NULL_RTX if none has been scanned yet. */
2548 rtx_insn *scan_start;
2549 /* Vector indexed by REGNO - FIRST_PSEUDO_REGISTER, recording if a pseudo is
2550 based on crtl->args.internal_arg_pointer. The element is NULL_RTX if the
2551 pseudo isn't based on it, a CONST_INT offset if the pseudo is based on it
2552 with fixed offset, or PC if this is with variable or unknown offset. */
2553 vec<rtx> cache;
2554 } internal_arg_pointer_exp_state;
2556 static rtx internal_arg_pointer_based_exp (const_rtx, bool);
2558 /* Helper function for internal_arg_pointer_based_exp. Scan insns in
2559 the tail call sequence, starting with first insn that hasn't been
2560 scanned yet, and note for each pseudo on the LHS whether it is based
2561 on crtl->args.internal_arg_pointer or not, and what offset from that
2562 that pointer it has. */
2564 static void
2565 internal_arg_pointer_based_exp_scan (void)
2567 rtx_insn *insn, *scan_start = internal_arg_pointer_exp_state.scan_start;
2569 if (scan_start == NULL_RTX)
2570 insn = get_insns ();
2571 else
2572 insn = NEXT_INSN (scan_start);
2574 while (insn)
2576 rtx set = single_set (insn);
2577 if (set && REG_P (SET_DEST (set)) && !HARD_REGISTER_P (SET_DEST (set)))
2579 rtx val = NULL_RTX;
2580 unsigned int idx = REGNO (SET_DEST (set)) - FIRST_PSEUDO_REGISTER;
2581 /* Punt on pseudos set multiple times. */
2582 if (idx < internal_arg_pointer_exp_state.cache.length ()
2583 && (internal_arg_pointer_exp_state.cache[idx]
2584 != NULL_RTX))
2585 val = pc_rtx;
2586 else
2587 val = internal_arg_pointer_based_exp (SET_SRC (set), false);
2588 if (val != NULL_RTX)
2590 if (idx >= internal_arg_pointer_exp_state.cache.length ())
2591 internal_arg_pointer_exp_state.cache
2592 .safe_grow_cleared (idx + 1);
2593 internal_arg_pointer_exp_state.cache[idx] = val;
2596 if (NEXT_INSN (insn) == NULL_RTX)
2597 scan_start = insn;
2598 insn = NEXT_INSN (insn);
2601 internal_arg_pointer_exp_state.scan_start = scan_start;
2604 /* Compute whether RTL is based on crtl->args.internal_arg_pointer. Return
2605 NULL_RTX if RTL isn't based on it, a CONST_INT offset if RTL is based on
2606 it with fixed offset, or PC if this is with variable or unknown offset.
2607 TOPLEVEL is true if the function is invoked at the topmost level. */
2609 static rtx
2610 internal_arg_pointer_based_exp (const_rtx rtl, bool toplevel)
2612 if (CONSTANT_P (rtl))
2613 return NULL_RTX;
2615 if (rtl == crtl->args.internal_arg_pointer)
2616 return const0_rtx;
2618 if (REG_P (rtl) && HARD_REGISTER_P (rtl))
2619 return NULL_RTX;
2621 poly_int64 offset;
2622 if (GET_CODE (rtl) == PLUS && poly_int_rtx_p (XEXP (rtl, 1), &offset))
2624 rtx val = internal_arg_pointer_based_exp (XEXP (rtl, 0), toplevel);
2625 if (val == NULL_RTX || val == pc_rtx)
2626 return val;
2627 return plus_constant (Pmode, val, offset);
2630 /* When called at the topmost level, scan pseudo assignments in between the
2631 last scanned instruction in the tail call sequence and the latest insn
2632 in that sequence. */
2633 if (toplevel)
2634 internal_arg_pointer_based_exp_scan ();
2636 if (REG_P (rtl))
2638 unsigned int idx = REGNO (rtl) - FIRST_PSEUDO_REGISTER;
2639 if (idx < internal_arg_pointer_exp_state.cache.length ())
2640 return internal_arg_pointer_exp_state.cache[idx];
2642 return NULL_RTX;
2645 subrtx_iterator::array_type array;
2646 FOR_EACH_SUBRTX (iter, array, rtl, NONCONST)
2648 const_rtx x = *iter;
2649 if (REG_P (x) && internal_arg_pointer_based_exp (x, false) != NULL_RTX)
2650 return pc_rtx;
2651 if (MEM_P (x))
2652 iter.skip_subrtxes ();
2655 return NULL_RTX;
2658 /* Return true if SIZE bytes starting from address ADDR might overlap an
2659 already-clobbered argument area. This function is used to determine
2660 if we should give up a sibcall. */
2662 static bool
2663 mem_might_overlap_already_clobbered_arg_p (rtx addr, poly_uint64 size)
2665 poly_int64 i;
2666 unsigned HOST_WIDE_INT start, end;
2667 rtx val;
2669 if (bitmap_empty_p (stored_args_map)
2670 && stored_args_watermark == HOST_WIDE_INT_M1U)
2671 return false;
2672 val = internal_arg_pointer_based_exp (addr, true);
2673 if (val == NULL_RTX)
2674 return false;
2675 else if (!poly_int_rtx_p (val, &i))
2676 return true;
2678 if (known_eq (size, 0U))
2679 return false;
2681 if (STACK_GROWS_DOWNWARD)
2682 i -= crtl->args.pretend_args_size;
2683 else
2684 i += crtl->args.pretend_args_size;
2686 if (ARGS_GROW_DOWNWARD)
2687 i = -i - size;
2689 /* We can ignore any references to the function's pretend args,
2690 which at this point would manifest as negative values of I. */
2691 if (known_le (i, 0) && known_le (size, poly_uint64 (-i)))
2692 return false;
2694 start = maybe_lt (i, 0) ? 0 : constant_lower_bound (i);
2695 if (!(i + size).is_constant (&end))
2696 end = HOST_WIDE_INT_M1U;
2698 if (end > stored_args_watermark)
2699 return true;
2701 end = MIN (end, SBITMAP_SIZE (stored_args_map));
2702 for (unsigned HOST_WIDE_INT k = start; k < end; ++k)
2703 if (bitmap_bit_p (stored_args_map, k))
2704 return true;
2706 return false;
2709 /* Do the register loads required for any wholly-register parms or any
2710 parms which are passed both on the stack and in a register. Their
2711 expressions were already evaluated.
2713 Mark all register-parms as living through the call, putting these USE
2714 insns in the CALL_INSN_FUNCTION_USAGE field.
2716 When IS_SIBCALL, perform the check_sibcall_argument_overlap
2717 checking, setting *SIBCALL_FAILURE if appropriate. */
2719 static void
2720 load_register_parameters (struct arg_data *args, int num_actuals,
2721 rtx *call_fusage, int flags, int is_sibcall,
2722 int *sibcall_failure)
2724 int i, j;
2726 for (i = 0; i < num_actuals; i++)
2728 rtx reg = ((flags & ECF_SIBCALL)
2729 ? args[i].tail_call_reg : args[i].reg);
2730 if (reg)
2732 int partial = args[i].partial;
2733 int nregs;
2734 poly_int64 size = 0;
2735 HOST_WIDE_INT const_size = 0;
2736 rtx_insn *before_arg = get_last_insn ();
2737 /* Set non-negative if we must move a word at a time, even if
2738 just one word (e.g., partial == 4 && mode == DFmode). Set
2739 to -1 if we just use a normal move insn. This value can be
2740 zero if the argument is a zero size structure. */
2741 nregs = -1;
2742 if (GET_CODE (reg) == PARALLEL)
2744 else if (partial)
2746 gcc_assert (partial % UNITS_PER_WORD == 0);
2747 nregs = partial / UNITS_PER_WORD;
2749 else if (TYPE_MODE (TREE_TYPE (args[i].tree_value)) == BLKmode)
2751 /* Variable-sized parameters should be described by a
2752 PARALLEL instead. */
2753 const_size = int_size_in_bytes (TREE_TYPE (args[i].tree_value));
2754 gcc_assert (const_size >= 0);
2755 nregs = (const_size + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD;
2756 size = const_size;
2758 else
2759 size = GET_MODE_SIZE (args[i].mode);
2761 /* Handle calls that pass values in multiple non-contiguous
2762 locations. The Irix 6 ABI has examples of this. */
2764 if (GET_CODE (reg) == PARALLEL)
2765 emit_group_move (reg, args[i].parallel_value);
2767 /* If simple case, just do move. If normal partial, store_one_arg
2768 has already loaded the register for us. In all other cases,
2769 load the register(s) from memory. */
2771 else if (nregs == -1)
2773 emit_move_insn (reg, args[i].value);
2774 #ifdef BLOCK_REG_PADDING
2775 /* Handle case where we have a value that needs shifting
2776 up to the msb, e.g. a QImode value and we're padding
2777 upward on a BYTES_BIG_ENDIAN machine. */
2778 if (args[i].locate.where_pad
2779 == (BYTES_BIG_ENDIAN ? PAD_UPWARD : PAD_DOWNWARD))
2781 gcc_checking_assert (ordered_p (size, UNITS_PER_WORD));
2782 if (maybe_lt (size, UNITS_PER_WORD))
2784 rtx x;
2785 poly_int64 shift
2786 = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
2788 /* Assigning REG here rather than a temp makes
2789 CALL_FUSAGE report the whole reg as used.
2790 Strictly speaking, the call only uses SIZE
2791 bytes at the msb end, but it doesn't seem worth
2792 generating rtl to say that. */
2793 reg = gen_rtx_REG (word_mode, REGNO (reg));
2794 x = expand_shift (LSHIFT_EXPR, word_mode,
2795 reg, shift, reg, 1);
2796 if (x != reg)
2797 emit_move_insn (reg, x);
2800 #endif
2803 /* If we have pre-computed the values to put in the registers in
2804 the case of non-aligned structures, copy them in now. */
2806 else if (args[i].n_aligned_regs != 0)
2807 for (j = 0; j < args[i].n_aligned_regs; j++)
2808 emit_move_insn (gen_rtx_REG (word_mode, REGNO (reg) + j),
2809 args[i].aligned_regs[j]);
2811 else if (partial == 0 || args[i].pass_on_stack)
2813 /* SIZE and CONST_SIZE are 0 for partial arguments and
2814 the size of a BLKmode type otherwise. */
2815 gcc_checking_assert (known_eq (size, const_size));
2816 rtx mem = validize_mem (copy_rtx (args[i].value));
2818 /* Check for overlap with already clobbered argument area,
2819 providing that this has non-zero size. */
2820 if (is_sibcall
2821 && const_size != 0
2822 && (mem_might_overlap_already_clobbered_arg_p
2823 (XEXP (args[i].value, 0), const_size)))
2824 *sibcall_failure = 1;
2826 if (const_size % UNITS_PER_WORD == 0
2827 || MEM_ALIGN (mem) % BITS_PER_WORD == 0)
2828 move_block_to_reg (REGNO (reg), mem, nregs, args[i].mode);
2829 else
2831 if (nregs > 1)
2832 move_block_to_reg (REGNO (reg), mem, nregs - 1,
2833 args[i].mode);
2834 rtx dest = gen_rtx_REG (word_mode, REGNO (reg) + nregs - 1);
2835 unsigned int bitoff = (nregs - 1) * BITS_PER_WORD;
2836 unsigned int bitsize = const_size * BITS_PER_UNIT - bitoff;
2837 rtx x = extract_bit_field (mem, bitsize, bitoff, 1, dest,
2838 word_mode, word_mode, false,
2839 NULL);
2840 if (BYTES_BIG_ENDIAN)
2841 x = expand_shift (LSHIFT_EXPR, word_mode, x,
2842 BITS_PER_WORD - bitsize, dest, 1);
2843 if (x != dest)
2844 emit_move_insn (dest, x);
2847 /* Handle a BLKmode that needs shifting. */
2848 if (nregs == 1 && const_size < UNITS_PER_WORD
2849 #ifdef BLOCK_REG_PADDING
2850 && args[i].locate.where_pad == PAD_DOWNWARD
2851 #else
2852 && BYTES_BIG_ENDIAN
2853 #endif
2856 rtx dest = gen_rtx_REG (word_mode, REGNO (reg));
2857 int shift = (UNITS_PER_WORD - const_size) * BITS_PER_UNIT;
2858 enum tree_code dir = (BYTES_BIG_ENDIAN
2859 ? RSHIFT_EXPR : LSHIFT_EXPR);
2860 rtx x;
2862 x = expand_shift (dir, word_mode, dest, shift, dest, 1);
2863 if (x != dest)
2864 emit_move_insn (dest, x);
2868 /* When a parameter is a block, and perhaps in other cases, it is
2869 possible that it did a load from an argument slot that was
2870 already clobbered. */
2871 if (is_sibcall
2872 && check_sibcall_argument_overlap (before_arg, &args[i], 0))
2873 *sibcall_failure = 1;
2875 /* Handle calls that pass values in multiple non-contiguous
2876 locations. The Irix 6 ABI has examples of this. */
2877 if (GET_CODE (reg) == PARALLEL)
2878 use_group_regs (call_fusage, reg);
2879 else if (nregs == -1)
2880 use_reg_mode (call_fusage, reg,
2881 TYPE_MODE (TREE_TYPE (args[i].tree_value)));
2882 else if (nregs > 0)
2883 use_regs (call_fusage, REGNO (reg), nregs);
2888 /* We need to pop PENDING_STACK_ADJUST bytes. But, if the arguments
2889 wouldn't fill up an even multiple of PREFERRED_UNIT_STACK_BOUNDARY
2890 bytes, then we would need to push some additional bytes to pad the
2891 arguments. So, we try to compute an adjustment to the stack pointer for an
2892 amount that will leave the stack under-aligned by UNADJUSTED_ARGS_SIZE
2893 bytes. Then, when the arguments are pushed the stack will be perfectly
2894 aligned.
2896 Return true if this optimization is possible, storing the adjustment
2897 in ADJUSTMENT_OUT and setting ARGS_SIZE->CONSTANT to the number of
2898 bytes that should be popped after the call. */
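/* Editorial worked example (constant sizes only): with a 16-byte
   preferred boundary, PENDING_STACK_ADJUST == 64, 4 bytes of new
   arguments and an already aligned stack pointer, the adjustment
   applied now is 64 - (16 - 4) == 52 bytes; pushing the 4 argument
   bytes then leaves the stack 16-byte aligned again, and
   ARGS_SIZE->CONSTANT becomes 64 - 52 + 4 == 16, the number of bytes
   popped after the call.  */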
2900 static bool
2901 combine_pending_stack_adjustment_and_call (poly_int64_pod *adjustment_out,
2902 poly_int64 unadjusted_args_size,
2903 struct args_size *args_size,
2904 unsigned int preferred_unit_stack_boundary)
2906 /* The number of bytes to pop so that the stack will be
2907 under-aligned by UNADJUSTED_ARGS_SIZE bytes. */
2908 poly_int64 adjustment;
2909 /* The alignment of the stack after the arguments are pushed, if we
2910 just pushed the arguments without adjusting the stack here. */
2911 unsigned HOST_WIDE_INT unadjusted_alignment;
2913 if (!known_misalignment (stack_pointer_delta + unadjusted_args_size,
2914 preferred_unit_stack_boundary,
2915 &unadjusted_alignment))
2916 return false;
2918 /* We want to get rid of as many of the PENDING_STACK_ADJUST bytes
2919 as possible -- leaving just enough left to cancel out the
2920 UNADJUSTED_ALIGNMENT. In other words, we want to ensure that the
2921 PENDING_STACK_ADJUST is non-negative, and congruent to
2922 -UNADJUSTED_ALIGNMENT modulo the PREFERRED_UNIT_STACK_BOUNDARY. */
2924 /* Begin by trying to pop all the bytes. */
2925 unsigned HOST_WIDE_INT tmp_misalignment;
2926 if (!known_misalignment (pending_stack_adjust,
2927 preferred_unit_stack_boundary,
2928 &tmp_misalignment))
2929 return false;
2930 unadjusted_alignment -= tmp_misalignment;
2931 adjustment = pending_stack_adjust;
2932 /* Push enough additional bytes that the stack will be aligned
2933 after the arguments are pushed. */
2934 if (preferred_unit_stack_boundary > 1 && unadjusted_alignment)
2935 adjustment -= preferred_unit_stack_boundary - unadjusted_alignment;
2937 /* We need to know whether the adjusted argument size
2938 (UNADJUSTED_ARGS_SIZE - ADJUSTMENT) constitutes an allocation
2939 or a deallocation. */
2940 if (!ordered_p (adjustment, unadjusted_args_size))
2941 return false;
2943 /* Now, set ARGS_SIZE->CONSTANT so that we pop the right number of
2944 bytes after the call. The right number is the entire
2945 PENDING_STACK_ADJUST less our ADJUSTMENT plus the amount required
2946 by the arguments in the first place. */
2947 args_size->constant
2948 = pending_stack_adjust - adjustment + unadjusted_args_size;
2950 *adjustment_out = adjustment;
2951 return true;
2954 /* Scan expression X to see whether it dereferences any argument slots
2955 already clobbered by tail call arguments (as noted in the stored_args_map
2956 bitmap).
2957 Return nonzero if X dereferences such an argument slot,
2958 zero otherwise. */
2960 static int
2961 check_sibcall_argument_overlap_1 (rtx x)
2963 RTX_CODE code;
2964 int i, j;
2965 const char *fmt;
2967 if (x == NULL_RTX)
2968 return 0;
2970 code = GET_CODE (x);
2972 /* We need not check the operands of the CALL expression itself. */
2973 if (code == CALL)
2974 return 0;
2976 if (code == MEM)
2977 return (mem_might_overlap_already_clobbered_arg_p
2978 (XEXP (x, 0), GET_MODE_SIZE (GET_MODE (x))));
2980 /* Scan all subexpressions. */
2981 fmt = GET_RTX_FORMAT (code);
2982 for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
2984 if (*fmt == 'e')
2986 if (check_sibcall_argument_overlap_1 (XEXP (x, i)))
2987 return 1;
2989 else if (*fmt == 'E')
2991 for (j = 0; j < XVECLEN (x, i); j++)
2992 if (check_sibcall_argument_overlap_1 (XVECEXP (x, i, j)))
2993 return 1;
2996 return 0;
2999 /* Scan the sequence after INSN to see whether it dereferences any argument
3000 slots already clobbered by tail call arguments (as noted in the
3001 stored_args_map bitmap). If MARK_STORED_ARGS_MAP, afterwards add the stack
3002 slots for ARG to the stored_args_map bitmap (when ARG is a register,
3003 MARK_STORED_ARGS_MAP should be 0). Return nonzero if the sequence after INSN
3004 dereferences such argument slots, zero otherwise. */
3006 static int
3007 check_sibcall_argument_overlap (rtx_insn *insn, struct arg_data *arg,
3008 int mark_stored_args_map)
3010 poly_uint64 low, high;
3011 unsigned HOST_WIDE_INT const_low, const_high;
3013 if (insn == NULL_RTX)
3014 insn = get_insns ();
3015 else
3016 insn = NEXT_INSN (insn);
3018 for (; insn; insn = NEXT_INSN (insn))
3019 if (INSN_P (insn)
3020 && check_sibcall_argument_overlap_1 (PATTERN (insn)))
3021 break;
3023 if (mark_stored_args_map)
3025 if (ARGS_GROW_DOWNWARD)
3026 low = -arg->locate.slot_offset.constant - arg->locate.size.constant;
3027 else
3028 low = arg->locate.slot_offset.constant;
3029 high = low + arg->locate.size.constant;
3031 const_low = constant_lower_bound (low);
3032 if (high.is_constant (&const_high))
3033 for (unsigned HOST_WIDE_INT i = const_low; i < const_high; ++i)
3034 bitmap_set_bit (stored_args_map, i);
3035 else
3036 stored_args_watermark = MIN (stored_args_watermark, const_low);
3038 return insn != NULL_RTX;
3041 /* Given that a function returns a value of mode MODE at the most
3042 significant end of hard register VALUE, shift VALUE left or right
3043 as specified by LEFT_P. Return true if some action was needed. */
3045 bool
3046 shift_return_value (machine_mode mode, bool left_p, rtx value)
3048 gcc_assert (REG_P (value) && HARD_REGISTER_P (value));
3049 machine_mode value_mode = GET_MODE (value);
3050 poly_int64 shift = GET_MODE_BITSIZE (value_mode) - GET_MODE_BITSIZE (mode);
3052 if (known_eq (shift, 0))
3053 return false;
3055 /* Use ashr rather than lshr for right shifts. This is for the benefit
3056 of the MIPS port, which requires SImode values to be sign-extended
3057 when stored in 64-bit registers. */
3058 if (!force_expand_binop (value_mode, left_p ? ashl_optab : ashr_optab,
3059 value, gen_int_shift_amount (value_mode, shift),
3060 value, 1, OPTAB_WIDEN))
3061 gcc_unreachable ();
3062 return true;
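/* Editorial note: for example, an SImode value returned at the most
   significant end of a 64-bit hard register gives a SHIFT of 32, so a
   single 32-bit shift moves it to or from the low half of the
   register.  */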
3065 /* If X is a likely-spilled register value, copy it to a pseudo
3066 register and return that register. Return X otherwise. */
3068 static rtx
3069 avoid_likely_spilled_reg (rtx x)
3071 rtx new_rtx;
3073 if (REG_P (x)
3074 && HARD_REGISTER_P (x)
3075 && targetm.class_likely_spilled_p (REGNO_REG_CLASS (REGNO (x))))
3077 /* Make sure that we generate a REG rather than a CONCAT.
3078 Moves into CONCATs can need nontrivial instructions,
3079 and the whole point of this function is to avoid
3080 using the hard register directly in such a situation. */
3081 generating_concat_p = 0;
3082 new_rtx = gen_reg_rtx (GET_MODE (x));
3083 generating_concat_p = 1;
3084 emit_move_insn (new_rtx, x);
3085 return new_rtx;
3087 return x;
3090 /* Helper function for expand_call.
3091 Return false if EXP is not implementable as a sibling call. */
3093 static bool
3094 can_implement_as_sibling_call_p (tree exp,
3095 rtx structure_value_addr,
3096 tree funtype,
3097 int reg_parm_stack_space ATTRIBUTE_UNUSED,
3098 tree fndecl,
3099 int flags,
3100 tree addr,
3101 const args_size &args_size)
3103 if (!targetm.have_sibcall_epilogue ())
3105 maybe_complain_about_tail_call
3106 (exp,
3107 "machine description does not have"
3108 " a sibcall_epilogue instruction pattern");
3109 return false;
3112 /* Doing sibling call optimization needs some work, since
3113 structure_value_addr can be allocated on the stack.
3114 It does not seem worth the effort since few optimizable
3115 sibling calls will return a structure. */
3116 if (structure_value_addr != NULL_RTX)
3118 maybe_complain_about_tail_call (exp, "callee returns a structure");
3119 return false;
3122 #ifdef REG_PARM_STACK_SPACE
3123 /* If outgoing reg parm stack space changes, we cannot do a sibcall. */
3124 if (OUTGOING_REG_PARM_STACK_SPACE (funtype)
3125 != OUTGOING_REG_PARM_STACK_SPACE (TREE_TYPE (current_function_decl))
3126 || (reg_parm_stack_space != REG_PARM_STACK_SPACE (current_function_decl)))
3128 maybe_complain_about_tail_call (exp,
3129 "inconsistent size of stack space"
3130 " allocated for arguments which are"
3131 " passed in registers");
3132 return false;
3134 #endif
3136 /* Check whether the target is able to optimize the call
3137 into a sibcall. */
3138 if (!targetm.function_ok_for_sibcall (fndecl, exp))
3140 maybe_complain_about_tail_call (exp,
3141 "target is not able to optimize the"
3142 " call into a sibling call");
3143 return false;
3146 /* Functions that do not return exactly once may not be sibcall
3147 optimized. */
3148 if (flags & ECF_RETURNS_TWICE)
3150 maybe_complain_about_tail_call (exp, "callee returns twice");
3151 return false;
3153 if (flags & ECF_NORETURN)
3155 maybe_complain_about_tail_call (exp, "callee does not return");
3156 return false;
3159 if (TYPE_VOLATILE (TREE_TYPE (TREE_TYPE (addr))))
3161 maybe_complain_about_tail_call (exp, "volatile function type");
3162 return false;
3165 /* If the called function is nested in the current one, it might access
3166 some of the caller's arguments, but could clobber them beforehand if
3167 the argument areas are shared. */
3168 if (fndecl && decl_function_context (fndecl) == current_function_decl)
3170 maybe_complain_about_tail_call (exp, "nested function");
3171 return false;
3174 /* If this function requires more stack slots than the current
3175 function, we cannot change it into a sibling call.
3176 crtl->args.pretend_args_size is not part of the
3177 stack allocated by our caller. */
3178 if (maybe_gt (args_size.constant,
3179 crtl->args.size - crtl->args.pretend_args_size))
3181 maybe_complain_about_tail_call (exp,
3182 "callee required more stack slots"
3183 " than the caller");
3184 return false;
3187 /* If the callee pops its own arguments, then it must pop exactly
3188 the same number of arguments as the current function. */
3189 if (maybe_ne (targetm.calls.return_pops_args (fndecl, funtype,
3190 args_size.constant),
3191 targetm.calls.return_pops_args (current_function_decl,
3192 TREE_TYPE
3193 (current_function_decl),
3194 crtl->args.size)))
3196 maybe_complain_about_tail_call (exp,
3197 "inconsistent number of"
3198 " popped arguments");
3199 return false;
3202 if (!lang_hooks.decls.ok_for_sibcall (fndecl))
3204 maybe_complain_about_tail_call (exp, "frontend does not support"
3205 " sibling call");
3206 return false;
3209 /* All checks passed. */
3210 return true;
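/* Editorial illustration (assumed user code): a call in tail position
   such as

     int caller (int x) { return callee (x + 1); }

   may be emitted as a jump to CALLEE when every check above passes.
   Any failed check instead forces a normal call and, if
   CALL_EXPR_MUST_TAIL_CALL is set on the call, reports the specific
   reason through maybe_complain_about_tail_call.  */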
3213 /* Generate all the code for a CALL_EXPR exp
3214 and return an rtx for its value.
3215 Store the value in TARGET (specified as an rtx) if convenient.
3216 If the value is stored in TARGET then TARGET is returned.
3217 If IGNORE is nonzero, then we ignore the value of the function call. */
3220 expand_call (tree exp, rtx target, int ignore)
3222 /* Nonzero if we are currently expanding a call. */
3223 static int currently_expanding_call = 0;
3225 /* RTX for the function to be called. */
3226 rtx funexp;
3227 /* Sequence of insns to perform a normal "call". */
3228 rtx_insn *normal_call_insns = NULL;
3229 /* Sequence of insns to perform a tail "call". */
3230 rtx_insn *tail_call_insns = NULL;
3231 /* Data type of the function. */
3232 tree funtype;
3233 tree type_arg_types;
3234 tree rettype;
3235 /* Declaration of the function being called,
3236 or 0 if the function is computed (not known by name). */
3237 tree fndecl = 0;
3238 /* The type of the function being called. */
3239 tree fntype;
3240 bool try_tail_call = CALL_EXPR_TAILCALL (exp);
3241 bool must_tail_call = CALL_EXPR_MUST_TAIL_CALL (exp);
3242 int pass;
3244 /* Register in which non-BLKmode value will be returned,
3245 or 0 if no value or if value is BLKmode. */
3246 rtx valreg;
3247 /* Address where we should return a BLKmode value;
3248 0 if value not BLKmode. */
3249 rtx structure_value_addr = 0;
3250 /* Nonzero if that address is being passed by treating it as
3251 an extra, implicit first parameter. Otherwise,
3252 it is passed by being copied directly into struct_value_rtx. */
3253 int structure_value_addr_parm = 0;
3254 /* Holds the value of implicit argument for the struct value. */
3255 tree structure_value_addr_value = NULL_TREE;
3256 /* Size of aggregate value wanted, or zero if none wanted
3257 or if we are using the non-reentrant PCC calling convention
3258 or expecting the value in registers. */
3259 poly_int64 struct_value_size = 0;
3260 /* Nonzero if called function returns an aggregate in memory PCC style,
3261 by returning the address of where to find it. */
3262 int pcc_struct_value = 0;
3263 rtx struct_value = 0;
3265 /* Number of actual parameters in this call, including struct value addr. */
3266 int num_actuals;
3267 /* Number of named args. Args after this are anonymous ones
3268 and they must all go on the stack. */
3269 int n_named_args;
3270 /* Number of complex actual arguments that need to be split. */
3271 int num_complex_actuals = 0;
3273 /* Vector of information about each argument.
3274 Arguments are numbered in the order they will be pushed,
3275 not the order they are written. */
3276 struct arg_data *args;
3278 /* Total size in bytes of all the stack-parms scanned so far. */
3279 struct args_size args_size;
3280 struct args_size adjusted_args_size;
3281 /* Size of arguments before any adjustments (such as rounding). */
3282 poly_int64 unadjusted_args_size;
3283 /* Data on reg parms scanned so far. */
3284 CUMULATIVE_ARGS args_so_far_v;
3285 cumulative_args_t args_so_far;
3286 /* Nonzero if a reg parm has been scanned. */
3287 int reg_parm_seen;
3288 /* Nonzero if this is an indirect function call. */
3290 /* Nonzero if we must avoid push-insns in the args for this call.
3291 If stack space is allocated for register parameters, but not by the
3292 caller, then it is preallocated in the fixed part of the stack frame.
3293 So the entire argument block must then be preallocated (i.e., we
3294 ignore PUSH_ROUNDING in that case). */
3296 int must_preallocate = !PUSH_ARGS;
3298 /* Size of the stack reserved for parameter registers. */
3299 int reg_parm_stack_space = 0;
3301 /* Address of space preallocated for stack parms
3302 (on machines that lack push insns), or 0 if space not preallocated. */
3303 rtx argblock = 0;
3305 /* Mask of ECF_ and ERF_ flags. */
3306 int flags = 0;
3307 int return_flags = 0;
3308 #ifdef REG_PARM_STACK_SPACE
3309 /* Define the boundary of the register parm stack space that needs to be
3310 saved, if any. */
3311 int low_to_save, high_to_save;
3312 rtx save_area = 0; /* Place that it is saved */
3313 #endif
3315 unsigned int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
3316 char *initial_stack_usage_map = stack_usage_map;
3317 unsigned HOST_WIDE_INT initial_stack_usage_watermark = stack_usage_watermark;
3318 char *stack_usage_map_buf = NULL;
3320 poly_int64 old_stack_allocated;
3322 /* State variables to track stack modifications. */
3323 rtx old_stack_level = 0;
3324 int old_stack_arg_under_construction = 0;
3325 poly_int64 old_pending_adj = 0;
3326 int old_inhibit_defer_pop = inhibit_defer_pop;
3328 /* Some stack pointer alterations we make are performed via
3329 allocate_dynamic_stack_space. This modifies the stack_pointer_delta,
3330 which we then also need to save/restore along the way. */
3331 poly_int64 old_stack_pointer_delta = 0;
3333 rtx call_fusage;
3334 tree addr = CALL_EXPR_FN (exp);
3335 int i;
3336 /* The alignment of the stack, in bits. */
3337 unsigned HOST_WIDE_INT preferred_stack_boundary;
3338 /* The alignment of the stack, in bytes. */
3339 unsigned HOST_WIDE_INT preferred_unit_stack_boundary;
3340 /* The static chain value to use for this call. */
3341 rtx static_chain_value;
3342 /* See if this is "nothrow" function call. */
3343 if (TREE_NOTHROW (exp))
3344 flags |= ECF_NOTHROW;
3346 /* See if we can find a DECL-node for the actual function, and get the
3347 function attributes (flags) from the function decl or type node. */
3348 fndecl = get_callee_fndecl (exp);
3349 if (fndecl)
3351 fntype = TREE_TYPE (fndecl);
3352 flags |= flags_from_decl_or_type (fndecl);
3353 return_flags |= decl_return_flags (fndecl);
3355 else
3357 fntype = TREE_TYPE (TREE_TYPE (addr));
3358 flags |= flags_from_decl_or_type (fntype);
3359 if (CALL_EXPR_BY_DESCRIPTOR (exp))
3360 flags |= ECF_BY_DESCRIPTOR;
3362 rettype = TREE_TYPE (exp);
3364 struct_value = targetm.calls.struct_value_rtx (fntype, 0);
3366 /* Warn if this value is an aggregate type,
3367 regardless of which calling convention we are using for it. */
3368 if (AGGREGATE_TYPE_P (rettype))
3369 warning (OPT_Waggregate_return, "function call has aggregate value");
3371 /* If the result of a non-looping pure or const function call is
3372 ignored (or void), and none of its arguments are volatile, we can
3373 avoid expanding the call and just evaluate the arguments for
3374 side-effects. */
3375 if ((flags & (ECF_CONST | ECF_PURE))
3376 && (!(flags & ECF_LOOPING_CONST_OR_PURE))
3377 && (ignore || target == const0_rtx
3378 || TYPE_MODE (rettype) == VOIDmode))
3380 bool volatilep = false;
3381 tree arg;
3382 call_expr_arg_iterator iter;
3384 FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
3385 if (TREE_THIS_VOLATILE (arg))
3387 volatilep = true;
3388 break;
3391 if (! volatilep)
3393 FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
3394 expand_expr (arg, const0_rtx, VOIDmode, EXPAND_NORMAL);
3395 return const0_rtx;
3399 #ifdef REG_PARM_STACK_SPACE
3400 reg_parm_stack_space = REG_PARM_STACK_SPACE (!fndecl ? fntype : fndecl);
3401 #endif
3403 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? fntype : TREE_TYPE (fndecl)))
3404 && reg_parm_stack_space > 0 && PUSH_ARGS)
3405 must_preallocate = 1;
3407 /* Set up a place to return a structure. */
3409 /* Cater to broken compilers. */
3410 if (aggregate_value_p (exp, fntype))
3412 /* This call returns a big structure. */
3413 flags &= ~(ECF_CONST | ECF_PURE | ECF_LOOPING_CONST_OR_PURE);
3415 #ifdef PCC_STATIC_STRUCT_RETURN
3417 pcc_struct_value = 1;
3419 #else /* not PCC_STATIC_STRUCT_RETURN */
3421 if (!poly_int_tree_p (TYPE_SIZE_UNIT (rettype), &struct_value_size))
3422 struct_value_size = -1;
3424 /* Even if it is semantically safe to use the target as the return
3425 slot, it may not be sufficiently aligned for the return type.
3426 if (CALL_EXPR_RETURN_SLOT_OPT (exp)
3427 && target
3428 && MEM_P (target)
3429 /* If rettype is addressable, we may not create a temporary.
3430 If target is properly aligned at runtime and the compiler
3431 just doesn't know about it, it will work fine, otherwise it
3432 will be UB. */
3433 && (TREE_ADDRESSABLE (rettype)
3434 || !(MEM_ALIGN (target) < TYPE_ALIGN (rettype)
3435 && targetm.slow_unaligned_access (TYPE_MODE (rettype),
3436 MEM_ALIGN (target)))))
3437 structure_value_addr = XEXP (target, 0);
3438 else
3440 /* For variable-sized objects, we must be called with a target
3441 specified. If we were to allocate space on the stack here,
3442 we would have no way of knowing when to free it. */
3443 rtx d = assign_temp (rettype, 1, 1);
3444 structure_value_addr = XEXP (d, 0);
3445 target = 0;
3448 #endif /* not PCC_STATIC_STRUCT_RETURN */
3451 /* Figure out the amount to which the stack should be aligned. */
3452 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
3453 if (fndecl)
3455 struct cgraph_rtl_info *i = cgraph_node::rtl_info (fndecl);
3456 /* Without automatic stack alignment, we can't increase preferred
3457 stack boundary. With automatic stack alignment, it is
3458 unnecessary since unless we can guarantee that all callers will
3459 align the outgoing stack properly, callee has to align its
3460 stack anyway. */
3461 if (i
3462 && i->preferred_incoming_stack_boundary
3463 && i->preferred_incoming_stack_boundary < preferred_stack_boundary)
3464 preferred_stack_boundary = i->preferred_incoming_stack_boundary;
3467 /* Operand 0 is a pointer-to-function; get the type of the function. */
3468 funtype = TREE_TYPE (addr);
3469 gcc_assert (POINTER_TYPE_P (funtype));
3470 funtype = TREE_TYPE (funtype);
3472 /* Count whether there are actual complex arguments that need to be split
3473 into their real and imaginary parts. Munge the type_arg_types
3474 appropriately here as well. */
3475 if (targetm.calls.split_complex_arg)
3477 call_expr_arg_iterator iter;
3478 tree arg;
3479 FOR_EACH_CALL_EXPR_ARG (arg, iter, exp)
3481 tree type = TREE_TYPE (arg);
3482 if (type && TREE_CODE (type) == COMPLEX_TYPE
3483 && targetm.calls.split_complex_arg (type))
3484 num_complex_actuals++;
3486 type_arg_types = split_complex_types (TYPE_ARG_TYPES (funtype));
3488 else
3489 type_arg_types = TYPE_ARG_TYPES (funtype);
3491 if (flags & ECF_MAY_BE_ALLOCA)
3492 cfun->calls_alloca = 1;
3494 /* If struct_value_rtx is 0, it means pass the address
3495 as if it were an extra parameter. Put the argument expression
3496 in structure_value_addr_value. */
3497 if (structure_value_addr && struct_value == 0)
3499 /* If structure_value_addr is a REG other than
3500 virtual_outgoing_args_rtx, we can always use it. If it
3501 is not a REG, we must always copy it into a register.
3502 If it is virtual_outgoing_args_rtx, we must copy it to another
3503 register in some cases. */
3504 rtx temp = (!REG_P (structure_value_addr)
3505 || (ACCUMULATE_OUTGOING_ARGS
3506 && stack_arg_under_construction
3507 && structure_value_addr == virtual_outgoing_args_rtx)
3508 ? copy_addr_to_reg (convert_memory_address
3509 (Pmode, structure_value_addr))
3510 : structure_value_addr);
3512 structure_value_addr_value =
3513 make_tree (build_pointer_type (TREE_TYPE (funtype)), temp);
3514 structure_value_addr_parm = 1;
3517 /* Count the arguments and set NUM_ACTUALS. */
3518 num_actuals =
3519 call_expr_nargs (exp) + num_complex_actuals + structure_value_addr_parm;
3521 /* Compute number of named args.
3522 First, do a raw count of the args for INIT_CUMULATIVE_ARGS. */
3524 if (type_arg_types != 0)
3525 n_named_args
3526 = (list_length (type_arg_types)
3527 /* Count the struct value address, if it is passed as a parm. */
3528 + structure_value_addr_parm);
3529 else
3530 /* If we know nothing, treat all args as named. */
3531 n_named_args = num_actuals;
3533 /* Start updating where the next arg would go.
3535 On some machines (such as the PA) indirect calls have a different
3536 calling convention than normal calls. The fourth argument in
3537 INIT_CUMULATIVE_ARGS tells the backend if this is an indirect call
3538 or not. */
3539 INIT_CUMULATIVE_ARGS (args_so_far_v, funtype, NULL_RTX, fndecl, n_named_args);
3540 args_so_far = pack_cumulative_args (&args_so_far_v);
3542 /* Now possibly adjust the number of named args.
3543 Normally, don't include the last named arg if anonymous args follow.
3544 We do include the last named arg if
3545 targetm.calls.strict_argument_naming() returns nonzero.
3546 (If no anonymous args follow, the result of list_length is actually
3547 one too large. This is harmless.)
3549 If targetm.calls.pretend_outgoing_varargs_named() returns
3550 nonzero, and targetm.calls.strict_argument_naming() returns zero,
3551 this machine will be able to place unnamed args that were passed
3552 in registers into the stack. So treat all args as named. This
3553 allows the insns emitting for a specific argument list to be
3554 independent of the function declaration.
3556 If targetm.calls.pretend_outgoing_varargs_named() returns zero,
3557 we do not have any reliable way to pass unnamed args in
3558 registers, so we must force them into memory. */
3560 if (type_arg_types != 0
3561 && targetm.calls.strict_argument_naming (args_so_far))
3563 else if (type_arg_types != 0
3564 && ! targetm.calls.pretend_outgoing_varargs_named (args_so_far))
3565 /* Don't include the last named arg. */
3566 --n_named_args;
3567 else
3568 /* Treat all args as named. */
3569 n_named_args = num_actuals;
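  /* Editor's note (illustrative sketch, not part of the original source):
     for a varargs callee such as

	 int printf (const char *fmt, ...);   printf ("%d\n", 42);

     list_length (type_arg_types) is 1, so n_named_args starts at 1.  If the
     target's strict_argument_naming hook returns nonzero, that count is
     kept; otherwise, if pretend_outgoing_varargs_named also returns zero,
     the last named arg is dropped (n_named_args becomes 0); otherwise all
     NUM_ACTUALS arguments (here 2) are treated as named.  */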
3571 /* Make a vector to hold all the information about each arg. */
3572 args = XCNEWVEC (struct arg_data, num_actuals);
3574 /* Build up entries in the ARGS array, compute the size of the
3575 arguments into ARGS_SIZE, etc. */
3576 initialize_argument_information (num_actuals, args, &args_size,
3577 n_named_args, exp,
3578 structure_value_addr_value, fndecl, fntype,
3579 args_so_far, reg_parm_stack_space,
3580 &old_stack_level, &old_pending_adj,
3581 &must_preallocate, &flags,
3582 &try_tail_call, CALL_FROM_THUNK_P (exp));
3584 if (args_size.var)
3585 must_preallocate = 1;
3587 /* Now make final decision about preallocating stack space. */
3588 must_preallocate = finalize_must_preallocate (must_preallocate,
3589 num_actuals, args,
3590 &args_size);
3592 /* If the structure value address will reference the stack pointer, we
3593 must stabilize it. We don't need to do this if we know that we are
3594 not going to adjust the stack pointer in processing this call. */
3596 if (structure_value_addr
3597 && (reg_mentioned_p (virtual_stack_dynamic_rtx, structure_value_addr)
3598 || reg_mentioned_p (virtual_outgoing_args_rtx,
3599 structure_value_addr))
3600 && (args_size.var
3601 || (!ACCUMULATE_OUTGOING_ARGS
3602 && maybe_ne (args_size.constant, 0))))
3603 structure_value_addr = copy_to_reg (structure_value_addr);
3605 /* Tail calls can make things harder to debug, and we've traditionally
3606 pushed these optimizations into -O2. Don't try if we're already
3607 expanding a call, as that means we're an argument. Don't try if
3608      there are cleanups, as we know there's code to follow the call.  */
3610 if (currently_expanding_call++ != 0
3611 || !flag_optimize_sibling_calls
3612 || args_size.var
3613 || dbg_cnt (tail_call) == false)
3614 try_tail_call = 0;
3616 /* If the user has marked the function as requiring tail-call
3617 optimization, attempt it. */
3618 if (must_tail_call)
3619 try_tail_call = 1;
3621   /* Check the remaining reasons why tail call optimization could fail.  */
3622 if (try_tail_call)
3623 try_tail_call = can_implement_as_sibling_call_p (exp,
3624 structure_value_addr,
3625 funtype,
3626 reg_parm_stack_space,
3627 fndecl,
3628 flags, addr, args_size);
3630 /* Check if caller and callee disagree in promotion of function
3631 return value. */
3632 if (try_tail_call)
3634 machine_mode caller_mode, caller_promoted_mode;
3635 machine_mode callee_mode, callee_promoted_mode;
3636 int caller_unsignedp, callee_unsignedp;
3637 tree caller_res = DECL_RESULT (current_function_decl);
3639 caller_unsignedp = TYPE_UNSIGNED (TREE_TYPE (caller_res));
3640 caller_mode = DECL_MODE (caller_res);
3641 callee_unsignedp = TYPE_UNSIGNED (TREE_TYPE (funtype));
3642 callee_mode = TYPE_MODE (TREE_TYPE (funtype));
3643 caller_promoted_mode
3644 = promote_function_mode (TREE_TYPE (caller_res), caller_mode,
3645 &caller_unsignedp,
3646 TREE_TYPE (current_function_decl), 1);
3647 callee_promoted_mode
3648 = promote_function_mode (TREE_TYPE (funtype), callee_mode,
3649 &callee_unsignedp,
3650 funtype, 1);
3651 if (caller_mode != VOIDmode
3652 && (caller_promoted_mode != callee_promoted_mode
3653 || ((caller_mode != caller_promoted_mode
3654 || callee_mode != callee_promoted_mode)
3655 && (caller_unsignedp != callee_unsignedp
3656 || partial_subreg_p (caller_mode, callee_mode)))))
3658 try_tail_call = 0;
3659 maybe_complain_about_tail_call (exp,
3660 "caller and callee disagree in"
3661 " promotion of function"
3662 " return value");
3666 /* Ensure current function's preferred stack boundary is at least
3667 what we need. Stack alignment may also increase preferred stack
3668 boundary. */
3669 if (crtl->preferred_stack_boundary < preferred_stack_boundary)
3670 crtl->preferred_stack_boundary = preferred_stack_boundary;
3671 else
3672 preferred_stack_boundary = crtl->preferred_stack_boundary;
3674 preferred_unit_stack_boundary = preferred_stack_boundary / BITS_PER_UNIT;
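  /* Editor's note (illustrative, not part of the original source): with a
     128-bit preferred stack boundary this is 128 / BITS_PER_UNIT = 16 bytes,
     the unit used below when rounding the argument block and checking
     stack alignment.  */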
3676 /* We want to make two insn chains; one for a sibling call, the other
3677 for a normal call. We will select one of the two chains after
3678 initial RTL generation is complete. */
3679 for (pass = try_tail_call ? 0 : 1; pass < 2; pass++)
3681 int sibcall_failure = 0;
3682 /* We want to emit any pending stack adjustments before the tail
3683 recursion "call". That way we know any adjustment after the tail
3684 recursion call can be ignored if we indeed use the tail
3685 call expansion. */
3686 saved_pending_stack_adjust save;
3687 rtx_insn *insns, *before_call, *after_args;
3688 rtx next_arg_reg;
3690 if (pass == 0)
3692 /* State variables we need to save and restore between
3693 iterations. */
3694 save_pending_stack_adjust (&save);
3696 if (pass)
3697 flags &= ~ECF_SIBCALL;
3698 else
3699 flags |= ECF_SIBCALL;
3701 /* Other state variables that we must reinitialize each time
3702 through the loop (that are not initialized by the loop itself). */
3703 argblock = 0;
3704 call_fusage = 0;
3706 /* Start a new sequence for the normal call case.
3708 From this point on, if the sibling call fails, we want to set
3709 sibcall_failure instead of continuing the loop. */
3710 start_sequence ();
3712 /* Don't let pending stack adjusts add up to too much.
3713 Also, do all pending adjustments now if there is any chance
3714 this might be a call to alloca or if we are expanding a sibling
3715 call sequence.
3716 Also do the adjustments before a throwing call, otherwise
3717 exception handling can fail; PR 19225. */
3718 if (maybe_ge (pending_stack_adjust, 32)
3719 || (maybe_ne (pending_stack_adjust, 0)
3720 && (flags & ECF_MAY_BE_ALLOCA))
3721 || (maybe_ne (pending_stack_adjust, 0)
3722 && flag_exceptions && !(flags & ECF_NOTHROW))
3723 || pass == 0)
3724 do_pending_stack_adjust ();
3726 /* Precompute any arguments as needed. */
3727 if (pass)
3728 precompute_arguments (num_actuals, args);
3730 /* Now we are about to start emitting insns that can be deleted
3731 if a libcall is deleted. */
3732 if (pass && (flags & ECF_MALLOC))
3733 start_sequence ();
3735 if (pass == 0
3736 && crtl->stack_protect_guard
3737 && targetm.stack_protect_runtime_enabled_p ())
3738 stack_protect_epilogue ();
3740 adjusted_args_size = args_size;
3741 /* Compute the actual size of the argument block required. The variable
3742 and constant sizes must be combined, the size may have to be rounded,
3743 and there may be a minimum required size. When generating a sibcall
3744 pattern, do not round up, since we'll be re-using whatever space our
3745 caller provided. */
3746 unadjusted_args_size
3747 = compute_argument_block_size (reg_parm_stack_space,
3748 &adjusted_args_size,
3749 fndecl, fntype,
3750 (pass == 0 ? 0
3751 : preferred_stack_boundary));
3753 old_stack_allocated = stack_pointer_delta - pending_stack_adjust;
3755 /* The argument block when performing a sibling call is the
3756 incoming argument block. */
3757 if (pass == 0)
3759 argblock = crtl->args.internal_arg_pointer;
3760 if (STACK_GROWS_DOWNWARD)
3761 argblock
3762 = plus_constant (Pmode, argblock, crtl->args.pretend_args_size);
3763 else
3764 argblock
3765 = plus_constant (Pmode, argblock, -crtl->args.pretend_args_size);
3767 HOST_WIDE_INT map_size = constant_lower_bound (args_size.constant);
3768 stored_args_map = sbitmap_alloc (map_size);
3769 bitmap_clear (stored_args_map);
3770 stored_args_watermark = HOST_WIDE_INT_M1U;
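	  /* Editor's note (descriptive, not part of the original source):
	     STORED_ARGS_MAP is a bitmap over bytes of the incoming argument
	     area.  As sibcall arguments are stored into that area, the bytes
	     they overwrite are recorded, and check_sibcall_argument_overlap
	     flags a sibcall failure if a later argument's value is read from
	     bytes that were already overwritten.  STORED_ARGS_WATERMARK
	     handles stores whose extent is not a compile-time constant:
	     everything at or above the watermark is conservatively treated
	     as clobbered.  */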
3773 /* If we have no actual push instructions, or shouldn't use them,
3774 make space for all args right now. */
3775 else if (adjusted_args_size.var != 0)
3777 if (old_stack_level == 0)
3779 emit_stack_save (SAVE_BLOCK, &old_stack_level);
3780 old_stack_pointer_delta = stack_pointer_delta;
3781 old_pending_adj = pending_stack_adjust;
3782 pending_stack_adjust = 0;
3783 /* stack_arg_under_construction says whether a stack arg is
3784 being constructed at the old stack level. Pushing the stack
3785 gets a clean outgoing argument block. */
3786 old_stack_arg_under_construction = stack_arg_under_construction;
3787 stack_arg_under_construction = 0;
3789 argblock = push_block (ARGS_SIZE_RTX (adjusted_args_size), 0, 0);
3790 if (flag_stack_usage_info)
3791 current_function_has_unbounded_dynamic_stack_size = 1;
3793 else
3795 /* Note that we must go through the motions of allocating an argument
3796 block even if the size is zero because we may be storing args
3797 in the area reserved for register arguments, which may be part of
3798 the stack frame. */
3800 poly_int64 needed = adjusted_args_size.constant;
3802 /* Store the maximum argument space used. It will be pushed by
3803 the prologue (if ACCUMULATE_OUTGOING_ARGS, or stack overflow
3804 checking). */
3806 crtl->outgoing_args_size = upper_bound (crtl->outgoing_args_size,
3807 needed);
3809 if (must_preallocate)
3811 if (ACCUMULATE_OUTGOING_ARGS)
3813 /* Since the stack pointer will never be pushed, it is
3814 possible for the evaluation of a parm to clobber
3815 something we have already written to the stack.
3816 Since most function calls on RISC machines do not use
3817 the stack, this is uncommon, but must work correctly.
3819 Therefore, we save any area of the stack that was already
3820 written and that we are using. Here we set up to do this
3821 by making a new stack usage map from the old one. The
3822 actual save will be done by store_one_arg.
3824 Another approach might be to try to reorder the argument
3825 evaluations to avoid this conflicting stack usage. */
3827 /* Since we will be writing into the entire argument area,
3828 the map must be allocated for its entire size, not just
3829 the part that is the responsibility of the caller. */
3830 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? fntype : TREE_TYPE (fndecl))))
3831 needed += reg_parm_stack_space;
3833 poly_int64 limit = needed;
3834 if (ARGS_GROW_DOWNWARD)
3835 limit += 1;
3837 /* For polynomial sizes, this is the maximum possible
3838 size needed for arguments with a constant size
3839 and offset. */
3840 HOST_WIDE_INT const_limit = constant_lower_bound (limit);
3841 highest_outgoing_arg_in_use
3842 = MAX (initial_highest_arg_in_use, const_limit);
3844 free (stack_usage_map_buf);
3845 stack_usage_map_buf = XNEWVEC (char, highest_outgoing_arg_in_use);
3846 stack_usage_map = stack_usage_map_buf;
3848 if (initial_highest_arg_in_use)
3849 memcpy (stack_usage_map, initial_stack_usage_map,
3850 initial_highest_arg_in_use);
3852 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
3853 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
3854 (highest_outgoing_arg_in_use
3855 - initial_highest_arg_in_use));
3856 needed = 0;
3858 /* The address of the outgoing argument list must not be
3859 copied to a register here, because argblock would be left
3860 pointing to the wrong place after the call to
3861 allocate_dynamic_stack_space below. */
3863 argblock = virtual_outgoing_args_rtx;
3865 else
3867 /* Try to reuse some or all of the pending_stack_adjust
3868 to get this space. */
3869 if (inhibit_defer_pop == 0
3870 && (combine_pending_stack_adjustment_and_call
3871 (&needed,
3872 unadjusted_args_size,
3873 &adjusted_args_size,
3874 preferred_unit_stack_boundary)))
3876 /* combine_pending_stack_adjustment_and_call computes
3877 an adjustment before the arguments are allocated.
3878 Account for them and see whether or not the stack
3879 needs to go up or down. */
3880 needed = unadjusted_args_size - needed;
3882 /* Checked by
3883 combine_pending_stack_adjustment_and_call. */
3884 gcc_checking_assert (ordered_p (needed, 0));
3885 if (maybe_lt (needed, 0))
3887 /* We're releasing stack space. */
3888 /* ??? We can avoid any adjustment at all if we're
3889 already aligned. FIXME. */
3890 pending_stack_adjust = -needed;
3891 do_pending_stack_adjust ();
3892 needed = 0;
3894 else
3895 /* We need to allocate space. We'll do that in
3896 push_block below. */
3897 pending_stack_adjust = 0;
3900 /* Special case this because overhead of `push_block' in
3901 this case is non-trivial. */
3902 if (known_eq (needed, 0))
3903 argblock = virtual_outgoing_args_rtx;
3904 else
3906 rtx needed_rtx = gen_int_mode (needed, Pmode);
3907 argblock = push_block (needed_rtx, 0, 0);
3908 if (ARGS_GROW_DOWNWARD)
3909 argblock = plus_constant (Pmode, argblock, needed);
3912 /* We only really need to call `copy_to_reg' in the case
3913 where push insns are going to be used to pass ARGBLOCK
3914 to a function call in ARGS. In that case, the stack
3915 pointer changes value from the allocation point to the
3916 call point, and hence the value of
3917 VIRTUAL_OUTGOING_ARGS_RTX changes as well. But might
3918 as well always do it. */
3919 argblock = copy_to_reg (argblock);
3924 if (ACCUMULATE_OUTGOING_ARGS)
3926 /* The save/restore code in store_one_arg handles all
3927 cases except one: a constructor call (including a C
3928 function returning a BLKmode struct) to initialize
3929 an argument. */
3930 if (stack_arg_under_construction)
3932 rtx push_size
3933 = (gen_int_mode
3934 (adjusted_args_size.constant
3935 + (OUTGOING_REG_PARM_STACK_SPACE (!fndecl ? fntype
3936 : TREE_TYPE (fndecl))
3937 ? 0 : reg_parm_stack_space), Pmode));
3938 if (old_stack_level == 0)
3940 emit_stack_save (SAVE_BLOCK, &old_stack_level);
3941 old_stack_pointer_delta = stack_pointer_delta;
3942 old_pending_adj = pending_stack_adjust;
3943 pending_stack_adjust = 0;
3944 /* stack_arg_under_construction says whether a stack
3945 arg is being constructed at the old stack level.
3946 Pushing the stack gets a clean outgoing argument
3947 block. */
3948 old_stack_arg_under_construction
3949 = stack_arg_under_construction;
3950 stack_arg_under_construction = 0;
3951 /* Make a new map for the new argument list. */
3952 free (stack_usage_map_buf);
3953 stack_usage_map_buf = XCNEWVEC (char, highest_outgoing_arg_in_use);
3954 stack_usage_map = stack_usage_map_buf;
3955 highest_outgoing_arg_in_use = 0;
3956 stack_usage_watermark = HOST_WIDE_INT_M1U;
3958 	      /* We can pass TRUE as the last argument because we just
3959 saved the stack pointer and will restore it right after
3960 the call. */
3961 allocate_dynamic_stack_space (push_size, 0, BIGGEST_ALIGNMENT,
3962 -1, true);
3965 /* If argument evaluation might modify the stack pointer,
3966 copy the address of the argument list to a register. */
3967 for (i = 0; i < num_actuals; i++)
3968 if (args[i].pass_on_stack)
3970 argblock = copy_addr_to_reg (argblock);
3971 break;
3975 compute_argument_addresses (args, argblock, num_actuals);
3977       /* The stack is properly aligned; pops can't safely be deferred during
3978 the evaluation of the arguments. */
3979 NO_DEFER_POP;
3981 /* Precompute all register parameters. It isn't safe to compute
3982 anything once we have started filling any specific hard regs.
3983 TLS symbols sometimes need a call to resolve. Precompute
3984 register parameters before any stack pointer manipulation
3985 to avoid unaligned stack in the called function. */
3986 precompute_register_parameters (num_actuals, args, &reg_parm_seen);
3988 OK_DEFER_POP;
3990 /* Perform stack alignment before the first push (the last arg). */
3991 if (argblock == 0
3992 && maybe_gt (adjusted_args_size.constant, reg_parm_stack_space)
3993 && maybe_ne (adjusted_args_size.constant, unadjusted_args_size))
3995 /* When the stack adjustment is pending, we get better code
3996 by combining the adjustments. */
3997 if (maybe_ne (pending_stack_adjust, 0)
3998 && ! inhibit_defer_pop
3999 && (combine_pending_stack_adjustment_and_call
4000 (&pending_stack_adjust,
4001 unadjusted_args_size,
4002 &adjusted_args_size,
4003 preferred_unit_stack_boundary)))
4004 do_pending_stack_adjust ();
4005 else if (argblock == 0)
4006 anti_adjust_stack (gen_int_mode (adjusted_args_size.constant
4007 - unadjusted_args_size,
4008 Pmode));
4010 /* Now that the stack is properly aligned, pops can't safely
4011 be deferred during the evaluation of the arguments. */
4012 NO_DEFER_POP;
4014 /* Record the maximum pushed stack space size. We need to delay
4015 doing it this far to take into account the optimization done
4016 by combine_pending_stack_adjustment_and_call. */
4017 if (flag_stack_usage_info
4018 && !ACCUMULATE_OUTGOING_ARGS
4019 && pass
4020 && adjusted_args_size.var == 0)
4022 poly_int64 pushed = (adjusted_args_size.constant
4023 + pending_stack_adjust);
4024 current_function_pushed_stack_size
4025 = upper_bound (current_function_pushed_stack_size, pushed);
4028 funexp = rtx_for_function_call (fndecl, addr);
4030 if (CALL_EXPR_STATIC_CHAIN (exp))
4031 static_chain_value = expand_normal (CALL_EXPR_STATIC_CHAIN (exp));
4032 else
4033 static_chain_value = 0;
4035 #ifdef REG_PARM_STACK_SPACE
4036 /* Save the fixed argument area if it's part of the caller's frame and
4037 is clobbered by argument setup for this call. */
4038 if (ACCUMULATE_OUTGOING_ARGS && pass)
4039 save_area = save_fixed_argument_area (reg_parm_stack_space, argblock,
4040 &low_to_save, &high_to_save);
4041 #endif
4043 /* Now store (and compute if necessary) all non-register parms.
4044 These come before register parms, since they can require block-moves,
4045 which could clobber the registers used for register parms.
4046 Parms which have partial registers are not stored here,
4047 but we do preallocate space here if they want that. */
4049 for (i = 0; i < num_actuals; i++)
4051 if (args[i].reg == 0 || args[i].pass_on_stack)
4053 rtx_insn *before_arg = get_last_insn ();
4055 /* We don't allow passing huge (> 2^30 B) arguments
4056 by value. It would cause an overflow later on. */
4057 if (constant_lower_bound (adjusted_args_size.constant)
4058 >= (1 << (HOST_BITS_PER_INT - 2)))
4060 sorry ("passing too large argument on stack");
4061 continue;
4064 if (store_one_arg (&args[i], argblock, flags,
4065 adjusted_args_size.var != 0,
4066 reg_parm_stack_space)
4067 || (pass == 0
4068 && check_sibcall_argument_overlap (before_arg,
4069 &args[i], 1)))
4070 sibcall_failure = 1;
4073 if (args[i].stack)
4074 call_fusage
4075 = gen_rtx_EXPR_LIST (TYPE_MODE (TREE_TYPE (args[i].tree_value)),
4076 gen_rtx_USE (VOIDmode, args[i].stack),
4077 call_fusage);
4080 /* If we have a parm that is passed in registers but not in memory
4081 and whose alignment does not permit a direct copy into registers,
4082 make a group of pseudos that correspond to each register that we
4083 will later fill. */
4084 if (STRICT_ALIGNMENT)
4085 store_unaligned_arguments_into_pseudos (args, num_actuals);
4087 /* Now store any partially-in-registers parm.
4088 This is the last place a block-move can happen. */
4089 if (reg_parm_seen)
4090 for (i = 0; i < num_actuals; i++)
4091 if (args[i].partial != 0 && ! args[i].pass_on_stack)
4093 rtx_insn *before_arg = get_last_insn ();
4095 /* On targets with weird calling conventions (e.g. PA) it's
4096 hard to ensure that all cases of argument overlap between
4097 stack and registers work. Play it safe and bail out. */
4098 if (ARGS_GROW_DOWNWARD && !STACK_GROWS_DOWNWARD)
4100 sibcall_failure = 1;
4101 break;
4104 if (store_one_arg (&args[i], argblock, flags,
4105 adjusted_args_size.var != 0,
4106 reg_parm_stack_space)
4107 || (pass == 0
4108 && check_sibcall_argument_overlap (before_arg,
4109 &args[i], 1)))
4110 sibcall_failure = 1;
4113 bool any_regs = false;
4114 for (i = 0; i < num_actuals; i++)
4115 if (args[i].reg != NULL_RTX)
4117 any_regs = true;
4118 targetm.calls.call_args (args[i].reg, funtype);
4120 if (!any_regs)
4121 targetm.calls.call_args (pc_rtx, funtype);
4123 /* Figure out the register where the value, if any, will come back. */
4124 valreg = 0;
4125 if (TYPE_MODE (rettype) != VOIDmode
4126 && ! structure_value_addr)
4128 if (pcc_struct_value)
4129 valreg = hard_function_value (build_pointer_type (rettype),
4130 fndecl, NULL, (pass == 0));
4131 else
4132 valreg = hard_function_value (rettype, fndecl, fntype,
4133 (pass == 0));
4135 /* If VALREG is a PARALLEL whose first member has a zero
4136 offset, use that. This is for targets such as m68k that
4137 return the same value in multiple places. */
4138 if (GET_CODE (valreg) == PARALLEL)
4140 rtx elem = XVECEXP (valreg, 0, 0);
4141 rtx where = XEXP (elem, 0);
4142 rtx offset = XEXP (elem, 1);
4143 if (offset == const0_rtx
4144 && GET_MODE (where) == GET_MODE (valreg))
4145 valreg = where;
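	  /* Editor's note (illustrative, not part of the original source):
	     on a target that returns the same pointer in both a data and an
	     address register, VALREG is a PARALLEL listing both copies; when
	     the first entry covers the whole value at offset 0 in the right
	     mode, using that register lets the rest of the return-value
	     handling treat VALREG as a plain REG.  */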
4149 /* If register arguments require space on the stack and stack space
4150 was not preallocated, allocate stack space here for arguments
4151 passed in registers. */
4152 if (OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? fntype : TREE_TYPE (fndecl)))
4153 && !ACCUMULATE_OUTGOING_ARGS
4154 && must_preallocate == 0 && reg_parm_stack_space > 0)
4155 anti_adjust_stack (GEN_INT (reg_parm_stack_space));
4157 /* Pass the function the address in which to return a
4158 structure value. */
4159 if (pass != 0 && structure_value_addr && ! structure_value_addr_parm)
4161 structure_value_addr
4162 = convert_memory_address (Pmode, structure_value_addr);
4163 emit_move_insn (struct_value,
4164 force_reg (Pmode,
4165 force_operand (structure_value_addr,
4166 NULL_RTX)));
4168 if (REG_P (struct_value))
4169 use_reg (&call_fusage, struct_value);
4172 after_args = get_last_insn ();
4173 funexp = prepare_call_address (fndecl ? fndecl : fntype, funexp,
4174 static_chain_value, &call_fusage,
4175 reg_parm_seen, flags);
4177 load_register_parameters (args, num_actuals, &call_fusage, flags,
4178 pass == 0, &sibcall_failure);
4180 /* Save a pointer to the last insn before the call, so that we can
4181 later safely search backwards to find the CALL_INSN. */
4182 before_call = get_last_insn ();
4184 /* Set up next argument register. For sibling calls on machines
4185 with register windows this should be the incoming register. */
4186 if (pass == 0)
4187 next_arg_reg = targetm.calls.function_incoming_arg (args_so_far,
4188 VOIDmode,
4189 void_type_node,
4190 true);
4191 else
4192 next_arg_reg = targetm.calls.function_arg (args_so_far,
4193 VOIDmode, void_type_node,
4194 true);
4196 if (pass == 1 && (return_flags & ERF_RETURNS_ARG))
4198 int arg_nr = return_flags & ERF_RETURN_ARG_MASK;
4199 arg_nr = num_actuals - arg_nr - 1;
4200 if (arg_nr >= 0
4201 && arg_nr < num_actuals
4202 && args[arg_nr].reg
4203 && valreg
4204 && REG_P (valreg)
4205 && GET_MODE (args[arg_nr].reg) == GET_MODE (valreg))
4206 call_fusage
4207 = gen_rtx_EXPR_LIST (TYPE_MODE (TREE_TYPE (args[arg_nr].tree_value)),
4208 gen_rtx_SET (valreg, args[arg_nr].reg),
4209 call_fusage);
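	  /* Editor's note (descriptive, not part of the original source):
	     ERF_RETURNS_ARG means the callee returns one of its arguments,
	     with the source-order index encoded in ERF_RETURN_ARG_MASK.
	     Since the ARGS array is built in reverse order, the index is
	     remapped via num_actuals - arg_nr - 1; if that argument sits in
	     a register of the same mode as VALREG, a (set valreg arg-reg)
	     note is added to CALL_FUSAGE so later RTL passes can see that
	     the returned value is a copy of that argument.  */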
4211 /* All arguments and registers used for the call must be set up by
4212 now! */
4214 /* Stack must be properly aligned now. */
4215 gcc_assert (!pass
4216 || multiple_p (stack_pointer_delta,
4217 preferred_unit_stack_boundary));
4219 /* Generate the actual call instruction. */
4220 emit_call_1 (funexp, exp, fndecl, funtype, unadjusted_args_size,
4221 adjusted_args_size.constant, struct_value_size,
4222 next_arg_reg, valreg, old_inhibit_defer_pop, call_fusage,
4223 flags, args_so_far);
4225 if (flag_ipa_ra)
4227 rtx_call_insn *last;
4228 rtx datum = NULL_RTX;
4229 if (fndecl != NULL_TREE)
4231 datum = XEXP (DECL_RTL (fndecl), 0);
4232 gcc_assert (datum != NULL_RTX
4233 && GET_CODE (datum) == SYMBOL_REF);
4235 last = last_call_insn ();
4236 add_reg_note (last, REG_CALL_DECL, datum);
4239 /* If the call setup or the call itself overlaps with anything
4240 of the argument setup we probably clobbered our call address.
4241 In that case we can't do sibcalls. */
4242 if (pass == 0
4243 && check_sibcall_argument_overlap (after_args, 0, 0))
4244 sibcall_failure = 1;
4246 /* If a non-BLKmode value is returned at the most significant end
4247 of a register, shift the register right by the appropriate amount
4248 and update VALREG accordingly. BLKmode values are handled by the
4249 group load/store machinery below. */
4250 if (!structure_value_addr
4251 && !pcc_struct_value
4252 && TYPE_MODE (rettype) != VOIDmode
4253 && TYPE_MODE (rettype) != BLKmode
4254 && REG_P (valreg)
4255 && targetm.calls.return_in_msb (rettype))
4257 if (shift_return_value (TYPE_MODE (rettype), false, valreg))
4258 sibcall_failure = 1;
4259 valreg = gen_rtx_REG (TYPE_MODE (rettype), REGNO (valreg));
4262 if (pass && (flags & ECF_MALLOC))
4264 rtx temp = gen_reg_rtx (GET_MODE (valreg));
4265 rtx_insn *last, *insns;
4267 /* The return value from a malloc-like function is a pointer. */
4268 if (TREE_CODE (rettype) == POINTER_TYPE)
4269 mark_reg_pointer (temp, MALLOC_ABI_ALIGNMENT);
4271 emit_move_insn (temp, valreg);
4273 	  /* The return value from a malloc-like function cannot alias
4274 anything else. */
4275 last = get_last_insn ();
4276 add_reg_note (last, REG_NOALIAS, temp);
4278 /* Write out the sequence. */
4279 insns = get_insns ();
4280 end_sequence ();
4281 emit_insn (insns);
4282 valreg = temp;
4285 /* For calls to `setjmp', etc., inform
4286 function.c:setjmp_warnings that it should complain if
4287 nonvolatile values are live. For functions that cannot
4288 return, inform flow that control does not fall through. */
4290 if ((flags & ECF_NORETURN) || pass == 0)
4292 /* The barrier must be emitted
4293 immediately after the CALL_INSN. Some ports emit more
4294 than just a CALL_INSN above, so we must search for it here. */
4296 rtx_insn *last = get_last_insn ();
4297 while (!CALL_P (last))
4299 last = PREV_INSN (last);
4300 /* There was no CALL_INSN? */
4301 gcc_assert (last != before_call);
4304 emit_barrier_after (last);
4306 /* Stack adjustments after a noreturn call are dead code.
4307 However when NO_DEFER_POP is in effect, we must preserve
4308 stack_pointer_delta. */
4309 if (inhibit_defer_pop == 0)
4311 stack_pointer_delta = old_stack_allocated;
4312 pending_stack_adjust = 0;
4316 /* If value type not void, return an rtx for the value. */
4318 if (TYPE_MODE (rettype) == VOIDmode
4319 || ignore)
4320 target = const0_rtx;
4321 else if (structure_value_addr)
4323 if (target == 0 || !MEM_P (target))
4325 target
4326 = gen_rtx_MEM (TYPE_MODE (rettype),
4327 memory_address (TYPE_MODE (rettype),
4328 structure_value_addr));
4329 set_mem_attributes (target, rettype, 1);
4332 else if (pcc_struct_value)
4334 /* This is the special C++ case where we need to
4335 know what the true target was. We take care to
4336 never use this value more than once in one expression. */
4337 target = gen_rtx_MEM (TYPE_MODE (rettype),
4338 copy_to_reg (valreg));
4339 set_mem_attributes (target, rettype, 1);
4341 /* Handle calls that return values in multiple non-contiguous locations.
4342 The Irix 6 ABI has examples of this. */
4343 else if (GET_CODE (valreg) == PARALLEL)
4345 if (target == 0)
4346 target = emit_group_move_into_temps (valreg);
4347 else if (rtx_equal_p (target, valreg))
4349 else if (GET_CODE (target) == PARALLEL)
4350 	    /* Handle the result of an emit_group_move_into_temps
4351 call in the previous pass. */
4352 emit_group_move (target, valreg);
4353 else
4354 emit_group_store (target, valreg, rettype,
4355 int_size_in_bytes (rettype));
4357 else if (target
4358 && GET_MODE (target) == TYPE_MODE (rettype)
4359 && GET_MODE (target) == GET_MODE (valreg))
4361 bool may_overlap = false;
4363 /* We have to copy a return value in a CLASS_LIKELY_SPILLED hard
4364 reg to a plain register. */
4365 if (!REG_P (target) || HARD_REGISTER_P (target))
4366 valreg = avoid_likely_spilled_reg (valreg);
4368 /* If TARGET is a MEM in the argument area, and we have
4369 saved part of the argument area, then we can't store
4370 directly into TARGET as it may get overwritten when we
4371 restore the argument save area below. Don't work too
4372 hard though and simply force TARGET to a register if it
4373 is a MEM; the optimizer is quite likely to sort it out. */
4374 if (ACCUMULATE_OUTGOING_ARGS && pass && MEM_P (target))
4375 for (i = 0; i < num_actuals; i++)
4376 if (args[i].save_area)
4378 may_overlap = true;
4379 break;
4382 if (may_overlap)
4383 target = copy_to_reg (valreg);
4384 else
4386 /* TARGET and VALREG cannot be equal at this point
4387 because the latter would not have
4388 REG_FUNCTION_VALUE_P true, while the former would if
4389 it were referring to the same register.
4391 If they refer to the same register, this move will be
4392 a no-op, except when function inlining is being
4393 done. */
4394 emit_move_insn (target, valreg);
4396 /* If we are setting a MEM, this code must be executed.
4397 Since it is emitted after the call insn, sibcall
4398 optimization cannot be performed in that case. */
4399 if (MEM_P (target))
4400 sibcall_failure = 1;
4403 else
4404 target = copy_to_reg (avoid_likely_spilled_reg (valreg));
4406 /* If we promoted this return value, make the proper SUBREG.
4407 TARGET might be const0_rtx here, so be careful. */
4408 if (REG_P (target)
4409 && TYPE_MODE (rettype) != BLKmode
4410 && GET_MODE (target) != TYPE_MODE (rettype))
4412 tree type = rettype;
4413 int unsignedp = TYPE_UNSIGNED (type);
4414 machine_mode pmode;
4416 /* Ensure we promote as expected, and get the new unsignedness. */
4417 pmode = promote_function_mode (type, TYPE_MODE (type), &unsignedp,
4418 funtype, 1);
4419 gcc_assert (GET_MODE (target) == pmode);
4421 poly_uint64 offset = subreg_lowpart_offset (TYPE_MODE (type),
4422 GET_MODE (target));
4423 target = gen_rtx_SUBREG (TYPE_MODE (type), target, offset);
4424 SUBREG_PROMOTED_VAR_P (target) = 1;
4425 SUBREG_PROMOTED_SET (target, unsignedp);
4428 /* If size of args is variable or this was a constructor call for a stack
4429 argument, restore saved stack-pointer value. */
4431 if (old_stack_level)
4433 rtx_insn *prev = get_last_insn ();
4435 emit_stack_restore (SAVE_BLOCK, old_stack_level);
4436 stack_pointer_delta = old_stack_pointer_delta;
4438 fixup_args_size_notes (prev, get_last_insn (), stack_pointer_delta);
4440 pending_stack_adjust = old_pending_adj;
4441 old_stack_allocated = stack_pointer_delta - pending_stack_adjust;
4442 stack_arg_under_construction = old_stack_arg_under_construction;
4443 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
4444 stack_usage_map = initial_stack_usage_map;
4445 stack_usage_watermark = initial_stack_usage_watermark;
4446 sibcall_failure = 1;
4448 else if (ACCUMULATE_OUTGOING_ARGS && pass)
4450 #ifdef REG_PARM_STACK_SPACE
4451 if (save_area)
4452 restore_fixed_argument_area (save_area, argblock,
4453 high_to_save, low_to_save);
4454 #endif
4456 /* If we saved any argument areas, restore them. */
4457 for (i = 0; i < num_actuals; i++)
4458 if (args[i].save_area)
4460 machine_mode save_mode = GET_MODE (args[i].save_area);
4461 rtx stack_area
4462 = gen_rtx_MEM (save_mode,
4463 memory_address (save_mode,
4464 XEXP (args[i].stack_slot, 0)));
4466 if (save_mode != BLKmode)
4467 emit_move_insn (stack_area, args[i].save_area);
4468 else
4469 emit_block_move (stack_area, args[i].save_area,
4470 (gen_int_mode
4471 (args[i].locate.size.constant, Pmode)),
4472 BLOCK_OP_CALL_PARM);
4475 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
4476 stack_usage_map = initial_stack_usage_map;
4477 stack_usage_watermark = initial_stack_usage_watermark;
4480 /* If this was alloca, record the new stack level. */
4481 if (flags & ECF_MAY_BE_ALLOCA)
4482 record_new_stack_level ();
4484 /* Free up storage we no longer need. */
4485 for (i = 0; i < num_actuals; ++i)
4486 free (args[i].aligned_regs);
4488 targetm.calls.end_call_args ();
4490 insns = get_insns ();
4491 end_sequence ();
4493 if (pass == 0)
4495 tail_call_insns = insns;
4497 /* Restore the pending stack adjustment now that we have
4498 finished generating the sibling call sequence. */
4500 restore_pending_stack_adjust (&save);
4502 /* Prepare arg structure for next iteration. */
4503 for (i = 0; i < num_actuals; i++)
4505 args[i].value = 0;
4506 args[i].aligned_regs = 0;
4507 args[i].stack = 0;
4510 sbitmap_free (stored_args_map);
4511 internal_arg_pointer_exp_state.scan_start = NULL;
4512 internal_arg_pointer_exp_state.cache.release ();
4514 else
4516 normal_call_insns = insns;
4518 /* Verify that we've deallocated all the stack we used. */
4519 gcc_assert ((flags & ECF_NORETURN)
4520 || known_eq (old_stack_allocated,
4521 stack_pointer_delta
4522 - pending_stack_adjust));
4525 /* If something prevents making this a sibling call,
4526 zero out the sequence. */
4527 if (sibcall_failure)
4528 tail_call_insns = NULL;
4529 else
4530 break;
4533 /* If tail call production succeeded, we need to remove REG_EQUIV notes on
4534      arguments too, as the argument area is now clobbered by the call.  */
4535 if (tail_call_insns)
4537 emit_insn (tail_call_insns);
4538 crtl->tail_call_emit = true;
4540 else
4542 emit_insn (normal_call_insns);
4543 if (try_tail_call)
4544 /* Ideally we'd emit a message for all of the ways that it could
4545 have failed. */
4546 maybe_complain_about_tail_call (exp, "tail call production failed");
4549 currently_expanding_call--;
4551 free (stack_usage_map_buf);
4552 free (args);
4553 return target;
4556 /* A sibling call sequence invalidates any REG_EQUIV notes made for
4557 this function's incoming arguments.
4559 At the start of RTL generation we know the only REG_EQUIV notes
4560 in the rtl chain are those for incoming arguments, so we can look
4561 for REG_EQUIV notes between the start of the function and the
4562 NOTE_INSN_FUNCTION_BEG.
4564 This is (slight) overkill. We could keep track of the highest
4565 argument we clobber and be more selective in removing notes, but it
4566 does not seem to be worth the effort. */
4568 void
4569 fixup_tail_calls (void)
4571 rtx_insn *insn;
4573 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
4575 rtx note;
4577 /* There are never REG_EQUIV notes for the incoming arguments
4578 after the NOTE_INSN_FUNCTION_BEG note, so stop if we see it. */
4579 if (NOTE_P (insn)
4580 && NOTE_KIND (insn) == NOTE_INSN_FUNCTION_BEG)
4581 break;
4583 note = find_reg_note (insn, REG_EQUIV, 0);
4584 if (note)
4585 remove_note (insn, note);
4586 note = find_reg_note (insn, REG_EQUIV, 0);
4587 gcc_assert (!note);
4591 /* Traverse a list of TYPES and expand all complex types into their
4592 components. */
4593 static tree
4594 split_complex_types (tree types)
4596 tree p;
4598 /* Before allocating memory, check for the common case of no complex. */
4599 for (p = types; p; p = TREE_CHAIN (p))
4601 tree type = TREE_VALUE (p);
4602 if (TREE_CODE (type) == COMPLEX_TYPE
4603 && targetm.calls.split_complex_arg (type))
4604 goto found;
4606 return types;
4608 found:
4609 types = copy_list (types);
4611 for (p = types; p; p = TREE_CHAIN (p))
4613 tree complex_type = TREE_VALUE (p);
4615 if (TREE_CODE (complex_type) == COMPLEX_TYPE
4616 && targetm.calls.split_complex_arg (complex_type))
4618 tree next, imag;
4620 /* Rewrite complex type with component type. */
4621 TREE_VALUE (p) = TREE_TYPE (complex_type);
4622 next = TREE_CHAIN (p);
4624 /* Add another component type for the imaginary part. */
4625 imag = build_tree_list (NULL_TREE, TREE_VALUE (p));
4626 TREE_CHAIN (p) = imag;
4627 TREE_CHAIN (imag) = next;
4629 /* Skip the newly created node. */
4630 p = TREE_CHAIN (p);
4634 return types;
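/* Editor's note (illustrative sketch, not part of the original source):
   given a target whose split_complex_arg hook accepts COMPLEX_TYPEs, a type
   list such as (complex float, char *) is rewritten by the function above
   into (float, float, char *): the complex entry is overwritten with its
   component type and a new node for the imaginary part is spliced in
   immediately after it.  */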
4637 /* Output a library call to function ORGFUN (a SYMBOL_REF rtx)
4638 for a value of mode OUTMODE,
4639 with NARGS different arguments, passed as ARGS.
4640 Store the return value if RETVAL is nonzero: store it in VALUE if
4641 VALUE is nonnull, otherwise pick a convenient location. In either
4642 case return the location of the stored value.
4644 FN_TYPE should be LCT_NORMAL for `normal' calls, LCT_CONST for
4645 `const' calls, LCT_PURE for `pure' calls, or another LCT_ value for
4646 other types of library calls. */
4649 emit_library_call_value_1 (int retval, rtx orgfun, rtx value,
4650 enum libcall_type fn_type,
4651 machine_mode outmode, int nargs, rtx_mode_t *args)
4653 /* Total size in bytes of all the stack-parms scanned so far. */
4654 struct args_size args_size;
4655 /* Size of arguments before any adjustments (such as rounding). */
4656 struct args_size original_args_size;
4657 int argnum;
4658 rtx fun;
4659   /* TODO: choose the correct decl type of orgfun.  Sadly this information
4660      isn't present here, so we default to the native calling ABI.  */
4661 tree fndecl ATTRIBUTE_UNUSED = NULL_TREE; /* library calls default to host calling abi ? */
4662 tree fntype ATTRIBUTE_UNUSED = NULL_TREE; /* library calls default to host calling abi ? */
4663 int count;
4664 rtx argblock = 0;
4665 CUMULATIVE_ARGS args_so_far_v;
4666 cumulative_args_t args_so_far;
4667 struct arg
4669 rtx value;
4670 machine_mode mode;
4671 rtx reg;
4672 int partial;
4673 struct locate_and_pad_arg_data locate;
4674 rtx save_area;
4676 struct arg *argvec;
4677 int old_inhibit_defer_pop = inhibit_defer_pop;
4678 rtx call_fusage = 0;
4679 rtx mem_value = 0;
4680 rtx valreg;
4681 int pcc_struct_value = 0;
4682 poly_int64 struct_value_size = 0;
4683 int flags;
4684 int reg_parm_stack_space = 0;
4685 poly_int64 needed;
4686 rtx_insn *before_call;
4687 bool have_push_fusage;
4688 tree tfom; /* type_for_mode (outmode, 0) */
4690 #ifdef REG_PARM_STACK_SPACE
4691 /* Define the boundary of the register parm stack space that needs to be
4692      saved, if any.  */
4693 int low_to_save = 0, high_to_save = 0;
4694 rtx save_area = 0; /* Place that it is saved. */
4695 #endif
4697   /* Initial outgoing-args stack usage, saved so it can be restored after the call.  */
4698 unsigned int initial_highest_arg_in_use = highest_outgoing_arg_in_use;
4699 char *initial_stack_usage_map = stack_usage_map;
4700 unsigned HOST_WIDE_INT initial_stack_usage_watermark = stack_usage_watermark;
4701 char *stack_usage_map_buf = NULL;
4703 rtx struct_value = targetm.calls.struct_value_rtx (0, 0);
4705 #ifdef REG_PARM_STACK_SPACE
4706 reg_parm_stack_space = REG_PARM_STACK_SPACE ((tree) 0);
4707 #endif
4709 /* By default, library functions cannot throw. */
4710 flags = ECF_NOTHROW;
4712 switch (fn_type)
4714 case LCT_NORMAL:
4715 break;
4716 case LCT_CONST:
4717 flags |= ECF_CONST;
4718 break;
4719 case LCT_PURE:
4720 flags |= ECF_PURE;
4721 break;
4722 case LCT_NORETURN:
4723 flags |= ECF_NORETURN;
4724 break;
4725 case LCT_THROW:
4726 flags &= ~ECF_NOTHROW;
4727 break;
4728 case LCT_RETURNS_TWICE:
4729 flags = ECF_RETURNS_TWICE;
4730 break;
4732 fun = orgfun;
4734 /* Ensure current function's preferred stack boundary is at least
4735 what we need. */
4736 if (crtl->preferred_stack_boundary < PREFERRED_STACK_BOUNDARY)
4737 crtl->preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
4739 /* If this kind of value comes back in memory,
4740 decide where in memory it should come back. */
4741 if (outmode != VOIDmode)
4743 tfom = lang_hooks.types.type_for_mode (outmode, 0);
4744 if (aggregate_value_p (tfom, 0))
4746 #ifdef PCC_STATIC_STRUCT_RETURN
4747 rtx pointer_reg
4748 = hard_function_value (build_pointer_type (tfom), 0, 0, 0);
4749 mem_value = gen_rtx_MEM (outmode, pointer_reg);
4750 pcc_struct_value = 1;
4751 if (value == 0)
4752 value = gen_reg_rtx (outmode);
4753 #else /* not PCC_STATIC_STRUCT_RETURN */
4754 struct_value_size = GET_MODE_SIZE (outmode);
4755 if (value != 0 && MEM_P (value))
4756 mem_value = value;
4757 else
4758 mem_value = assign_temp (tfom, 1, 1);
4759 #endif
4760 /* This call returns a big structure. */
4761 flags &= ~(ECF_CONST | ECF_PURE | ECF_LOOPING_CONST_OR_PURE);
4764 else
4765 tfom = void_type_node;
4767 /* ??? Unfinished: must pass the memory address as an argument. */
4769 /* Copy all the libcall-arguments out of the varargs data
4770 and into a vector ARGVEC.
4772 Compute how to pass each argument. We only support a very small subset
4773 of the full argument passing conventions to limit complexity here since
4774 library functions shouldn't have many args. */
4776 argvec = XALLOCAVEC (struct arg, nargs + 1);
4777 memset (argvec, 0, (nargs + 1) * sizeof (struct arg));
4779 #ifdef INIT_CUMULATIVE_LIBCALL_ARGS
4780 INIT_CUMULATIVE_LIBCALL_ARGS (args_so_far_v, outmode, fun);
4781 #else
4782 INIT_CUMULATIVE_ARGS (args_so_far_v, NULL_TREE, fun, 0, nargs);
4783 #endif
4784 args_so_far = pack_cumulative_args (&args_so_far_v);
4786 args_size.constant = 0;
4787 args_size.var = 0;
4789 count = 0;
4791 push_temp_slots ();
4793 /* If there's a structure value address to be passed,
4794 either pass it in the special place, or pass it as an extra argument. */
4795 if (mem_value && struct_value == 0 && ! pcc_struct_value)
4797 rtx addr = XEXP (mem_value, 0);
4799 nargs++;
4801 /* Make sure it is a reasonable operand for a move or push insn. */
4802 if (!REG_P (addr) && !MEM_P (addr)
4803 && !(CONSTANT_P (addr)
4804 && targetm.legitimate_constant_p (Pmode, addr)))
4805 addr = force_operand (addr, NULL_RTX);
4807 argvec[count].value = addr;
4808 argvec[count].mode = Pmode;
4809 argvec[count].partial = 0;
4811 argvec[count].reg = targetm.calls.function_arg (args_so_far,
4812 Pmode, NULL_TREE, true);
4813 gcc_assert (targetm.calls.arg_partial_bytes (args_so_far, Pmode,
4814 NULL_TREE, 1) == 0);
4816 locate_and_pad_parm (Pmode, NULL_TREE,
4817 #ifdef STACK_PARMS_IN_REG_PARM_AREA
4819 #else
4820 argvec[count].reg != 0,
4821 #endif
4822 reg_parm_stack_space, 0,
4823 NULL_TREE, &args_size, &argvec[count].locate);
4825 if (argvec[count].reg == 0 || argvec[count].partial != 0
4826 || reg_parm_stack_space > 0)
4827 args_size.constant += argvec[count].locate.size.constant;
4829 targetm.calls.function_arg_advance (args_so_far, Pmode, (tree) 0, true);
4831 count++;
4834 for (unsigned int i = 0; count < nargs; i++, count++)
4836 rtx val = args[i].first;
4837 machine_mode mode = args[i].second;
4838 int unsigned_p = 0;
4840 /* We cannot convert the arg value to the mode the library wants here;
4841 must do it earlier where we know the signedness of the arg. */
4842 gcc_assert (mode != BLKmode
4843 && (GET_MODE (val) == mode || GET_MODE (val) == VOIDmode));
4845 /* Make sure it is a reasonable operand for a move or push insn. */
4846 if (!REG_P (val) && !MEM_P (val)
4847 && !(CONSTANT_P (val) && targetm.legitimate_constant_p (mode, val)))
4848 val = force_operand (val, NULL_RTX);
4850 if (pass_by_reference (&args_so_far_v, mode, NULL_TREE, 1))
4852 rtx slot;
4853 int must_copy
4854 = !reference_callee_copied (&args_so_far_v, mode, NULL_TREE, 1);
4856 /* If this was a CONST function, it is now PURE since it now
4857 reads memory. */
4858 if (flags & ECF_CONST)
4860 flags &= ~ECF_CONST;
4861 flags |= ECF_PURE;
4864 if (MEM_P (val) && !must_copy)
4866 tree val_expr = MEM_EXPR (val);
4867 if (val_expr)
4868 mark_addressable (val_expr);
4869 slot = val;
4871 else
4873 slot = assign_temp (lang_hooks.types.type_for_mode (mode, 0),
4874 1, 1);
4875 emit_move_insn (slot, val);
4878 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
4879 gen_rtx_USE (VOIDmode, slot),
4880 call_fusage);
4881 if (must_copy)
4882 call_fusage = gen_rtx_EXPR_LIST (VOIDmode,
4883 gen_rtx_CLOBBER (VOIDmode,
4884 slot),
4885 call_fusage);
4887 mode = Pmode;
4888 val = force_operand (XEXP (slot, 0), NULL_RTX);
4891 mode = promote_function_mode (NULL_TREE, mode, &unsigned_p, NULL_TREE, 0);
4892 argvec[count].mode = mode;
4893 argvec[count].value = convert_modes (mode, GET_MODE (val), val, unsigned_p);
4894 argvec[count].reg = targetm.calls.function_arg (args_so_far, mode,
4895 NULL_TREE, true);
4897 argvec[count].partial
4898 = targetm.calls.arg_partial_bytes (args_so_far, mode, NULL_TREE, 1);
4900 if (argvec[count].reg == 0
4901 || argvec[count].partial != 0
4902 || reg_parm_stack_space > 0)
4904 locate_and_pad_parm (mode, NULL_TREE,
4905 #ifdef STACK_PARMS_IN_REG_PARM_AREA
4907 #else
4908 argvec[count].reg != 0,
4909 #endif
4910 reg_parm_stack_space, argvec[count].partial,
4911 NULL_TREE, &args_size, &argvec[count].locate);
4912 args_size.constant += argvec[count].locate.size.constant;
4913 gcc_assert (!argvec[count].locate.size.var);
4915 #ifdef BLOCK_REG_PADDING
4916 else
4917 /* The argument is passed entirely in registers. See at which
4918 end it should be padded. */
4919 argvec[count].locate.where_pad =
4920 BLOCK_REG_PADDING (mode, NULL_TREE,
4921 known_le (GET_MODE_SIZE (mode), UNITS_PER_WORD));
4922 #endif
4924 targetm.calls.function_arg_advance (args_so_far, mode, (tree) 0, true);
4927 /* If this machine requires an external definition for library
4928 functions, write one out. */
4929 assemble_external_libcall (fun);
4931 original_args_size = args_size;
4932 args_size.constant = (aligned_upper_bound (args_size.constant
4933 + stack_pointer_delta,
4934 STACK_BYTES)
4935 - stack_pointer_delta);
4937 args_size.constant = upper_bound (args_size.constant,
4938 reg_parm_stack_space);
4940 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? fntype : TREE_TYPE (fndecl))))
4941 args_size.constant -= reg_parm_stack_space;
4943 crtl->outgoing_args_size = upper_bound (crtl->outgoing_args_size,
4944 args_size.constant);
4946 if (flag_stack_usage_info && !ACCUMULATE_OUTGOING_ARGS)
4948 poly_int64 pushed = args_size.constant + pending_stack_adjust;
4949 current_function_pushed_stack_size
4950 = upper_bound (current_function_pushed_stack_size, pushed);
4953 if (ACCUMULATE_OUTGOING_ARGS)
4955 /* Since the stack pointer will never be pushed, it is possible for
4956 the evaluation of a parm to clobber something we have already
4957 written to the stack. Since most function calls on RISC machines
4958 do not use the stack, this is uncommon, but must work correctly.
4960 Therefore, we save any area of the stack that was already written
4961 and that we are using. Here we set up to do this by making a new
4962 stack usage map from the old one.
4964 Another approach might be to try to reorder the argument
4965 evaluations to avoid this conflicting stack usage. */
4967 needed = args_size.constant;
4969 /* Since we will be writing into the entire argument area, the
4970 map must be allocated for its entire size, not just the part that
4971 is the responsibility of the caller. */
4972 if (! OUTGOING_REG_PARM_STACK_SPACE ((!fndecl ? fntype : TREE_TYPE (fndecl))))
4973 needed += reg_parm_stack_space;
4975 poly_int64 limit = needed;
4976 if (ARGS_GROW_DOWNWARD)
4977 limit += 1;
4979 /* For polynomial sizes, this is the maximum possible size needed
4980 for arguments with a constant size and offset. */
4981 HOST_WIDE_INT const_limit = constant_lower_bound (limit);
4982 highest_outgoing_arg_in_use = MAX (initial_highest_arg_in_use,
4983 const_limit);
4985 stack_usage_map_buf = XNEWVEC (char, highest_outgoing_arg_in_use);
4986 stack_usage_map = stack_usage_map_buf;
4988 if (initial_highest_arg_in_use)
4989 memcpy (stack_usage_map, initial_stack_usage_map,
4990 initial_highest_arg_in_use);
4992 if (initial_highest_arg_in_use != highest_outgoing_arg_in_use)
4993 memset (&stack_usage_map[initial_highest_arg_in_use], 0,
4994 highest_outgoing_arg_in_use - initial_highest_arg_in_use);
4995 needed = 0;
4997 /* We must be careful to use virtual regs before they're instantiated,
4998 and real regs afterwards. Loop optimization, for example, can create
4999 new libcalls after we've instantiated the virtual regs, and if we
5000 use virtuals anyway, they won't match the rtl patterns. */
5002 if (virtuals_instantiated)
5003 argblock = plus_constant (Pmode, stack_pointer_rtx,
5004 STACK_POINTER_OFFSET);
5005 else
5006 argblock = virtual_outgoing_args_rtx;
5008 else
5010 if (!PUSH_ARGS)
5011 argblock = push_block (gen_int_mode (args_size.constant, Pmode), 0, 0);
5014   /* We push args individually in reverse order; perform stack alignment
5015 before the first push (the last arg). */
5016 if (argblock == 0)
5017 anti_adjust_stack (gen_int_mode (args_size.constant
5018 - original_args_size.constant,
5019 Pmode));
5021 argnum = nargs - 1;
5023 #ifdef REG_PARM_STACK_SPACE
5024 if (ACCUMULATE_OUTGOING_ARGS)
5026 /* The argument list is the property of the called routine and it
5027 may clobber it. If the fixed area has been used for previous
5028 parameters, we must save and restore it. */
5029 save_area = save_fixed_argument_area (reg_parm_stack_space, argblock,
5030 &low_to_save, &high_to_save);
5032 #endif
5034 /* When expanding a normal call, args are stored in push order,
5035 which is the reverse of what we have here. */
5036 bool any_regs = false;
5037 for (int i = nargs; i-- > 0; )
5038 if (argvec[i].reg != NULL_RTX)
5040 targetm.calls.call_args (argvec[i].reg, NULL_TREE);
5041 any_regs = true;
5043 if (!any_regs)
5044 targetm.calls.call_args (pc_rtx, NULL_TREE);
5046 /* Push the args that need to be pushed. */
5048 have_push_fusage = false;
5050 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
5051 are to be pushed. */
5052 for (count = 0; count < nargs; count++, argnum--)
5054 machine_mode mode = argvec[argnum].mode;
5055 rtx val = argvec[argnum].value;
5056 rtx reg = argvec[argnum].reg;
5057 int partial = argvec[argnum].partial;
5058 unsigned int parm_align = argvec[argnum].locate.boundary;
5059 poly_int64 lower_bound = 0, upper_bound = 0;
5061 if (! (reg != 0 && partial == 0))
5063 rtx use;
5065 if (ACCUMULATE_OUTGOING_ARGS)
5067 /* If this is being stored into a pre-allocated, fixed-size,
5068 stack area, save any previous data at that location. */
5070 if (ARGS_GROW_DOWNWARD)
5072 /* stack_slot is negative, but we want to index stack_usage_map
5073 with positive values. */
5074 upper_bound = -argvec[argnum].locate.slot_offset.constant + 1;
5075 lower_bound = upper_bound - argvec[argnum].locate.size.constant;
5077 else
5079 lower_bound = argvec[argnum].locate.slot_offset.constant;
5080 upper_bound = lower_bound + argvec[argnum].locate.size.constant;
5083 if (stack_region_maybe_used_p (lower_bound, upper_bound,
5084 reg_parm_stack_space))
5086 /* We need to make a save area. */
5087 poly_uint64 size
5088 = argvec[argnum].locate.size.constant * BITS_PER_UNIT;
5089 machine_mode save_mode
5090 = int_mode_for_size (size, 1).else_blk ();
5091 rtx adr
5092 = plus_constant (Pmode, argblock,
5093 argvec[argnum].locate.offset.constant);
5094 rtx stack_area
5095 = gen_rtx_MEM (save_mode, memory_address (save_mode, adr));
5097 if (save_mode == BLKmode)
5099 argvec[argnum].save_area
5100 = assign_stack_temp (BLKmode,
5101 argvec[argnum].locate.size.constant
5104 emit_block_move (validize_mem
5105 (copy_rtx (argvec[argnum].save_area)),
5106 stack_area,
5107 (gen_int_mode
5108 (argvec[argnum].locate.size.constant,
5109 Pmode)),
5110 BLOCK_OP_CALL_PARM);
5112 else
5114 argvec[argnum].save_area = gen_reg_rtx (save_mode);
5116 emit_move_insn (argvec[argnum].save_area, stack_area);
5121 emit_push_insn (val, mode, NULL_TREE, NULL_RTX, parm_align,
5122 partial, reg, 0, argblock,
5123 (gen_int_mode
5124 (argvec[argnum].locate.offset.constant, Pmode)),
5125 reg_parm_stack_space,
5126 ARGS_SIZE_RTX (argvec[argnum].locate.alignment_pad), false);
5128 /* Now mark the segment we just used. */
5129 if (ACCUMULATE_OUTGOING_ARGS)
5130 mark_stack_region_used (lower_bound, upper_bound);
5132 NO_DEFER_POP;
5134 /* Indicate argument access so that alias.c knows that these
5135 values are live. */
5136 if (argblock)
5137 use = plus_constant (Pmode, argblock,
5138 argvec[argnum].locate.offset.constant);
5139 else if (have_push_fusage)
5140 continue;
5141 else
5143 /* When arguments are pushed, trying to tell alias.c where
5144 exactly this argument is won't work, because the
5145 auto-increment causes confusion. So we merely indicate
5146 that we access something with a known mode somewhere on
5147 the stack. */
5148 use = gen_rtx_PLUS (Pmode, stack_pointer_rtx,
5149 gen_rtx_SCRATCH (Pmode));
5150 have_push_fusage = true;
5152 use = gen_rtx_MEM (argvec[argnum].mode, use);
5153 use = gen_rtx_USE (VOIDmode, use);
5154 call_fusage = gen_rtx_EXPR_LIST (VOIDmode, use, call_fusage);
5158 argnum = nargs - 1;
5160 fun = prepare_call_address (NULL, fun, NULL, &call_fusage, 0, 0);
5162 /* Now load any reg parms into their regs. */
5164 /* ARGNUM indexes the ARGVEC array in the order in which the arguments
5165 are to be pushed. */
5166 for (count = 0; count < nargs; count++, argnum--)
5168 machine_mode mode = argvec[argnum].mode;
5169 rtx val = argvec[argnum].value;
5170 rtx reg = argvec[argnum].reg;
5171 int partial = argvec[argnum].partial;
5173 /* Handle calls that pass values in multiple non-contiguous
5174 locations. The PA64 has examples of this for library calls. */
5175 if (reg != 0 && GET_CODE (reg) == PARALLEL)
5176 emit_group_load (reg, val, NULL_TREE, GET_MODE_SIZE (mode));
5177 else if (reg != 0 && partial == 0)
5179 emit_move_insn (reg, val);
5180 #ifdef BLOCK_REG_PADDING
5181 poly_int64 size = GET_MODE_SIZE (argvec[argnum].mode);
5183 /* Copied from load_register_parameters. */
5185 /* Handle case where we have a value that needs shifting
5186 up to the msb. eg. a QImode value and we're padding
5187 upward on a BYTES_BIG_ENDIAN machine. */
5188 if (known_lt (size, UNITS_PER_WORD)
5189 && (argvec[argnum].locate.where_pad
5190 == (BYTES_BIG_ENDIAN ? PAD_UPWARD : PAD_DOWNWARD)))
5192 rtx x;
5193 poly_int64 shift = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
5195 /* Assigning REG here rather than a temp makes CALL_FUSAGE
5196 report the whole reg as used. Strictly speaking, the
5197 call only uses SIZE bytes at the msb end, but it doesn't
5198 seem worth generating rtl to say that. */
5199 reg = gen_rtx_REG (word_mode, REGNO (reg));
5200 x = expand_shift (LSHIFT_EXPR, word_mode, reg, shift, reg, 1);
5201 if (x != reg)
5202 emit_move_insn (reg, x);
5204 #endif
5207 NO_DEFER_POP;
5210 /* Any regs containing parms remain in use through the call. */
5211 for (count = 0; count < nargs; count++)
5213 rtx reg = argvec[count].reg;
5214 if (reg != 0 && GET_CODE (reg) == PARALLEL)
5215 use_group_regs (&call_fusage, reg);
5216 else if (reg != 0)
5218 int partial = argvec[count].partial;
5219 if (partial)
5221 int nregs;
5222 gcc_assert (partial % UNITS_PER_WORD == 0);
5223 nregs = partial / UNITS_PER_WORD;
5224 use_regs (&call_fusage, REGNO (reg), nregs);
5226 else
5227 use_reg (&call_fusage, reg);
5231 /* Pass the function the address in which to return a structure value. */
5232 if (mem_value != 0 && struct_value != 0 && ! pcc_struct_value)
5234 emit_move_insn (struct_value,
5235 force_reg (Pmode,
5236 force_operand (XEXP (mem_value, 0),
5237 NULL_RTX)));
5238 if (REG_P (struct_value))
5239 use_reg (&call_fusage, struct_value);
5242 /* Don't allow popping to be deferred, since then
5243 cse'ing of library calls could delete a call and leave the pop. */
5244 NO_DEFER_POP;
5245 valreg = (mem_value == 0 && outmode != VOIDmode
5246 ? hard_libcall_value (outmode, orgfun) : NULL_RTX);
5248 /* Stack must be properly aligned now. */
5249 gcc_assert (multiple_p (stack_pointer_delta,
5250 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT));
5252 before_call = get_last_insn ();
5254 /* We pass the old value of inhibit_defer_pop + 1 to emit_call_1, which
5255 will set inhibit_defer_pop to that value. */
5256 /* The return type is needed to decide how many bytes the function pops.
5257 Signedness plays no role in that, so for simplicity, we pretend it's
5258 always signed. We also assume that the list of arguments passed has
5259 no impact, so we pretend it is unknown. */
5261 emit_call_1 (fun, NULL,
5262 get_identifier (XSTR (orgfun, 0)),
5263 build_function_type (tfom, NULL_TREE),
5264 original_args_size.constant, args_size.constant,
5265 struct_value_size,
5266 targetm.calls.function_arg (args_so_far,
5267 VOIDmode, void_type_node, true),
5268 valreg,
5269 old_inhibit_defer_pop + 1, call_fusage, flags, args_so_far);
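/* Record the callee symbol on the call insn so that -fipa-ra can use the
   callee's actual register usage at this call site.  */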
5271 if (flag_ipa_ra)
5273 rtx datum = orgfun;
5274 gcc_assert (GET_CODE (datum) == SYMBOL_REF);
5275 rtx_call_insn *last = last_call_insn ();
5276 add_reg_note (last, REG_CALL_DECL, datum);
5279 /* Right-shift returned value if necessary. */
5280 if (!pcc_struct_value
5281 && TYPE_MODE (tfom) != BLKmode
5282 && targetm.calls.return_in_msb (tfom))
5284 shift_return_value (TYPE_MODE (tfom), false, valreg);
5285 valreg = gen_rtx_REG (TYPE_MODE (tfom), REGNO (valreg));
5288 targetm.calls.end_call_args ();
5290 /* For calls to `setjmp', etc., inform function.c:setjmp_warnings
5291 that it should complain if nonvolatile values are live. For
5292 functions that cannot return, inform flow that control does not
5293 fall through. */
5294 if (flags & ECF_NORETURN)
5296 /* The barrier note must be emitted
5297 immediately after the CALL_INSN. Some ports emit more than
5298 just a CALL_INSN above, so we must search for it here. */
5299 rtx_insn *last = get_last_insn ();
5300 while (!CALL_P (last))
5302 last = PREV_INSN (last);
5303 /* There was no CALL_INSN? */
5304 gcc_assert (last != before_call);
5307 emit_barrier_after (last);
5310 /* Consider that "regular" libcalls, i.e. all of them except for LCT_THROW
5311 and LCT_RETURNS_TWICE, cannot perform non-local gotos. */
5312 if (flags & ECF_NOTHROW)
5314 rtx_insn *last = get_last_insn ();
5315 while (!CALL_P (last))
5317 last = PREV_INSN (last);
5318 /* There was no CALL_INSN? */
5319 gcc_assert (last != before_call);
5322 make_reg_eh_region_note_nothrow_nononlocal (last);
5325 /* Now restore inhibit_defer_pop to its actual original value. */
5326 OK_DEFER_POP;
5328 pop_temp_slots ();
5330 /* Copy the value to the right place. */
5331 if (outmode != VOIDmode && retval)
5333 if (mem_value)
5335 if (value == 0)
5336 value = mem_value;
5337 if (value != mem_value)
5338 emit_move_insn (value, mem_value);
5340 else if (GET_CODE (valreg) == PARALLEL)
5342 if (value == 0)
5343 value = gen_reg_rtx (outmode);
5344 emit_group_store (value, valreg, NULL_TREE, GET_MODE_SIZE (outmode));
5346 else
5348 /* Convert to the proper mode if a promotion has been active. */
5349 if (GET_MODE (valreg) != outmode)
5351 int unsignedp = TYPE_UNSIGNED (tfom);
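/* The only mode difference we expect here is a return-value promotion,
   so assert that and then narrow the value back to OUTMODE.  */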
5353 gcc_assert (promote_function_mode (tfom, outmode, &unsignedp,
5354 fndecl ? TREE_TYPE (fndecl) : fntype, 1)
5355 == GET_MODE (valreg));
5356 valreg = convert_modes (outmode, GET_MODE (valreg), valreg, 0);
5359 if (value != 0)
5360 emit_move_insn (value, valreg);
5361 else
5362 value = valreg;
5366 if (ACCUMULATE_OUTGOING_ARGS)
5368 #ifdef REG_PARM_STACK_SPACE
5369 if (save_area)
5370 restore_fixed_argument_area (save_area, argblock,
5371 high_to_save, low_to_save);
5372 #endif
5374 /* If we saved any argument areas, restore them. */
5375 for (count = 0; count < nargs; count++)
5376 if (argvec[count].save_area)
5378 machine_mode save_mode = GET_MODE (argvec[count].save_area);
5379 rtx adr = plus_constant (Pmode, argblock,
5380 argvec[count].locate.offset.constant);
5381 rtx stack_area = gen_rtx_MEM (save_mode,
5382 memory_address (save_mode, adr));
5384 if (save_mode == BLKmode)
5385 emit_block_move (stack_area,
5386 validize_mem
5387 (copy_rtx (argvec[count].save_area)),
5388 (gen_int_mode
5389 (argvec[count].locate.size.constant, Pmode)),
5390 BLOCK_OP_CALL_PARM);
5391 else
5392 emit_move_insn (stack_area, argvec[count].save_area);
5395 highest_outgoing_arg_in_use = initial_highest_arg_in_use;
5396 stack_usage_map = initial_stack_usage_map;
5397 stack_usage_watermark = initial_stack_usage_watermark;
5400 free (stack_usage_map_buf);
5402 return value;
5407 /* Store a single argument for a function call
5408 into the register or memory area where it must be passed.
5409 *ARG describes the argument value and where to pass it.
5411 ARGBLOCK is the address of the stack-block for all the arguments,
5412 or 0 on a machine where arguments are pushed individually.
5414 MAY_BE_ALLOCA nonzero says this could be a call to `alloca',
5415 so we must be careful about how the stack is used.
5417 VARIABLE_SIZE nonzero says that this argument occupies a variable-sized
5418 area of the outgoing argument stack. Under ACCUMULATE_OUTGOING_ARGS this
5419 indicates that we need not worry about saving and restoring the stack.
5421 FNDECL is the declaration of the function we are calling.
5423 Return nonzero if this arg should cause sibcall failure,
5424 zero otherwise. */
5426 static int
5427 store_one_arg (struct arg_data *arg, rtx argblock, int flags,
5428 int variable_size ATTRIBUTE_UNUSED, int reg_parm_stack_space)
5430 tree pval = arg->tree_value;
5431 rtx reg = 0;
5432 int partial = 0;
5433 poly_int64 used = 0;
5434 poly_int64 lower_bound = 0, upper_bound = 0;
5435 int sibcall_failure = 0;
5437 if (TREE_CODE (pval) == ERROR_MARK)
5438 return 1;
5440 /* Push a new temporary level for any temporaries we make for
5441 this argument. */
5442 push_temp_slots ();
5444 if (ACCUMULATE_OUTGOING_ARGS && !(flags & ECF_SIBCALL))
5446 /* If this is being stored into a pre-allocated, fixed-size, stack area,
5447 save any previous data at that location. */
5448 if (argblock && ! variable_size && arg->stack)
5450 if (ARGS_GROW_DOWNWARD)
5452 /* stack_slot is negative, but we want to index stack_usage_map
5453 with positive values. */
5454 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
5456 rtx offset = XEXP (XEXP (arg->stack_slot, 0), 1);
5457 upper_bound = -rtx_to_poly_int64 (offset) + 1;
5459 else
5460 upper_bound = 0;
5462 lower_bound = upper_bound - arg->locate.size.constant;
5464 else
5466 if (GET_CODE (XEXP (arg->stack_slot, 0)) == PLUS)
5468 rtx offset = XEXP (XEXP (arg->stack_slot, 0), 1);
5469 lower_bound = rtx_to_poly_int64 (offset);
5471 else
5472 lower_bound = 0;
5474 upper_bound = lower_bound + arg->locate.size.constant;
5477 if (stack_region_maybe_used_p (lower_bound, upper_bound,
5478 reg_parm_stack_space))
5480 /* We need to make a save area. */
5481 poly_uint64 size = arg->locate.size.constant * BITS_PER_UNIT;
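/* Prefer an integer mode covering the whole area so that the save and
   restore are single moves; if none exists, fall back to BLKmode and
   use a block copy instead.  */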
5482 machine_mode save_mode
5483 = int_mode_for_size (size, 1).else_blk ();
5484 rtx adr = memory_address (save_mode, XEXP (arg->stack_slot, 0));
5485 rtx stack_area = gen_rtx_MEM (save_mode, adr);
5487 if (save_mode == BLKmode)
5489 arg->save_area
5490 = assign_temp (TREE_TYPE (arg->tree_value), 1, 1);
5491 preserve_temp_slots (arg->save_area);
5492 emit_block_move (validize_mem (copy_rtx (arg->save_area)),
5493 stack_area,
5494 (gen_int_mode
5495 (arg->locate.size.constant, Pmode)),
5496 BLOCK_OP_CALL_PARM);
5498 else
5500 arg->save_area = gen_reg_rtx (save_mode);
5501 emit_move_insn (arg->save_area, stack_area);
5507 /* If this isn't going to be placed on both the stack and in registers,
5508 set up the register and number of words. */
5509 if (! arg->pass_on_stack)
5511 if (flags & ECF_SIBCALL)
5512 reg = arg->tail_call_reg;
5513 else
5514 reg = arg->reg;
5515 partial = arg->partial;
5518 /* Being passed entirely in a register. We shouldn't be called in
5519 this case. */
5520 gcc_assert (reg == 0 || partial != 0);
5522 /* If this arg needs special alignment, don't load the registers
5523 here. */
5524 if (arg->n_aligned_regs != 0)
5525 reg = 0;
5527 /* If this is being passed partially in a register, we can't evaluate
5528 it directly into its stack slot. Otherwise, we can. */
5529 if (arg->value == 0)
5531 /* stack_arg_under_construction is nonzero if a function argument is
5532 being evaluated directly into the outgoing argument list and
5533 expand_call must take special action to preserve the argument list
5534 if it is called recursively.
5536 For scalar function arguments stack_usage_map is sufficient to
5537 determine which stack slots must be saved and restored. Scalar
5538 arguments in general have pass_on_stack == 0.
5540 If this argument is initialized by a function which takes the
5541 address of the argument (a C++ constructor or a C function
5542 returning a BLKmode structure), then stack_usage_map is
5543 insufficient and expand_call must push the stack around the
5544 function call. Such arguments have pass_on_stack == 1.
5546 Note that it is always safe to set stack_arg_under_construction,
5547 but this generates suboptimal code if set when not needed. */
5549 if (arg->pass_on_stack)
5550 stack_arg_under_construction++;
5552 arg->value = expand_expr (pval,
5553 (partial
5554 || TYPE_MODE (TREE_TYPE (pval)) != arg->mode)
5555 ? NULL_RTX : arg->stack,
5556 VOIDmode, EXPAND_STACK_PARM);
5558 /* If we are promoting the object, or if for any other reason the mode
5559 doesn't agree, convert it to the mode we expect. */
5561 if (arg->mode != TYPE_MODE (TREE_TYPE (pval)))
5562 arg->value = convert_modes (arg->mode, TYPE_MODE (TREE_TYPE (pval)),
5563 arg->value, arg->unsignedp);
5565 if (arg->pass_on_stack)
5566 stack_arg_under_construction--;
5569 /* Check for overlap with already clobbered argument area. */
5570 if ((flags & ECF_SIBCALL)
5571 && MEM_P (arg->value)
5572 && mem_might_overlap_already_clobbered_arg_p (XEXP (arg->value, 0),
5573 arg->locate.size.constant))
5574 sibcall_failure = 1;
5576 /* Don't allow anything left on stack from computation
5577 of argument to alloca. */
5578 if (flags & ECF_MAY_BE_ALLOCA)
5579 do_pending_stack_adjust ();
5581 if (arg->value == arg->stack)
5582 /* If the value is already in the stack slot, we are done. */
5584 else if (arg->mode != BLKmode)
5586 unsigned int parm_align;
5588 /* Argument is a scalar, not entirely passed in registers.
5589 (If part is passed in registers, arg->partial says how much
5590 and emit_push_insn will take care of putting it there.)
5592 Push it, and if its size is less than the
5593 amount of space allocated to it,
5594 also bump stack pointer by the additional space.
5595 Note that in C the default argument promotions
5596 will prevent such mismatches. */
5598 poly_int64 size = (TYPE_EMPTY_P (TREE_TYPE (pval))
5599 ? 0 : GET_MODE_SIZE (arg->mode));
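/* TYPE_EMPTY_P types are empty records that the ABI passes without
   allocating any argument space, so there is nothing to push for them.  */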
5601 /* Compute how much space the push instruction will push.
5602 On many machines, pushing a byte will advance the stack
5603 pointer by a halfword. */
5604 #ifdef PUSH_ROUNDING
5605 size = PUSH_ROUNDING (size);
5606 #endif
5607 used = size;
5609 /* Compute how much space the argument should get:
5610 round up to a multiple of the alignment for arguments. */
5611 if (targetm.calls.function_arg_padding (arg->mode, TREE_TYPE (pval))
5612 != PAD_NONE)
5613 /* At the moment we don't (need to) support ABIs for which the
5614 padding isn't known at compile time. In principle it should
5615 be easy to add though. */
5616 used = force_align_up (size, PARM_BOUNDARY / BITS_PER_UNIT);
5618 /* Compute the alignment of the pushed argument. */
5619 parm_align = arg->locate.boundary;
5620 if (targetm.calls.function_arg_padding (arg->mode, TREE_TYPE (pval))
5621 == PAD_DOWNWARD)
5623 poly_int64 pad = used - size;
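/* With downward padding the value starts PAD bytes into its slot, so its
   effective alignment on the stack is limited by the alignment of PAD.  */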
5624 unsigned int pad_align = known_alignment (pad) * BITS_PER_UNIT;
5625 if (pad_align != 0)
5626 parm_align = MIN (parm_align, pad_align);
5629 /* This isn't already where we want it on the stack, so put it there.
5630 This can either be done with push or copy insns. */
5631 if (maybe_ne (used, 0)
5632 && !emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval),
5633 NULL_RTX, parm_align, partial, reg, used - size,
5634 argblock, ARGS_SIZE_RTX (arg->locate.offset),
5635 reg_parm_stack_space,
5636 ARGS_SIZE_RTX (arg->locate.alignment_pad), true))
5637 sibcall_failure = 1;
5639 /* Unless this is a partially-in-register argument, the argument is now
5640 in the stack. */
5641 if (partial == 0)
5642 arg->value = arg->stack;
5644 else
5646 /* BLKmode, at least partly to be pushed. */
5648 unsigned int parm_align;
5649 poly_int64 excess;
5650 rtx size_rtx;
5652 /* Pushing a nonscalar.
5653 If part is passed in registers, PARTIAL says how much
5654 and emit_push_insn will take care of putting it there. */
5656 /* Round its size up to a multiple
5657 of the allocation unit for arguments. */
5659 if (arg->locate.size.var != 0)
5661 excess = 0;
5662 size_rtx = ARGS_SIZE_RTX (arg->locate.size);
5664 else
5666 /* PUSH_ROUNDING has no effect on us, because emit_push_insn
5667 for BLKmode is careful to avoid it. */
5668 excess = (arg->locate.size.constant
5669 - arg_int_size_in_bytes (TREE_TYPE (pval))
5670 + partial);
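/* EXCESS becomes the EXTRA argument of emit_push_insn below: the number
   of padding bytes to leave next to the value beyond its own size.  */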
5671 size_rtx = expand_expr (arg_size_in_bytes (TREE_TYPE (pval)),
5672 NULL_RTX, TYPE_MODE (sizetype),
5673 EXPAND_NORMAL);
5676 parm_align = arg->locate.boundary;
5678 /* When an argument is padded down, the block is aligned to
5679 PARM_BOUNDARY, but the actual argument isn't. */
5680 if (targetm.calls.function_arg_padding (arg->mode, TREE_TYPE (pval))
5681 == PAD_DOWNWARD)
5683 if (arg->locate.size.var)
5684 parm_align = BITS_PER_UNIT;
5685 else
5687 unsigned int excess_align
5688 = known_alignment (excess) * BITS_PER_UNIT;
5689 if (excess_align != 0)
5690 parm_align = MIN (parm_align, excess_align);
5694 if ((flags & ECF_SIBCALL) && MEM_P (arg->value))
5696 /* emit_push_insn might not work properly if arg->value and
5697 argblock + arg->locate.offset areas overlap. */
5698 rtx x = arg->value;
5699 poly_int64 i = 0;
5701 if (strip_offset (XEXP (x, 0), &i)
5702 == crtl->args.internal_arg_pointer)
5704 /* arg.locate doesn't contain the pretend_args_size offset,
5705 it's part of argblock. Ensure we don't count it in I. */
5706 if (STACK_GROWS_DOWNWARD)
5707 i -= crtl->args.pretend_args_size;
5708 else
5709 i += crtl->args.pretend_args_size;
5711 /* expand_call should ensure this. */
5712 gcc_assert (!arg->locate.offset.var
5713 && arg->locate.size.var == 0);
5714 poly_int64 size_val = rtx_to_poly_int64 (size_rtx);
5716 if (known_eq (arg->locate.offset.constant, i))
5718 /* Even though they appear to be at the same location,
5719 if part of the outgoing argument is in registers,
5720 they aren't really at the same location. Check for
5721 this by making sure that the incoming size is the
5722 same as the outgoing size. */
5723 if (maybe_ne (arg->locate.size.constant, size_val))
5724 sibcall_failure = 1;
5726 else if (maybe_in_range_p (arg->locate.offset.constant,
5727 i, size_val))
5728 sibcall_failure = 1;
5729 /* Use arg->locate.size.constant instead of size_rtx
5730 because we only care about the part of the argument
5731 on the stack. */
5732 else if (maybe_in_range_p (i, arg->locate.offset.constant,
5733 arg->locate.size.constant))
5734 sibcall_failure = 1;
5738 if (!CONST_INT_P (size_rtx) || INTVAL (size_rtx) != 0)
5739 emit_push_insn (arg->value, arg->mode, TREE_TYPE (pval), size_rtx,
5740 parm_align, partial, reg, excess, argblock,
5741 ARGS_SIZE_RTX (arg->locate.offset),
5742 reg_parm_stack_space,
5743 ARGS_SIZE_RTX (arg->locate.alignment_pad), false);
5745 /* Unless this is a partially-in-register argument, the argument is now
5746 in the stack.
5748 ??? Unlike the case above, in which we want the actual
5749 address of the data, so that we can load it directly into a
5750 register, here we want the address of the stack slot, so that
5751 it's properly aligned for word-by-word copying or something
5752 like that. It's not clear that this is always correct. */
5753 if (partial == 0)
5754 arg->value = arg->stack_slot;
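/* If the ABI scatters this argument across non-contiguous registers, load
   the pieces into temporaries now; they are moved into the real registers
   by load_register_parameters just before the call.  */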
5757 if (arg->reg && GET_CODE (arg->reg) == PARALLEL)
5759 tree type = TREE_TYPE (arg->tree_value);
5760 arg->parallel_value
5761 = emit_group_load_into_temps (arg->reg, arg->value, type,
5762 int_size_in_bytes (type));
5765 /* Mark all slots this store used. */
5766 if (ACCUMULATE_OUTGOING_ARGS && !(flags & ECF_SIBCALL)
5767 && argblock && ! variable_size && arg->stack)
5768 mark_stack_region_used (lower_bound, upper_bound);
5770 /* Once we have pushed something, pops can't safely
5771 be deferred during the rest of the arguments. */
5772 NO_DEFER_POP;
5774 /* Free any temporary slots made in processing this argument. */
5775 pop_temp_slots ();
5777 return sibcall_failure;
5780 /* Nonzero if we do not know how to pass TYPE solely in registers. */
5782 bool
5783 must_pass_in_stack_var_size (machine_mode mode ATTRIBUTE_UNUSED,
5784                              const_tree type)
5785 {
5786   if (!type)
5787     return false;
5788
5789   /* If the type has variable size...  */
5790   if (TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
5791     return true;
5792
5793   /* If the type is marked as addressable (it is required
5794      to be constructed into the stack)...  */
5795   if (TREE_ADDRESSABLE (type))
5796     return true;
5797
5798   return false;
5799 }
5801 /* Another version of the TARGET_MUST_PASS_IN_STACK hook. This one
5802 takes trailing padding of a structure into account. */
5803 /* ??? Should be able to merge these two by examining BLOCK_REG_PADDING. */
5805 bool
5806 must_pass_in_stack_var_size_or_pad (machine_mode mode, const_tree type)
5807 {
5808   if (!type)
5809     return false;
5810
5811   /* If the type has variable size...  */
5812   if (TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST)
5813     return true;
5814
5815   /* If the type is marked as addressable (it is required
5816      to be constructed into the stack)...  */
5817   if (TREE_ADDRESSABLE (type))
5818     return true;
5819
5820   if (TYPE_EMPTY_P (type))
5821     return false;
5822
5823   /* If the padding and mode of the type are such that a copy into
5824      a register would put it into the wrong part of the register.  */
5825   if (mode == BLKmode
5826       && int_size_in_bytes (type) % (PARM_BOUNDARY / BITS_PER_UNIT)
5827       && (targetm.calls.function_arg_padding (mode, type)
5828           == (BYTES_BIG_ENDIAN ? PAD_UPWARD : PAD_DOWNWARD)))
5829     return true;
5830
5831   return false;
5832 }
5834 /* Tell the garbage collector about GTY markers in this source file. */
5835 #include "gt-calls.h"