hppa: Fix pr110279-1.c on hppa
[official-gcc.git] / gcc / cfgexpand.cc
blobec887ef918f24f21c10704efba0eaf973499f019
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2023 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "tree-inline.h"
65 #include "value-prof.h"
66 #include "tree-ssa-live.h"
67 #include "tree-outof-ssa.h"
68 #include "cfgloop.h"
69 #include "insn-attr.h" /* For INSN_SCHEDULING. */
70 #include "stringpool.h"
71 #include "attribs.h"
72 #include "asan.h"
73 #include "tree-ssa-address.h"
74 #include "output.h"
75 #include "builtins.h"
76 #include "opts.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 switch (gimple_assign_rhs_class (stmt))
109 case GIMPLE_TERNARY_RHS:
110 t = build3 (gimple_assign_rhs_code (stmt),
111 TREE_TYPE (gimple_assign_lhs (stmt)),
112 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt),
113 gimple_assign_rhs3 (stmt));
114 break;
115 case GIMPLE_BINARY_RHS:
116 t = build2 (gimple_assign_rhs_code (stmt),
117 TREE_TYPE (gimple_assign_lhs (stmt)),
118 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt));
119 break;
120 case GIMPLE_UNARY_RHS:
121 t = build1 (gimple_assign_rhs_code (stmt),
122 TREE_TYPE (gimple_assign_lhs (stmt)),
123 gimple_assign_rhs1 (stmt));
124 break;
125 case GIMPLE_SINGLE_RHS:
127 t = gimple_assign_rhs1 (stmt);
128 /* Avoid modifying this tree in place below. */
129 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
130 && gimple_location (stmt) != EXPR_LOCATION (t))
131 || (gimple_block (stmt) && currently_expanding_to_rtl
132 && EXPR_P (t)))
133 t = copy_node (t);
134 break;
136 default:
137 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 class stack_var
310 public:
311 /* The Variable. */
312 tree decl;
314 /* Initially, the size of the variable. Later, the size of the partition,
315 if this variable becomes it's partition's representative. */
316 poly_uint64 size;
318 /* The *byte* alignment required for this variable. Or as, with the
319 size, the alignment for this partition. */
320 unsigned int alignb;
322 /* The partition representative. */
323 size_t representative;
325 /* The next stack variable in the partition, or EOC. */
326 size_t next;
328 /* The numbers of conflicting stack variables. */
329 bitmap conflicts;
332 #define EOC ((size_t)-1)
334 /* We have an array of such objects while deciding allocation. */
335 static class stack_var *stack_vars;
336 static size_t stack_vars_alloc;
337 static size_t stack_vars_num;
338 static hash_map<tree, size_t> *decl_to_stack_part;
340 /* Conflict bitmaps go on this obstack. This allows us to destroy
341 all of them in one big sweep. */
342 static bitmap_obstack stack_var_bitmap_obstack;
344 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
345 is non-decreasing. */
346 static size_t *stack_vars_sorted;
348 /* The phase of the stack frame. This is the known misalignment of
349 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
350 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
351 static int frame_phase;
353 /* Used during expand_used_vars to remember if we saw any decls for
354 which we'd like to enable stack smashing protection. */
355 static bool has_protected_decls;
357 /* Used during expand_used_vars. Remember if we saw a character buffer
358 smaller than our cutoff threshold. Used for -Wstack-protector. */
359 static bool has_short_buffer;
361 /* Compute the byte alignment to use for DECL. Ignore alignment
362 we can't do with expected alignment of the stack boundary. */
364 static unsigned int
365 align_local_variable (tree decl, bool really_expand)
367 unsigned int align;
369 if (TREE_CODE (decl) == SSA_NAME)
371 tree type = TREE_TYPE (decl);
372 machine_mode mode = TYPE_MODE (type);
374 align = TYPE_ALIGN (type);
375 if (mode != BLKmode
376 && align < GET_MODE_ALIGNMENT (mode))
377 align = GET_MODE_ALIGNMENT (mode);
379 else
380 align = LOCAL_DECL_ALIGNMENT (decl);
382 if (hwasan_sanitize_stack_p ())
383 align = MAX (align, (unsigned) HWASAN_TAG_GRANULE_SIZE * BITS_PER_UNIT);
385 if (TREE_CODE (decl) != SSA_NAME && really_expand)
386 /* Don't change DECL_ALIGN when called from estimated_stack_frame_size.
387 That is done before IPA and could bump alignment based on host
388 backend even for offloaded code which wants different
389 LOCAL_DECL_ALIGNMENT. */
390 SET_DECL_ALIGN (decl, align);
392 return align / BITS_PER_UNIT;
395 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
396 down otherwise. Return truncated BASE value. */
398 static inline unsigned HOST_WIDE_INT
399 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
401 return align_up ? (base + align - 1) & -align : base & -align;
404 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
405 Return the frame offset. */
407 static poly_int64
408 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
410 poly_int64 offset, new_frame_offset;
412 if (FRAME_GROWS_DOWNWARD)
414 new_frame_offset
415 = aligned_lower_bound (frame_offset - frame_phase - size,
416 align) + frame_phase;
417 offset = new_frame_offset;
419 else
421 new_frame_offset
422 = aligned_upper_bound (frame_offset - frame_phase,
423 align) + frame_phase;
424 offset = new_frame_offset;
425 new_frame_offset += size;
427 frame_offset = new_frame_offset;
429 if (frame_offset_overflow (frame_offset, cfun->decl))
430 frame_offset = offset = 0;
432 return offset;
435 /* Ensure that the stack is aligned to ALIGN bytes.
436 Return the new frame offset. */
437 static poly_int64
438 align_frame_offset (unsigned HOST_WIDE_INT align)
440 return alloc_stack_frame_space (0, align);
443 /* Accumulate DECL into STACK_VARS. */
445 static void
446 add_stack_var (tree decl, bool really_expand)
448 class stack_var *v;
450 if (stack_vars_num >= stack_vars_alloc)
452 if (stack_vars_alloc)
453 stack_vars_alloc = stack_vars_alloc * 3 / 2;
454 else
455 stack_vars_alloc = 32;
456 stack_vars
457 = XRESIZEVEC (class stack_var, stack_vars, stack_vars_alloc);
459 if (!decl_to_stack_part)
460 decl_to_stack_part = new hash_map<tree, size_t>;
462 v = &stack_vars[stack_vars_num];
463 decl_to_stack_part->put (decl, stack_vars_num);
465 v->decl = decl;
466 tree size = TREE_CODE (decl) == SSA_NAME
467 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
468 : DECL_SIZE_UNIT (decl);
469 v->size = tree_to_poly_uint64 (size);
470 /* Ensure that all variables have size, so that &a != &b for any two
471 variables that are simultaneously live. */
472 if (known_eq (v->size, 0U))
473 v->size = 1;
474 v->alignb = align_local_variable (decl, really_expand);
475 /* An alignment of zero can mightily confuse us later. */
476 gcc_assert (v->alignb != 0);
478 /* All variables are initially in their own partition. */
479 v->representative = stack_vars_num;
480 v->next = EOC;
482 /* All variables initially conflict with no other. */
483 v->conflicts = NULL;
485 /* Ensure that this decl doesn't get put onto the list twice. */
486 set_rtl (decl, pc_rtx);
488 stack_vars_num++;
491 /* Make the decls associated with luid's X and Y conflict. */
493 static void
494 add_stack_var_conflict (size_t x, size_t y)
496 class stack_var *a = &stack_vars[x];
497 class stack_var *b = &stack_vars[y];
498 if (x == y)
499 return;
500 if (!a->conflicts)
501 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
502 if (!b->conflicts)
503 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
504 bitmap_set_bit (a->conflicts, y);
505 bitmap_set_bit (b->conflicts, x);
508 /* Check whether the decls associated with luid's X and Y conflict. */
510 static bool
511 stack_var_conflict_p (size_t x, size_t y)
513 class stack_var *a = &stack_vars[x];
514 class stack_var *b = &stack_vars[y];
515 if (x == y)
516 return false;
517 /* Partitions containing an SSA name result from gimple registers
518 with things like unsupported modes. They are top-level and
519 hence conflict with everything else. */
520 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
521 return true;
523 if (!a->conflicts || !b->conflicts)
524 return false;
525 return bitmap_bit_p (a->conflicts, y);
528 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
529 enter its partition number into bitmap DATA. */
531 static bool
532 visit_op (gimple *, tree op, tree, void *data)
534 bitmap active = (bitmap)data;
535 op = get_base_address (op);
536 if (op
537 && DECL_P (op)
538 && DECL_RTL_IF_SET (op) == pc_rtx)
540 size_t *v = decl_to_stack_part->get (op);
541 if (v)
542 bitmap_set_bit (active, *v);
544 return false;
547 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
548 record conflicts between it and all currently active other partitions
549 from bitmap DATA. */
551 static bool
552 visit_conflict (gimple *, tree op, tree, void *data)
554 bitmap active = (bitmap)data;
555 op = get_base_address (op);
556 if (op
557 && DECL_P (op)
558 && DECL_RTL_IF_SET (op) == pc_rtx)
560 size_t *v = decl_to_stack_part->get (op);
561 if (v && bitmap_set_bit (active, *v))
563 size_t num = *v;
564 bitmap_iterator bi;
565 unsigned i;
566 gcc_assert (num < stack_vars_num);
567 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
568 add_stack_var_conflict (num, i);
571 return false;
574 /* Helper routine for add_scope_conflicts, calculating the active partitions
575 at the end of BB, leaving the result in WORK. We're called to generate
576 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
577 liveness. */
579 static void
580 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
582 edge e;
583 edge_iterator ei;
584 gimple_stmt_iterator gsi;
585 walk_stmt_load_store_addr_fn visit;
587 bitmap_clear (work);
588 FOR_EACH_EDGE (e, ei, bb->preds)
589 bitmap_ior_into (work, (bitmap)e->src->aux);
591 visit = visit_op;
593 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
595 gimple *stmt = gsi_stmt (gsi);
596 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
598 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
600 gimple *stmt = gsi_stmt (gsi);
602 if (gimple_clobber_p (stmt))
604 tree lhs = gimple_assign_lhs (stmt);
605 size_t *v;
606 /* Nested function lowering might introduce LHSs
607 that are COMPONENT_REFs. */
608 if (!VAR_P (lhs))
609 continue;
610 if (DECL_RTL_IF_SET (lhs) == pc_rtx
611 && (v = decl_to_stack_part->get (lhs)))
612 bitmap_clear_bit (work, *v);
614 else if (!is_gimple_debug (stmt))
616 if (for_conflict
617 && visit == visit_op)
619 /* If this is the first real instruction in this BB we need
620 to add conflicts for everything live at this point now.
621 Unlike classical liveness for named objects we can't
622 rely on seeing a def/use of the names we're interested in.
623 There might merely be indirect loads/stores. We'd not add any
624 conflicts for such partitions. */
625 bitmap_iterator bi;
626 unsigned i;
627 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
629 class stack_var *a = &stack_vars[i];
630 if (!a->conflicts)
631 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
632 bitmap_ior_into (a->conflicts, work);
634 visit = visit_conflict;
636 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
641 /* Generate stack partition conflicts between all partitions that are
642 simultaneously live. */
644 static void
645 add_scope_conflicts (void)
647 basic_block bb;
648 bool changed;
649 bitmap work = BITMAP_ALLOC (NULL);
650 int *rpo;
651 int n_bbs;
653 /* We approximate the live range of a stack variable by taking the first
654 mention of its name as starting point(s), and by the end-of-scope
655 death clobber added by gimplify as ending point(s) of the range.
656 This overapproximates in the case we for instance moved an address-taken
657 operation upward, without also moving a dereference to it upwards.
658 But it's conservatively correct as a variable never can hold values
659 before its name is mentioned at least once.
661 We then do a mostly classical bitmap liveness algorithm. */
663 FOR_ALL_BB_FN (bb, cfun)
664 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
666 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
667 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
669 changed = true;
670 while (changed)
672 int i;
673 changed = false;
674 for (i = 0; i < n_bbs; i++)
676 bitmap active;
677 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
678 active = (bitmap)bb->aux;
679 add_scope_conflicts_1 (bb, work, false);
680 if (bitmap_ior_into (active, work))
681 changed = true;
685 FOR_EACH_BB_FN (bb, cfun)
686 add_scope_conflicts_1 (bb, work, true);
688 free (rpo);
689 BITMAP_FREE (work);
690 FOR_ALL_BB_FN (bb, cfun)
691 BITMAP_FREE (bb->aux);
694 /* A subroutine of partition_stack_vars. A comparison function for qsort,
695 sorting an array of indices by the properties of the object. */
697 static int
698 stack_var_cmp (const void *a, const void *b)
700 size_t ia = *(const size_t *)a;
701 size_t ib = *(const size_t *)b;
702 unsigned int aligna = stack_vars[ia].alignb;
703 unsigned int alignb = stack_vars[ib].alignb;
704 poly_int64 sizea = stack_vars[ia].size;
705 poly_int64 sizeb = stack_vars[ib].size;
706 tree decla = stack_vars[ia].decl;
707 tree declb = stack_vars[ib].decl;
708 bool largea, largeb;
709 unsigned int uida, uidb;
711 /* Primary compare on "large" alignment. Large comes first. */
712 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
713 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
714 if (largea != largeb)
715 return (int)largeb - (int)largea;
717 /* Secondary compare on size, decreasing */
718 int diff = compare_sizes_for_sort (sizeb, sizea);
719 if (diff != 0)
720 return diff;
722 /* Tertiary compare on true alignment, decreasing. */
723 if (aligna < alignb)
724 return -1;
725 if (aligna > alignb)
726 return 1;
728 /* Final compare on ID for sort stability, increasing.
729 Two SSA names are compared by their version, SSA names come before
730 non-SSA names, and two normal decls are compared by their DECL_UID. */
731 if (TREE_CODE (decla) == SSA_NAME)
733 if (TREE_CODE (declb) == SSA_NAME)
734 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
735 else
736 return -1;
738 else if (TREE_CODE (declb) == SSA_NAME)
739 return 1;
740 else
741 uida = DECL_UID (decla), uidb = DECL_UID (declb);
742 if (uida < uidb)
743 return 1;
744 if (uida > uidb)
745 return -1;
746 return 0;
749 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
750 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
752 /* If the points-to solution *PI points to variables that are in a partition
753 together with other variables add all partition members to the pointed-to
754 variables bitmap. */
756 static void
757 add_partitioned_vars_to_ptset (struct pt_solution *pt,
758 part_hashmap *decls_to_partitions,
759 hash_set<bitmap> *visited, bitmap temp)
761 bitmap_iterator bi;
762 unsigned i;
763 bitmap *part;
765 if (pt->anything
766 || pt->vars == NULL
767 /* The pointed-to vars bitmap is shared, it is enough to
768 visit it once. */
769 || visited->add (pt->vars))
770 return;
772 bitmap_clear (temp);
774 /* By using a temporary bitmap to store all members of the partitions
775 we have to add we make sure to visit each of the partitions only
776 once. */
777 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
778 if ((!temp
779 || !bitmap_bit_p (temp, i))
780 && (part = decls_to_partitions->get (i)))
781 bitmap_ior_into (temp, *part);
782 if (!bitmap_empty_p (temp))
783 bitmap_ior_into (pt->vars, temp);
786 /* Update points-to sets based on partition info, so we can use them on RTL.
787 The bitmaps representing stack partitions will be saved until expand,
788 where partitioned decls used as bases in memory expressions will be
789 rewritten.
791 It is not necessary to update TBAA info on accesses to the coalesced
792 storage since our memory model doesn't allow TBAA to be used for
793 WAW or WAR dependences. For RAW when the write is to an old object
794 the new object would not have been initialized at the point of the
795 read, invoking undefined behavior. */
797 static void
798 update_alias_info_with_stack_vars (void)
800 part_hashmap *decls_to_partitions = NULL;
801 size_t i, j;
802 tree var = NULL_TREE;
804 for (i = 0; i < stack_vars_num; i++)
806 bitmap part = NULL;
807 tree name;
808 struct ptr_info_def *pi;
810 /* Not interested in partitions with single variable. */
811 if (stack_vars[i].representative != i
812 || stack_vars[i].next == EOC)
813 continue;
815 if (!decls_to_partitions)
817 decls_to_partitions = new part_hashmap;
818 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
821 /* Create an SSA_NAME that points to the partition for use
822 as base during alias-oracle queries on RTL for bases that
823 have been partitioned. */
824 if (var == NULL_TREE)
825 var = create_tmp_var (ptr_type_node);
826 name = make_ssa_name (var);
828 /* Create bitmaps representing partitions. They will be used for
829 points-to sets later, so use GGC alloc. */
830 part = BITMAP_GGC_ALLOC ();
831 for (j = i; j != EOC; j = stack_vars[j].next)
833 tree decl = stack_vars[j].decl;
834 unsigned int uid = DECL_PT_UID (decl);
835 bitmap_set_bit (part, uid);
836 decls_to_partitions->put (uid, part);
837 cfun->gimple_df->decls_to_pointers->put (decl, name);
838 if (TREE_ADDRESSABLE (decl))
839 TREE_ADDRESSABLE (name) = 1;
842 /* Make the SSA name point to all partition members. */
843 pi = get_ptr_info (name);
844 pt_solution_set (&pi->pt, part, false);
847 /* Make all points-to sets that contain one member of a partition
848 contain all members of the partition. */
849 if (decls_to_partitions)
851 unsigned i;
852 tree name;
853 hash_set<bitmap> visited;
854 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
856 FOR_EACH_SSA_NAME (i, name, cfun)
858 struct ptr_info_def *pi;
860 if (POINTER_TYPE_P (TREE_TYPE (name))
861 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
862 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
863 &visited, temp);
866 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
867 decls_to_partitions, &visited, temp);
868 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped_return,
869 decls_to_partitions, &visited, temp);
870 delete decls_to_partitions;
871 BITMAP_FREE (temp);
875 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
876 partitioning algorithm. Partitions A and B are known to be non-conflicting.
877 Merge them into a single partition A. */
879 static void
880 union_stack_vars (size_t a, size_t b)
882 class stack_var *vb = &stack_vars[b];
883 bitmap_iterator bi;
884 unsigned u;
886 gcc_assert (stack_vars[b].next == EOC);
887 /* Add B to A's partition. */
888 stack_vars[b].next = stack_vars[a].next;
889 stack_vars[b].representative = a;
890 stack_vars[a].next = b;
892 /* Make sure A is big enough to hold B. */
893 stack_vars[a].size = upper_bound (stack_vars[a].size, stack_vars[b].size);
895 /* Update the required alignment of partition A to account for B. */
896 if (stack_vars[a].alignb < stack_vars[b].alignb)
897 stack_vars[a].alignb = stack_vars[b].alignb;
899 /* Update the interference graph and merge the conflicts. */
900 if (vb->conflicts)
902 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
903 add_stack_var_conflict (a, stack_vars[u].representative);
904 BITMAP_FREE (vb->conflicts);
908 /* A subroutine of expand_used_vars. Binpack the variables into
909 partitions constrained by the interference graph. The overall
910 algorithm used is as follows:
912 Sort the objects by size in descending order.
913 For each object A {
914 S = size(A)
915 O = 0
916 loop {
917 Look for the largest non-conflicting object B with size <= S.
918 UNION (A, B)
923 static void
924 partition_stack_vars (void)
926 size_t si, sj, n = stack_vars_num;
928 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
929 for (si = 0; si < n; ++si)
930 stack_vars_sorted[si] = si;
932 if (n == 1)
933 return;
935 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
937 for (si = 0; si < n; ++si)
939 size_t i = stack_vars_sorted[si];
940 unsigned int ialign = stack_vars[i].alignb;
941 poly_int64 isize = stack_vars[i].size;
943 /* Ignore objects that aren't partition representatives. If we
944 see a var that is not a partition representative, it must
945 have been merged earlier. */
946 if (stack_vars[i].representative != i)
947 continue;
949 for (sj = si + 1; sj < n; ++sj)
951 size_t j = stack_vars_sorted[sj];
952 unsigned int jalign = stack_vars[j].alignb;
953 poly_int64 jsize = stack_vars[j].size;
955 /* Ignore objects that aren't partition representatives. */
956 if (stack_vars[j].representative != j)
957 continue;
959 /* Do not mix objects of "small" (supported) alignment
960 and "large" (unsupported) alignment. */
961 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
962 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
963 break;
965 /* For Address Sanitizer do not mix objects with different
966 sizes, as the shorter vars wouldn't be adequately protected.
967 Don't do that for "large" (unsupported) alignment objects,
968 those aren't protected anyway. */
969 if (asan_sanitize_stack_p ()
970 && maybe_ne (isize, jsize)
971 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
972 break;
974 /* Ignore conflicting objects. */
975 if (stack_var_conflict_p (i, j))
976 continue;
978 /* UNION the objects, placing J at OFFSET. */
979 union_stack_vars (i, j);
983 update_alias_info_with_stack_vars ();
986 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
988 static void
989 dump_stack_var_partition (void)
991 size_t si, i, j, n = stack_vars_num;
993 for (si = 0; si < n; ++si)
995 i = stack_vars_sorted[si];
997 /* Skip variables that aren't partition representatives, for now. */
998 if (stack_vars[i].representative != i)
999 continue;
1001 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
1002 print_dec (stack_vars[i].size, dump_file);
1003 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
1005 for (j = i; j != EOC; j = stack_vars[j].next)
1007 fputc ('\t', dump_file);
1008 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
1010 fputc ('\n', dump_file);
1014 /* Assign rtl to DECL at BASE + OFFSET. */
1016 static void
1017 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
1018 poly_int64 offset)
1020 unsigned align;
1021 rtx x;
1023 /* If this fails, we've overflowed the stack frame. Error nicely? */
1024 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
1026 if (hwasan_sanitize_stack_p ())
1027 x = targetm.memtag.add_tag (base, offset,
1028 hwasan_current_frame_tag ());
1029 else
1030 x = plus_constant (Pmode, base, offset);
1032 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
1033 ? TYPE_MODE (TREE_TYPE (decl))
1034 : DECL_MODE (decl), x);
1036 /* Set alignment we actually gave this decl if it isn't an SSA name.
1037 If it is we generate stack slots only accidentally so it isn't as
1038 important, we'll simply set the alignment directly on the MEM. */
1040 if (stack_vars_base_reg_p (base))
1041 offset -= frame_phase;
1042 align = known_alignment (offset);
1043 align *= BITS_PER_UNIT;
1044 if (align == 0 || align > base_align)
1045 align = base_align;
1047 if (TREE_CODE (decl) != SSA_NAME)
1049 /* One would think that we could assert that we're not decreasing
1050 alignment here, but (at least) the i386 port does exactly this
1051 via the MINIMUM_ALIGNMENT hook. */
1053 SET_DECL_ALIGN (decl, align);
1054 DECL_USER_ALIGN (decl) = 0;
1057 set_rtl (decl, x);
1059 set_mem_align (x, align);
1062 class stack_vars_data
1064 public:
1065 /* Vector of offset pairs, always end of some padding followed
1066 by start of the padding that needs Address Sanitizer protection.
1067 The vector is in reversed, highest offset pairs come first. */
1068 auto_vec<HOST_WIDE_INT> asan_vec;
1070 /* Vector of partition representative decls in between the paddings. */
1071 auto_vec<tree> asan_decl_vec;
1073 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1074 rtx asan_base;
1076 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1077 unsigned int asan_alignb;
1080 /* A subroutine of expand_used_vars. Give each partition representative
1081 a unique location within the stack frame. Update each partition member
1082 with that location.

PRED, when non-null, selects the partitions allocated by this call:
partitions for which PRED returns false are skipped, and so are all
partitions that need "large" alignment. With a null PRED every
partition that has no rtl yet is allocated.

DATA receives the Address Sanitizer bookkeeping (offset pairs,
representative decls, base pseudo and alignment). It is only written
on the asan path, which is taken only when PRED is non-null. */
1083 static void
1084 expand_stack_vars (bool (*pred) (size_t), class stack_vars_data *data)
1086 size_t si, i, j, n = stack_vars_num;
1087 poly_uint64 large_size = 0, large_alloc = 0;
1088 rtx large_base = NULL;
1089 rtx large_untagged_base = NULL;
1090 unsigned large_align = 0;
1091 bool large_allocation_done = false;
1092 tree decl;
1094 /* Determine if there are any variables requiring "large" alignment.
1095 Since these are dynamically allocated, we only process these if
1096 no predicate involved. */
1097 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1098 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1100 /* Find the total size of these variables. */
1101 for (si = 0; si < n; ++si)
1103 unsigned alignb;
1105 i = stack_vars_sorted[si];
1106 alignb = stack_vars[i].alignb;
1108 /* All "large" alignment decls come before all "small" alignment
1109 decls, but "large" alignment decls are not sorted based on
1110 their alignment. Increase large_align to track the largest
1111 required alignment. */
1112 if ((alignb * BITS_PER_UNIT) > large_align)
1113 large_align = alignb * BITS_PER_UNIT;
1115 /* Stop when we get to the first decl with "small" alignment. */
1116 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1117 break;
1119 /* Skip variables that aren't partition representatives. */
1120 if (stack_vars[i].representative != i)
1121 continue;
1123 /* Skip variables that have already had rtl assigned. See also
1124 add_stack_var where we perpetrate this pc_rtx hack. */
1125 decl = stack_vars[i].decl;
1126 if (TREE_CODE (decl) == SSA_NAME
1127 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1128 : DECL_RTL (decl) != pc_rtx)
1129 continue;
/* Add this representative's size, after padding the running total to
the representative's own alignment. */
1131 large_size = aligned_upper_bound (large_size, alignb);
1132 large_size += stack_vars[i].size;
/* Allocation pass over the partitions, in stack_vars_sorted order. */
1136 for (si = 0; si < n; ++si)
1138 rtx base;
1139 unsigned base_align, alignb;
1140 poly_int64 offset = 0;
1142 i = stack_vars_sorted[si];
1144 /* Skip variables that aren't partition representatives, for now. */
1145 if (stack_vars[i].representative != i)
1146 continue;
1148 /* Skip variables that have already had rtl assigned. See also
1149 add_stack_var where we perpetrate this pc_rtx hack. */
1150 decl = stack_vars[i].decl;
1151 if (TREE_CODE (decl) == SSA_NAME
1152 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1153 : DECL_RTL (decl) != pc_rtx)
1154 continue;
1156 /* Check the predicate to see whether this variable should be
1157 allocated in this pass. */
1158 if (pred && !pred (i))
1159 continue;
/* Default base; replaced further down by the asan base or by the
dynamically allocated large-alignment base. */
1161 base = (hwasan_sanitize_stack_p ()
1162 ? hwasan_frame_base ()
1163 : virtual_stack_vars_rtx);
1164 alignb = stack_vars[i].alignb;
/* "Small" alignment: the slot is carved directly out of the frame. */
1165 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1167 poly_int64 hwasan_orig_offset;
1168 if (hwasan_sanitize_stack_p ())
1170 /* There must be no tag granule "shared" between different
1171 objects. This means that no HWASAN_TAG_GRANULE_SIZE byte
1172 chunk can have more than one object in it.
1174 We ensure this by forcing the end of the last bit of data to
1175 be aligned to HWASAN_TAG_GRANULE_SIZE bytes here, and setting
1176 the start of each variable to be aligned to
1177 HWASAN_TAG_GRANULE_SIZE bytes in `align_local_variable`.
1179 We can't align just one of the start or end, since there are
1180 untagged things stored on the stack which we do not align to
1181 HWASAN_TAG_GRANULE_SIZE bytes. If we only aligned the start
1182 or the end of tagged objects then untagged objects could end
1183 up sharing the first granule of a tagged object or sharing the
1184 last granule of a tagged object respectively. */
1185 hwasan_orig_offset = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1186 gcc_assert (stack_vars[i].alignb >= HWASAN_TAG_GRANULE_SIZE);
1188 /* ASAN description strings don't yet have a syntax for expressing
1189 polynomial offsets. */
1190 HOST_WIDE_INT prev_offset;
1191 if (asan_sanitize_stack_p ()
1192 && pred
1193 && frame_offset.is_constant (&prev_offset)
1194 && stack_vars[i].size.is_constant ())
1196 if (data->asan_vec.is_empty ())
1198 align_frame_offset (ASAN_RED_ZONE_SIZE);
1199 prev_offset = frame_offset.to_constant ();
1201 prev_offset = align_base (prev_offset,
1202 ASAN_MIN_RED_ZONE_SIZE,
1203 !FRAME_GROWS_DOWNWARD);
1204 tree repr_decl = NULL_TREE;
1205 unsigned HOST_WIDE_INT size
1206 = asan_var_and_redzone_size (stack_vars[i].size.to_constant ());
1207 if (data->asan_vec.is_empty ())
1208 size = MAX (size, ASAN_RED_ZONE_SIZE);
1210 unsigned HOST_WIDE_INT alignment = MAX (alignb,
1211 ASAN_MIN_RED_ZONE_SIZE);
1212 offset = alloc_stack_frame_space (size, alignment);
1214 data->asan_vec.safe_push (prev_offset);
1215 /* Allocating a constant amount of space from a constant
1216 starting offset must give a constant result. */
1217 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1218 .to_constant ());
1219 /* Find best representative of the partition.
1220 Prefer those with DECL_NAME, even better
1221 satisfying asan_protect_stack_decl predicate. */
1222 for (j = i; j != EOC; j = stack_vars[j].next)
1223 if (asan_protect_stack_decl (stack_vars[j].decl)
1224 && DECL_NAME (stack_vars[j].decl))
1226 repr_decl = stack_vars[j].decl;
1227 break;
1229 else if (repr_decl == NULL_TREE
1230 && DECL_P (stack_vars[j].decl)
1231 && DECL_NAME (stack_vars[j].decl))
1232 repr_decl = stack_vars[j].decl;
1233 if (repr_decl == NULL_TREE)
1234 repr_decl = stack_vars[i].decl;
1235 data->asan_decl_vec.safe_push (repr_decl);
1237 /* Make sure a representative is unpoison if another
1238 variable in the partition is handled by
1239 use-after-scope sanitization. */
1240 if (asan_handled_variables != NULL
1241 && !asan_handled_variables->contains (repr_decl))
1243 for (j = i; j != EOC; j = stack_vars[j].next)
1244 if (asan_handled_variables->contains (stack_vars[j].decl))
1245 break;
1246 if (j != EOC)
1247 asan_handled_variables->add (repr_decl);
1250 data->asan_alignb = MAX (data->asan_alignb, alignb);
1251 if (data->asan_base == NULL)
1252 data->asan_base = gen_reg_rtx (Pmode);
1253 base = data->asan_base;
1255 if (!STRICT_ALIGNMENT)
1256 base_align = crtl->max_used_stack_slot_alignment;
1257 else
1258 base_align = MAX (crtl->max_used_stack_slot_alignment,
1259 GET_MODE_ALIGNMENT (SImode)
1260 << ASAN_SHADOW_SHIFT);
1262 else
1264 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1265 base_align = crtl->max_used_stack_slot_alignment;
1267 if (hwasan_sanitize_stack_p ())
1269 /* Align again since the point of this alignment is to handle
1270 the "end" of the object (i.e. smallest address after the
1271 stack object). For FRAME_GROWS_DOWNWARD that requires
1272 aligning the stack before allocating, but for a frame that
1273 grows upwards that requires aligning the stack after
1274 allocation.
1276 Use `frame_offset` to record the offset value rather than
1277 `offset` since the `frame_offset` describes the extent
1278 allocated for this particular variable while `offset`
1279 describes the address that this variable starts at. */
1280 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1281 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1282 hwasan_orig_offset, frame_offset);
1286 else
1288 /* Large alignment is only processed in the last pass. */
1289 if (pred)
1290 continue;
1292 /* If there were any variables requiring "large" alignment, allocate
1293 space. */
1294 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1296 poly_int64 loffset;
1297 rtx large_allocsize;
1299 large_allocsize = gen_int_mode (large_size, Pmode);
1300 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1301 loffset = alloc_stack_frame_space
1302 (rtx_to_poly_int64 (large_allocsize),
1303 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1304 large_base = get_dynamic_stack_base (loffset, large_align, base);
1305 large_allocation_done = true;
1308 gcc_assert (large_base != NULL);
1309 large_alloc = aligned_upper_bound (large_alloc, alignb);
/* OFFSET is relative to LARGE_BASE here, not to the frame base. */
1310 offset = large_alloc;
1311 large_alloc += stack_vars[i].size;
1312 if (hwasan_sanitize_stack_p ())
1314 /* An object with a large alignment requirement means that the
1315 alignment requirement is greater than the required alignment
1316 for tags. */
1317 if (!large_untagged_base)
1318 large_untagged_base
1319 = targetm.memtag.untagged_pointer (large_base, NULL_RTX);
1320 /* Ensure the end of the variable is also aligned correctly. */
1321 poly_int64 align_again
1322 = aligned_upper_bound (large_alloc, HWASAN_TAG_GRANULE_SIZE);
1323 /* For large allocations we always allocate a chunk of space
1324 (which is addressed by large_untagged_base/large_base) and
1325 then use positive offsets from that. Hence the farthest
1326 offset is `align_again` and the nearest offset from the base
1327 is `offset`. */
1328 hwasan_record_stack_var (large_untagged_base, large_base,
1329 offset, align_again);
1332 base = large_base;
1333 base_align = large_align;
1336 /* Create rtl for each variable based on their location within the
1337 partition. */
1338 for (j = i; j != EOC; j = stack_vars[j].next)
1340 expand_one_stack_var_at (stack_vars[j].decl,
1341 base, base_align, offset);
1343 if (hwasan_sanitize_stack_p ())
1344 hwasan_increment_frame_tag ();
/* The offsets handed out from the large block must add up to the size
computed by the sizing loop above. */
1347 gcc_assert (known_eq (large_alloc, large_size));
1350 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1351 static poly_uint64
1352 account_stack_vars (void)
1354 size_t si, j, i, n = stack_vars_num;
1355 poly_uint64 size = 0;
1357 for (si = 0; si < n; ++si)
1359 i = stack_vars_sorted[si];
1361 /* Skip variables that aren't partition representatives, for now. */
1362 if (stack_vars[i].representative != i)
1363 continue;
1365 size += stack_vars[i].size;
1366 for (j = i; j != EOC; j = stack_vars[j].next)
1367 set_rtl (stack_vars[j].decl, NULL);
1369 return size;
1372 /* Record the RTL assignment X for the default def of PARM. */
1374 extern void
1375 set_parm_rtl (tree parm, rtx x)
1377 gcc_assert (TREE_CODE (parm) == PARM_DECL
1378 || TREE_CODE (parm) == RESULT_DECL);
1380 if (x && !MEM_P (x))
1382 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1383 TYPE_MODE (TREE_TYPE (parm)),
1384 TYPE_ALIGN (TREE_TYPE (parm)));
1386 /* If the variable alignment is very large we'll dynamicaly
1387 allocate it, which means that in-frame portion is just a
1388 pointer. ??? We've got a pseudo for sure here, do we
1389 actually dynamically allocate its spilling area if needed?
1390 ??? Isn't it a problem when Pmode alignment also exceeds
1391 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1392 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1393 align = GET_MODE_ALIGNMENT (Pmode);
1395 record_alignment_for_reg_var (align);
1398 tree ssa = ssa_default_def (cfun, parm);
1399 if (!ssa)
1400 return set_rtl (parm, x);
1402 int part = var_to_partition (SA.map, ssa);
1403 gcc_assert (part != NO_PARTITION);
1405 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1406 gcc_assert (changed);
1408 set_rtl (ssa, x);
1409 gcc_assert (DECL_RTL (parm) == x);
1412 /* A subroutine of expand_one_var. Called to immediately assign rtl
1413 to a variable to be allocated in the stack frame. */
1415 static void
1416 expand_one_stack_var_1 (tree var)
1418 poly_uint64 size;
1419 poly_int64 offset;
1420 unsigned byte_align;
1422 if (TREE_CODE (var) == SSA_NAME)
1424 tree type = TREE_TYPE (var);
1425 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1427 else
1428 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1430 byte_align = align_local_variable (var, true);
1432 /* We handle highly aligned variables in expand_stack_vars. */
1433 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1435 rtx base;
1436 if (hwasan_sanitize_stack_p ())
1438 /* Allocate zero bytes to align the stack. */
1439 poly_int64 hwasan_orig_offset
1440 = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1441 offset = alloc_stack_frame_space (size, byte_align);
1442 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1443 base = hwasan_frame_base ();
1444 /* Use `frame_offset` to automatically account for machines where the
1445 frame grows upwards.
1447 `offset` will always point to the "start" of the stack object, which
1448 will be the smallest address, for ! FRAME_GROWS_DOWNWARD this is *not*
1449 the "furthest" offset from the base delimiting the current stack
1450 object. `frame_offset` will always delimit the extent that the frame.
1452 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1453 hwasan_orig_offset, frame_offset);
1455 else
1457 offset = alloc_stack_frame_space (size, byte_align);
1458 base = virtual_stack_vars_rtx;
1461 expand_one_stack_var_at (var, base,
1462 crtl->max_used_stack_slot_alignment, offset);
1464 if (hwasan_sanitize_stack_p ())
1465 hwasan_increment_frame_tag ();
1468 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1469 already assigned some MEM. */
1471 static void
1472 expand_one_stack_var (tree var)
1474 if (TREE_CODE (var) == SSA_NAME)
1476 int part = var_to_partition (SA.map, var);
1477 if (part != NO_PARTITION)
1479 rtx x = SA.partition_to_pseudo[part];
1480 gcc_assert (x);
1481 gcc_assert (MEM_P (x));
1482 return;
1486 return expand_one_stack_var_1 (var);
1489 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1490 that will reside in a hard register. */
1492 static void
1493 expand_one_hard_reg_var (tree var)
1495 rest_of_decl_compilation (var, 0, 0);
1498 /* Record the alignment requirements of some variable assigned to a
1499 pseudo. */
1501 static void
1502 record_alignment_for_reg_var (unsigned int align)
1504 if (SUPPORTS_STACK_ALIGNMENT
1505 && crtl->stack_alignment_estimated < align)
1507 /* stack_alignment_estimated shouldn't change after stack
1508 realign decision made */
1509 gcc_assert (!crtl->stack_realign_processed);
1510 crtl->stack_alignment_estimated = align;
1513 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1514 So here we only make sure stack_alignment_needed >= align. */
1515 if (crtl->stack_alignment_needed < align)
1516 crtl->stack_alignment_needed = align;
1517 if (crtl->max_used_stack_slot_alignment < align)
1518 crtl->max_used_stack_slot_alignment = align;
1521 /* Create RTL for an SSA partition. */
1523 static void
1524 expand_one_ssa_partition (tree var)
1526 int part = var_to_partition (SA.map, var);
1527 gcc_assert (part != NO_PARTITION);
1529 if (SA.partition_to_pseudo[part])
1530 return;
1532 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1533 TYPE_MODE (TREE_TYPE (var)),
1534 TYPE_ALIGN (TREE_TYPE (var)));
1536 /* If the variable alignment is very large we'll dynamicaly allocate
1537 it, which means that in-frame portion is just a pointer. */
1538 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1539 align = GET_MODE_ALIGNMENT (Pmode);
1541 record_alignment_for_reg_var (align);
1543 if (!use_register_for_decl (var))
1545 if (defer_stack_allocation (var, true))
1546 add_stack_var (var, true);
1547 else
1548 expand_one_stack_var_1 (var);
1549 return;
1552 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1553 rtx x = gen_reg_rtx (reg_mode);
1555 set_rtl (var, x);
1557 /* For a promoted variable, X will not be used directly but wrapped in a
1558 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1559 will assume that its upper bits can be inferred from its lower bits.
1560 Therefore, if X isn't initialized on every path from the entry, then
1561 we must do it manually in order to fulfill the above assumption. */
1562 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1563 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1564 emit_move_insn (x, CONST0_RTX (reg_mode));
1567 /* Record the association between the RTL generated for partition PART
1568 and the underlying variable of the SSA_NAME VAR. */
1570 static void
1571 adjust_one_expanded_partition_var (tree var)
1573 if (!var)
1574 return;
1576 tree decl = SSA_NAME_VAR (var);
1578 int part = var_to_partition (SA.map, var);
1579 if (part == NO_PARTITION)
1580 return;
1582 rtx x = SA.partition_to_pseudo[part];
1584 gcc_assert (x);
1586 set_rtl (var, x);
1588 if (!REG_P (x))
1589 return;
1591 /* Note if the object is a user variable. */
1592 if (decl && !DECL_ARTIFICIAL (decl))
1593 mark_user_reg (x);
1595 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1596 mark_reg_pointer (x, get_pointer_alignment (var));
1599 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1600 that will reside in a pseudo register. */
1602 static void
1603 expand_one_register_var (tree var)
1605 if (TREE_CODE (var) == SSA_NAME)
1607 int part = var_to_partition (SA.map, var);
1608 if (part != NO_PARTITION)
1610 rtx x = SA.partition_to_pseudo[part];
1611 gcc_assert (x);
1612 gcc_assert (REG_P (x));
1613 return;
1615 gcc_unreachable ();
1618 tree decl = var;
1619 tree type = TREE_TYPE (decl);
1620 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1621 rtx x = gen_reg_rtx (reg_mode);
1623 set_rtl (var, x);
1625 /* Note if the object is a user variable. */
1626 if (!DECL_ARTIFICIAL (decl))
1627 mark_user_reg (x);
1629 if (POINTER_TYPE_P (type))
1630 mark_reg_pointer (x, get_pointer_alignment (var));
1633 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1634 has some associated error, e.g. its type is error-mark. We just need
1635 to pick something that won't crash the rest of the compiler. */
1637 static void
1638 expand_one_error_var (tree var)
1640 machine_mode mode = DECL_MODE (var);
1641 rtx x;
1643 if (mode == BLKmode)
1644 x = gen_rtx_MEM (BLKmode, const0_rtx);
1645 else if (mode == VOIDmode)
1646 x = const0_rtx;
1647 else
1648 x = gen_reg_rtx (mode);
1650 SET_DECL_RTL (var, x);
1653 /* A subroutine of expand_one_var. VAR is a variable that will be
1654 allocated to the local stack frame. Return true if we wish to
1655 add VAR to STACK_VARS so that it will be coalesced with other
1656 variables. Return false to allocate VAR immediately.
1658 This function is used to reduce the number of variables considered
1659 for coalescing, which reduces the size of the quadratic problem. */
1661 static bool
1662 defer_stack_allocation (tree var, bool toplevel)
1664 tree size_unit = TREE_CODE (var) == SSA_NAME
1665 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1666 : DECL_SIZE_UNIT (var);
1667 poly_uint64 size;
1669 /* Whether the variable is small enough for immediate allocation not to be
1670 a problem with regard to the frame size. */
1671 bool smallish
1672 = (poly_int_tree_p (size_unit, &size)
1673 && (estimated_poly_value (size)
1674 < param_min_size_for_stack_sharing));
1676 /* If stack protection is enabled, *all* stack variables must be deferred,
1677 so that we can re-order the strings to the top of the frame.
1678 Similarly for Address Sanitizer. */
1679 if (flag_stack_protect || asan_sanitize_stack_p ())
1680 return true;
1682 unsigned int align = TREE_CODE (var) == SSA_NAME
1683 ? TYPE_ALIGN (TREE_TYPE (var))
1684 : DECL_ALIGN (var);
1686 /* We handle "large" alignment via dynamic allocation. We want to handle
1687 this extra complication in only one place, so defer them. */
1688 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1689 return true;
1691 bool ignored = TREE_CODE (var) == SSA_NAME
1692 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1693 : DECL_IGNORED_P (var);
1695 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1696 might be detached from their block and appear at toplevel when we reach
1697 here. We want to coalesce them with variables from other blocks when
1698 the immediate contribution to the frame size would be noticeable. */
1699 if (toplevel && optimize > 0 && ignored && !smallish)
1700 return true;
1702 /* Variables declared in the outermost scope automatically conflict
1703 with every other variable. The only reason to want to defer them
1704 at all is that, after sorting, we can more efficiently pack
1705 small variables in the stack frame. Continue to defer at -O2. */
1706 if (toplevel && optimize < 2)
1707 return false;
1709 /* Without optimization, *most* variables are allocated from the
1710 stack, which makes the quadratic problem large exactly when we
1711 want compilation to proceed as quickly as possible. On the
1712 other hand, we don't want the function's stack frame size to
1713 get completely out of hand. So we avoid adding scalars and
1714 "small" aggregates to the list at all. */
1715 if (optimize == 0 && smallish)
1716 return false;
1718 return true;
1721 /* A subroutine of expand_used_vars. Expand one variable according to
1722 its flavor. Variables to be placed on the stack are not actually
1723 expanded yet, merely recorded.
1724 When REALLY_EXPAND is false, only add stack values to be allocated.
1725 Return stack usage this variable is supposed to take.
1728 static poly_uint64
1729 expand_one_var (tree var, bool toplevel, bool really_expand,
1730 bitmap forced_stack_var = NULL)
1732 unsigned int align = BITS_PER_UNIT;
1733 tree origvar = var;
1735 var = SSAVAR (var);
1737 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1739 if (is_global_var (var))
1740 return 0;
1742 /* Because we don't know if VAR will be in register or on stack,
1743 we conservatively assume it will be on stack even if VAR is
1744 eventually put into register after RA pass. For non-automatic
1745 variables, which won't be on stack, we collect alignment of
1746 type and ignore user specified alignment. Similarly for
1747 SSA_NAMEs for which use_register_for_decl returns true. */
1748 if (TREE_STATIC (var)
1749 || DECL_EXTERNAL (var)
1750 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1751 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1752 TYPE_MODE (TREE_TYPE (var)),
1753 TYPE_ALIGN (TREE_TYPE (var)));
1754 else if (DECL_HAS_VALUE_EXPR_P (var)
1755 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1756 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1757 or variables which were assigned a stack slot already by
1758 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1759 changed from the offset chosen to it. */
1760 align = crtl->stack_alignment_estimated;
1761 else
1762 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1764 /* If the variable alignment is very large we'll dynamicaly allocate
1765 it, which means that in-frame portion is just a pointer. */
1766 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1767 align = GET_MODE_ALIGNMENT (Pmode);
1770 record_alignment_for_reg_var (align);
1772 poly_uint64 size;
1773 if (TREE_CODE (origvar) == SSA_NAME)
1775 gcc_assert (!VAR_P (var)
1776 || (!DECL_EXTERNAL (var)
1777 && !DECL_HAS_VALUE_EXPR_P (var)
1778 && !TREE_STATIC (var)
1779 && TREE_TYPE (var) != error_mark_node
1780 && !DECL_HARD_REGISTER (var)
1781 && really_expand));
1783 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1785 else if (DECL_EXTERNAL (var))
1787 else if (DECL_HAS_VALUE_EXPR_P (var))
1789 else if (TREE_STATIC (var))
1791 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1793 else if (TREE_TYPE (var) == error_mark_node)
1795 if (really_expand)
1796 expand_one_error_var (var);
1798 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1800 if (really_expand)
1802 expand_one_hard_reg_var (var);
1803 if (!DECL_HARD_REGISTER (var))
1804 /* Invalid register specification. */
1805 expand_one_error_var (var);
1808 else if (use_register_for_decl (var)
1809 && (!forced_stack_var
1810 || !bitmap_bit_p (forced_stack_var, DECL_UID (var))))
1812 if (really_expand)
1813 expand_one_register_var (origvar);
1815 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1816 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1818 /* Reject variables which cover more than half of the address-space. */
1819 if (really_expand)
1821 if (DECL_NONLOCAL_FRAME (var))
1822 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1823 "total size of local objects is too large");
1824 else
1825 error_at (DECL_SOURCE_LOCATION (var),
1826 "size of variable %q+D is too large", var);
1827 expand_one_error_var (var);
1830 else if (defer_stack_allocation (var, toplevel))
1831 add_stack_var (origvar, really_expand);
1832 else
1834 if (really_expand)
1836 if (lookup_attribute ("naked",
1837 DECL_ATTRIBUTES (current_function_decl)))
1838 error ("cannot allocate stack for variable %q+D, naked function",
1839 var);
1841 expand_one_stack_var (origvar);
1843 return size;
1845 return 0;
1848 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1849 expanding variables. Those variables that can be put into registers
1850 are allocated pseudos; those that can't are put on the stack.
1852 TOPLEVEL is true if this is the outermost BLOCK. */
1854 static void
1855 expand_used_vars_for_block (tree block, bool toplevel, bitmap forced_stack_vars)
1857 tree t;
1859 /* Expand all variables at this level. */
1860 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1861 if (TREE_USED (t)
1862 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1863 || !DECL_NONSHAREABLE (t)))
1864 expand_one_var (t, toplevel, true, forced_stack_vars);
1866 /* Expand all variables at containing levels. */
1867 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1868 expand_used_vars_for_block (t, false, forced_stack_vars);
1871 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1872 and clear TREE_USED on all local variables. */
1874 static void
1875 clear_tree_used (tree block)
1877 tree t;
1879 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1880 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1881 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1882 || !DECL_NONSHAREABLE (t))
1883 TREE_USED (t) = 0;
1885 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1886 clear_tree_used (t);
1889 /* Examine TYPE and determine a bit mask of the following features. */
1891 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1892 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1893 #define SPCT_HAS_ARRAY 4
1894 #define SPCT_HAS_AGGREGATE 8
1896 static unsigned int
1897 stack_protect_classify_type (tree type)
1899 unsigned int ret = 0;
1900 tree t;
1902 switch (TREE_CODE (type))
1904 case ARRAY_TYPE:
1905 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1906 if (t == char_type_node
1907 || t == signed_char_type_node
1908 || t == unsigned_char_type_node)
1910 unsigned HOST_WIDE_INT max = param_ssp_buffer_size;
1911 unsigned HOST_WIDE_INT len;
1913 if (!TYPE_SIZE_UNIT (type)
1914 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1915 len = max;
1916 else
1917 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1919 if (len < max)
1920 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1921 else
1922 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1924 else
1925 ret = SPCT_HAS_ARRAY;
1926 break;
1928 case UNION_TYPE:
1929 case QUAL_UNION_TYPE:
1930 case RECORD_TYPE:
1931 ret = SPCT_HAS_AGGREGATE;
1932 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1933 if (TREE_CODE (t) == FIELD_DECL)
1934 ret |= stack_protect_classify_type (TREE_TYPE (t));
1935 break;
1937 default:
1938 break;
1941 return ret;
1944 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1945 part of the local stack frame. Remember if we ever return nonzero for
1946 any variable in this function. The return value is the phase number in
1947 which the variable should be allocated. */
1949 static int
1950 stack_protect_decl_phase (tree decl)
1952 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1953 int ret = 0;
1955 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1956 has_short_buffer = true;
1958 tree attribs = DECL_ATTRIBUTES (current_function_decl);
1959 if (!lookup_attribute ("no_stack_protector", attribs)
1960 && (flag_stack_protect == SPCT_FLAG_ALL
1961 || flag_stack_protect == SPCT_FLAG_STRONG
1962 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1963 && lookup_attribute ("stack_protect", attribs))))
1965 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1966 && !(bits & SPCT_HAS_AGGREGATE))
1967 ret = 1;
1968 else if (bits & SPCT_HAS_ARRAY)
1969 ret = 2;
1971 else
1972 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1974 if (ret)
1975 has_protected_decls = true;
1977 return ret;
1980 /* Two helper routines that check for phase 1 and phase 2. These are used
1981 as callbacks for expand_stack_vars. */
1983 static bool
1984 stack_protect_decl_phase_1 (size_t i)
1986 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1989 static bool
1990 stack_protect_decl_phase_2 (size_t i)
1992 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1995 /* And helper function that checks for asan phase (with stack protector
1996 it is phase 3). This is used as callback for expand_stack_vars.
1997 Returns true if any of the vars in the partition need to be protected. */
1999 static bool
2000 asan_decl_phase_3 (size_t i)
2002 while (i != EOC)
2004 if (asan_protect_stack_decl (stack_vars[i].decl))
2005 return true;
2006 i = stack_vars[i].next;
2008 return false;
2011 /* Ensure that variables in different stack protection phases conflict
2012 so that they are not merged and share the same stack slot.
2013 Return true if there are any address taken variables. */
2015 static bool
2016 add_stack_protection_conflicts (void)
2018 size_t i, j, n = stack_vars_num;
2019 unsigned char *phase;
2020 bool ret = false;
2022 phase = XNEWVEC (unsigned char, n);
2023 for (i = 0; i < n; ++i)
2025 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
2026 if (TREE_ADDRESSABLE (stack_vars[i].decl))
2027 ret = true;
2030 for (i = 0; i < n; ++i)
2032 unsigned char ph_i = phase[i];
2033 for (j = i + 1; j < n; ++j)
2034 if (ph_i != phase[j])
2035 add_stack_var_conflict (i, j);
2038 XDELETEVEC (phase);
2039 return ret;
2042 /* Create a decl for the guard at the top of the stack frame. */
2044 static void
2045 create_stack_guard (void)
2047 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
2048 VAR_DECL, NULL, ptr_type_node);
2049 TREE_THIS_VOLATILE (guard) = 1;
2050 TREE_USED (guard) = 1;
2051 expand_one_stack_var (guard);
2052 crtl->stack_protect_guard = guard;
2055 /* Prepare for expanding variables. */
2056 static void
2057 init_vars_expansion (void)
2059 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
2060 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
2062 /* A map from decl to stack partition. */
2063 decl_to_stack_part = new hash_map<tree, size_t>;
2065 /* Initialize local stack smashing state. */
2066 has_protected_decls = false;
2067 has_short_buffer = false;
2068 if (hwasan_sanitize_stack_p ())
2069 hwasan_record_frame_init ();
2072 /* Free up stack variable graph data. */
2073 static void
2074 fini_vars_expansion (void)
2076 bitmap_obstack_release (&stack_var_bitmap_obstack);
2077 if (stack_vars)
2078 XDELETEVEC (stack_vars);
2079 if (stack_vars_sorted)
2080 XDELETEVEC (stack_vars_sorted);
2081 stack_vars = NULL;
2082 stack_vars_sorted = NULL;
2083 stack_vars_alloc = stack_vars_num = 0;
2084 delete decl_to_stack_part;
2085 decl_to_stack_part = NULL;
2088 /* Make a fair guess for the size of the stack frame of the function
2089 in NODE. This doesn't have to be exact, the result is only used in
2090 the inline heuristics. So we don't want to run the full stack var
2091 packing algorithm (which is quadratic in the number of stack vars).
2092 Instead, we calculate the total size of all stack vars. This turns
2093 out to be a pretty fair estimate -- packing of stack vars doesn't
2094 happen very often. */
2096 HOST_WIDE_INT
2097 estimated_stack_frame_size (struct cgraph_node *node)
2099 poly_int64 size = 0;
2100 size_t i;
2101 tree var;
2102 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2104 push_cfun (fn);
2106 init_vars_expansion ();
2108 FOR_EACH_LOCAL_DECL (fn, i, var)
2109 if (auto_var_in_fn_p (var, fn->decl))
2110 size += expand_one_var (var, true, false);
2112 if (stack_vars_num > 0)
2114 /* Fake sorting the stack vars for account_stack_vars (). */
2115 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
2116 for (i = 0; i < stack_vars_num; ++i)
2117 stack_vars_sorted[i] = i;
2118 size += account_stack_vars ();
2121 fini_vars_expansion ();
2122 pop_cfun ();
2123 return estimated_poly_value (size);
2126 /* Check if the current function has calls that use a return slot. */
2128 static bool
2129 stack_protect_return_slot_p ()
2131 basic_block bb;
2133 FOR_ALL_BB_FN (bb, cfun)
2134 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2135 !gsi_end_p (gsi); gsi_next (&gsi))
2137 gimple *stmt = gsi_stmt (gsi);
2138 /* This assumes that calls to internal-only functions never
2139 use a return slot. */
2140 if (is_gimple_call (stmt)
2141 && !gimple_call_internal_p (stmt)
2142 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2143 gimple_call_fndecl (stmt)))
2144 return true;
2146 return false;
2149 /* Expand all variables used in the function. */
2151 static rtx_insn *
2152 expand_used_vars (bitmap forced_stack_vars)
2154 tree var, outer_block = DECL_INITIAL (current_function_decl);
2155 auto_vec<tree> maybe_local_decls;
2156 rtx_insn *var_end_seq = NULL;
2157 unsigned i;
2158 unsigned len;
2159 bool gen_stack_protect_signal = false;
2161 /* Compute the phase of the stack frame for this function. */
2163 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2164 int off = targetm.starting_frame_offset () % align;
2165 frame_phase = off ? align - off : 0;
2168 /* Set TREE_USED on all variables in the local_decls. */
2169 FOR_EACH_LOCAL_DECL (cfun, i, var)
2170 TREE_USED (var) = 1;
2171 /* Clear TREE_USED on all variables associated with a block scope. */
2172 clear_tree_used (DECL_INITIAL (current_function_decl));
2174 init_vars_expansion ();
2176 if (targetm.use_pseudo_pic_reg ())
2177 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2179 for (i = 0; i < SA.map->num_partitions; i++)
2181 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2182 continue;
2184 tree var = partition_to_var (SA.map, i);
2186 gcc_assert (!virtual_operand_p (var));
2188 expand_one_ssa_partition (var);
2191 if (flag_stack_protect == SPCT_FLAG_STRONG)
2192 gen_stack_protect_signal = stack_protect_return_slot_p ();
2194 /* At this point all variables on the local_decls with TREE_USED
2195 set are not associated with any block scope. Lay them out. */
2197 len = vec_safe_length (cfun->local_decls);
2198 FOR_EACH_LOCAL_DECL (cfun, i, var)
2200 bool expand_now = false;
2202 /* Expanded above already. */
2203 if (is_gimple_reg (var))
2205 TREE_USED (var) = 0;
2206 goto next;
2208 /* We didn't set a block for static or extern because it's hard
2209 to tell the difference between a global variable (re)declared
2210 in a local scope, and one that's really declared there to
2211 begin with. And it doesn't really matter much, since we're
2212 not giving them stack space. Expand them now. */
2213 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2214 expand_now = true;
2216 /* Expand variables not associated with any block now. Those created by
2217 the optimizers could be live anywhere in the function. Those that
2218 could possibly have been scoped originally and detached from their
2219 block will have their allocation deferred so we coalesce them with
2220 others when optimization is enabled. */
2221 else if (TREE_USED (var))
2222 expand_now = true;
2224 /* Finally, mark all variables on the list as used. We'll use
2225 this in a moment when we expand those associated with scopes. */
2226 TREE_USED (var) = 1;
2228 if (expand_now)
2229 expand_one_var (var, true, true, forced_stack_vars);
2231 next:
2232 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2234 rtx rtl = DECL_RTL_IF_SET (var);
2236 /* Keep artificial non-ignored vars in cfun->local_decls
2237 chain until instantiate_decls. */
2238 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2239 add_local_decl (cfun, var);
2240 else if (rtl == NULL_RTX)
2241 /* If rtl isn't set yet, which can happen e.g. with
2242 -fstack-protector, retry before returning from this
2243 function. */
2244 maybe_local_decls.safe_push (var);
2248 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2250 +-----------------+-----------------+
2251 | ...processed... | ...duplicates...|
2252 +-----------------+-----------------+
2254 +-- LEN points here.
2256 We just want the duplicates, as those are the artificial
2257 non-ignored vars that we want to keep until instantiate_decls.
2258 Move them down and truncate the array. */
2259 if (!vec_safe_is_empty (cfun->local_decls))
2260 cfun->local_decls->block_remove (0, len);
2262 /* At this point, all variables within the block tree with TREE_USED
2263 set are actually used by the optimized function. Lay them out. */
2264 expand_used_vars_for_block (outer_block, true, forced_stack_vars);
2266 tree attribs = DECL_ATTRIBUTES (current_function_decl);
2267 if (stack_vars_num > 0)
2269 bool has_addressable_vars = false;
2271 add_scope_conflicts ();
2273 /* If stack protection is enabled, we don't share space between
2274 vulnerable data and non-vulnerable data. */
2275 if (flag_stack_protect != 0
2276 && !lookup_attribute ("no_stack_protector", attribs)
2277 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2278 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2279 && lookup_attribute ("stack_protect", attribs))))
2280 has_addressable_vars = add_stack_protection_conflicts ();
2282 if (flag_stack_protect == SPCT_FLAG_STRONG && has_addressable_vars)
2283 gen_stack_protect_signal = true;
2285 /* Now that we have collected all stack variables, and have computed a
2286 minimal interference graph, attempt to save some stack space. */
2287 partition_stack_vars ();
2288 if (dump_file)
2289 dump_stack_var_partition ();
2293 if (!lookup_attribute ("no_stack_protector", attribs))
2294 switch (flag_stack_protect)
2296 case SPCT_FLAG_ALL:
2297 create_stack_guard ();
2298 break;
2300 case SPCT_FLAG_STRONG:
2301 if (gen_stack_protect_signal
2302 || cfun->calls_alloca
2303 || has_protected_decls
2304 || lookup_attribute ("stack_protect", attribs))
2305 create_stack_guard ();
2306 break;
2308 case SPCT_FLAG_DEFAULT:
2309 if (cfun->calls_alloca
2310 || has_protected_decls
2311 || lookup_attribute ("stack_protect", attribs))
2312 create_stack_guard ();
2313 break;
2315 case SPCT_FLAG_EXPLICIT:
2316 if (lookup_attribute ("stack_protect", attribs))
2317 create_stack_guard ();
2318 break;
2320 default:
2321 break;
2324 /* Assign rtl to each variable based on these partitions. */
2325 if (stack_vars_num > 0)
2327 class stack_vars_data data;
2329 data.asan_base = NULL_RTX;
2330 data.asan_alignb = 0;
2332 /* Reorder decls to be protected by iterating over the variables
2333 array multiple times, and allocating out of each phase in turn. */
2334 /* ??? We could probably integrate this into the qsort we did
2335 earlier, such that we naturally see these variables first,
2336 and thus naturally allocate things in the right order. */
2337 if (has_protected_decls)
2339 /* Phase 1 contains only character arrays. */
2340 expand_stack_vars (stack_protect_decl_phase_1, &data);
2342 /* Phase 2 contains other kinds of arrays. */
2343 if (!lookup_attribute ("no_stack_protector", attribs)
2344 && (flag_stack_protect == SPCT_FLAG_ALL
2345 || flag_stack_protect == SPCT_FLAG_STRONG
2346 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2347 && lookup_attribute ("stack_protect", attribs))))
2348 expand_stack_vars (stack_protect_decl_phase_2, &data);
2351 if (asan_sanitize_stack_p ())
2352 /* Phase 3, any partitions that need asan protection
2353 in addition to phase 1 and 2. */
2354 expand_stack_vars (asan_decl_phase_3, &data);
2356 /* ASAN description strings don't yet have a syntax for expressing
2357 polynomial offsets. */
2358 HOST_WIDE_INT prev_offset;
2359 if (!data.asan_vec.is_empty ()
2360 && frame_offset.is_constant (&prev_offset))
2362 HOST_WIDE_INT offset, sz, redzonesz;
2363 redzonesz = ASAN_RED_ZONE_SIZE;
2364 sz = data.asan_vec[0] - prev_offset;
2365 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2366 && data.asan_alignb <= 4096
2367 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2368 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2369 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2370 /* Allocating a constant amount of space from a constant
2371 starting offset must give a constant result. */
2372 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2373 .to_constant ());
2374 data.asan_vec.safe_push (prev_offset);
2375 data.asan_vec.safe_push (offset);
2376 /* Leave space for alignment if STRICT_ALIGNMENT. */
2377 if (STRICT_ALIGNMENT)
2378 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2379 << ASAN_SHADOW_SHIFT)
2380 / BITS_PER_UNIT, 1);
2382 var_end_seq
2383 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2384 data.asan_base,
2385 data.asan_alignb,
2386 data.asan_vec.address (),
2387 data.asan_decl_vec.address (),
2388 data.asan_vec.length ());
2391 expand_stack_vars (NULL, &data);
2394 if (hwasan_sanitize_stack_p ())
2395 hwasan_emit_prologue ();
2396 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2397 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2398 virtual_stack_vars_rtx,
2399 var_end_seq);
2400 else if (hwasan_sanitize_allocas_p () && cfun->calls_alloca)
2401 /* When using out-of-line instrumentation we only want to emit one function
2402 call for clearing the tags in a region of shadow stack. When there are
2403 alloca calls in this frame we want to emit a call using the
2404 virtual_stack_dynamic_rtx, but when not we use the hwasan_frame_extent
2405 rtx we created in expand_stack_vars. */
2406 var_end_seq = hwasan_emit_untag_frame (virtual_stack_dynamic_rtx,
2407 virtual_stack_vars_rtx);
2408 else if (hwasan_sanitize_stack_p ())
2409 /* If no variables were stored on the stack, `hwasan_get_frame_extent`
2410 will return NULL_RTX and hence `hwasan_emit_untag_frame` will return
2411 NULL (i.e. an empty sequence). */
2412 var_end_seq = hwasan_emit_untag_frame (hwasan_get_frame_extent (),
2413 virtual_stack_vars_rtx);
2415 fini_vars_expansion ();
2417 /* If there were any artificial non-ignored vars without rtl
2418 found earlier, see if deferred stack allocation hasn't assigned
2419 rtl to them. */
2420 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2422 rtx rtl = DECL_RTL_IF_SET (var);
2424 /* Keep artificial non-ignored vars in cfun->local_decls
2425 chain until instantiate_decls. */
2426 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2427 add_local_decl (cfun, var);
2430 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2431 if (STACK_ALIGNMENT_NEEDED)
2433 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2434 if (FRAME_GROWS_DOWNWARD)
2435 frame_offset = aligned_lower_bound (frame_offset, align);
2436 else
2437 frame_offset = aligned_upper_bound (frame_offset, align);
2440 return var_end_seq;
2444 /* If we need to produce a detailed dump, print the tree representation
2445 for STMT to the dump file. SINCE is the last RTX after which the RTL
2446 generated for STMT should have been appended. */
2448 static void
2449 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2451 if (dump_file && (dump_flags & TDF_DETAILS))
2453 fprintf (dump_file, "\n;; ");
2454 print_gimple_stmt (dump_file, stmt, 0,
2455 TDF_SLIM | (dump_flags & TDF_LINENO));
2456 fprintf (dump_file, "\n");
2458 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2462 /* Maps the blocks that do not contain tree labels to rtx labels. */
2464 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2466 /* Returns the label_rtx expression for a label starting basic block BB. */
2468 static rtx_code_label *
2469 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2471 if (bb->flags & BB_RTL)
2472 return block_label (bb);
2474 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2475 if (elt)
2476 return *elt;
2478 /* Find the tree label if it is present. */
2479 gimple_stmt_iterator gsi = gsi_start_bb (bb);
2480 glabel *lab_stmt;
2481 if (!gsi_end_p (gsi)
2482 && (lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi)))
2483 && !DECL_NONLOCAL (gimple_label_label (lab_stmt)))
2484 return jump_target_rtx (gimple_label_label (lab_stmt));
2486 rtx_code_label *l = gen_label_rtx ();
2487 lab_rtx_for_bb->put (bb, l);
2488 return l;
2492 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2493 of a basic block where we just expanded the conditional at the end,
2494 possibly clean up the CFG and instruction sequence. LAST is the
2495 last instruction before the just emitted jump sequence. */
2497 static void
2498 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2500 /* Special case: when jumpif decides that the condition is
2501 trivial it emits an unconditional jump (and the necessary
2502 barrier). But we still have two edges, the fallthru one is
2503 wrong. purge_dead_edges would clean this up later. Unfortunately
2504 we have to insert insns (and split edges) before
2505 find_many_sub_basic_blocks and hence before purge_dead_edges.
2506 But splitting edges might create new blocks which depend on the
2507 fact that if there are two edges there's no barrier. So the
2508 barrier would get lost and verify_flow_info would ICE. Instead
2509 of auditing all edge splitters to care for the barrier (which
2510 normally isn't there in a cleaned CFG), fix it here. */
2511 if (BARRIER_P (get_last_insn ()))
2513 rtx_insn *insn;
2514 remove_edge (e);
2515 /* Now, we have a single successor block, if we have insns to
2516 insert on the remaining edge we potentially will insert
2517 it at the end of this block (if the dest block isn't feasible)
2518 in order to avoid splitting the edge. This insertion will take
2519 place in front of the last jump. But we might have emitted
2520 multiple jumps (conditional and one unconditional) to the
2521 same destination. Inserting in front of the last one then
2522 is a problem. See PR 40021. We fix this by deleting all
2523 jumps except the last unconditional one. */
2524 insn = PREV_INSN (get_last_insn ());
2525 /* Make sure we have an unconditional jump. Otherwise we're
2526 confused. */
2527 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2528 for (insn = PREV_INSN (insn); insn != last;)
2530 insn = PREV_INSN (insn);
2531 if (JUMP_P (NEXT_INSN (insn)))
2533 if (!any_condjump_p (NEXT_INSN (insn)))
2535 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2536 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2538 delete_insn (NEXT_INSN (insn));
2544 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2545 Returns a new basic block if we've terminated the current basic
2546 block and created a new one. */
2548 static basic_block
2549 expand_gimple_cond (basic_block bb, gcond *stmt)
2551 basic_block new_bb, dest;
2552 edge true_edge;
2553 edge false_edge;
2554 rtx_insn *last2, *last;
2555 enum tree_code code;
2556 tree op0, op1;
2558 code = gimple_cond_code (stmt);
2559 op0 = gimple_cond_lhs (stmt);
2560 op1 = gimple_cond_rhs (stmt);
2561 /* We're sometimes presented with such code:
2562 D.123_1 = x < y;
2563 if (D.123_1 != 0)
2565 This would expand to two comparisons which then later might
2566 be cleaned up by combine. But some pattern matchers like if-conversion
2567 work better when there's only one compare, so make up for this
2568 here as special exception if TER would have made the same change. */
2569 if (SA.values
2570 && TREE_CODE (op0) == SSA_NAME
2571 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2572 && TREE_CODE (op1) == INTEGER_CST
2573 && ((gimple_cond_code (stmt) == NE_EXPR
2574 && integer_zerop (op1))
2575 || (gimple_cond_code (stmt) == EQ_EXPR
2576 && integer_onep (op1)))
2577 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2579 gimple *second = SSA_NAME_DEF_STMT (op0);
2580 if (gimple_code (second) == GIMPLE_ASSIGN)
2582 enum tree_code code2 = gimple_assign_rhs_code (second);
2583 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2585 code = code2;
2586 op0 = gimple_assign_rhs1 (second);
2587 op1 = gimple_assign_rhs2 (second);
2589 /* If jumps are cheap and the target does not support conditional
2590 compare, turn some more codes into jumpy sequences. */
2591 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2592 && targetm.gen_ccmp_first == NULL)
2594 if ((code2 == BIT_AND_EXPR
2595 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2596 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2597 || code2 == TRUTH_AND_EXPR)
2599 code = TRUTH_ANDIF_EXPR;
2600 op0 = gimple_assign_rhs1 (second);
2601 op1 = gimple_assign_rhs2 (second);
2603 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2605 code = TRUTH_ORIF_EXPR;
2606 op0 = gimple_assign_rhs1 (second);
2607 op1 = gimple_assign_rhs2 (second);
2613 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2614 into (x - C2) * C3 < C4. */
2615 if ((code == EQ_EXPR || code == NE_EXPR)
2616 && TREE_CODE (op0) == SSA_NAME
2617 && TREE_CODE (op1) == INTEGER_CST)
2618 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2620 /* Optimize (x - y) < 0 into x < y if x - y has undefined overflow. */
2621 if (!TYPE_UNSIGNED (TREE_TYPE (op0))
2622 && (code == LT_EXPR || code == LE_EXPR
2623 || code == GT_EXPR || code == GE_EXPR)
2624 && integer_zerop (op1)
2625 && TREE_CODE (op0) == SSA_NAME)
2626 maybe_optimize_sub_cmp_0 (code, &op0, &op1);
2628 last2 = last = get_last_insn ();
2630 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2631 set_curr_insn_location (gimple_location (stmt));
2633 /* These flags have no purpose in RTL land. */
2634 true_edge->flags &= ~EDGE_TRUE_VALUE;
2635 false_edge->flags &= ~EDGE_FALSE_VALUE;
2637 /* We can either have a pure conditional jump with one fallthru edge or
2638 two-way jump that needs to be decomposed into two basic blocks. */
2639 if (false_edge->dest == bb->next_bb)
2641 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2642 true_edge->probability);
2643 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2644 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2645 set_curr_insn_location (true_edge->goto_locus);
2646 false_edge->flags |= EDGE_FALLTHRU;
2647 maybe_cleanup_end_of_block (false_edge, last);
2648 return NULL;
2650 if (true_edge->dest == bb->next_bb)
2652 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2653 false_edge->probability);
2654 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2655 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2656 set_curr_insn_location (false_edge->goto_locus);
2657 true_edge->flags |= EDGE_FALLTHRU;
2658 maybe_cleanup_end_of_block (true_edge, last);
2659 return NULL;
2662 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2663 true_edge->probability);
2664 last = get_last_insn ();
2665 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2666 set_curr_insn_location (false_edge->goto_locus);
2667 emit_jump (label_rtx_for_bb (false_edge->dest));
2669 BB_END (bb) = last;
2670 if (BARRIER_P (BB_END (bb)))
2671 BB_END (bb) = PREV_INSN (BB_END (bb));
2672 update_bb_for_insn (bb);
2674 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2675 dest = false_edge->dest;
2676 redirect_edge_succ (false_edge, new_bb);
2677 false_edge->flags |= EDGE_FALLTHRU;
2678 new_bb->count = false_edge->count ();
2679 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2680 add_bb_to_loop (new_bb, loop);
2681 if (loop->latch == bb
2682 && loop->header == dest)
2683 loop->latch = new_bb;
2684 make_single_succ_edge (new_bb, dest, 0);
2685 if (BARRIER_P (BB_END (new_bb)))
2686 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2687 update_bb_for_insn (new_bb);
2689 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2691 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2693 set_curr_insn_location (true_edge->goto_locus);
2694 true_edge->goto_locus = curr_insn_location ();
2697 return new_bb;
2700 /* Mark all calls that can have a transaction restart. */
2702 static void
2703 mark_transaction_restart_calls (gimple *stmt)
2705 struct tm_restart_node dummy;
2706 tm_restart_node **slot;
2708 if (!cfun->gimple_df->tm_restart)
2709 return;
2711 dummy.stmt = stmt;
2712 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2713 if (slot)
2715 struct tm_restart_node *n = *slot;
2716 tree list = n->label_or_list;
2717 rtx_insn *insn;
2719 for (insn = next_real_insn (get_last_insn ());
2720 !CALL_P (insn);
2721 insn = next_real_insn (insn))
2722 continue;
2724 if (TREE_CODE (list) == LABEL_DECL)
2725 add_reg_note (insn, REG_TM, label_rtx (list));
2726 else
2727 for (; list ; list = TREE_CHAIN (list))
2728 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2732 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2733 statement STMT. */
2735 static void
2736 expand_call_stmt (gcall *stmt)
2738 tree exp, decl, lhs;
2739 bool builtin_p;
2740 size_t i;
2742 if (gimple_call_internal_p (stmt))
2744 expand_internal_call (stmt);
2745 return;
2748 /* If this is a call to a built-in function and it has no effect other
2749 than setting the lhs, try to implement it using an internal function
2750 instead. */
2751 decl = gimple_call_fndecl (stmt);
2752 if (gimple_call_lhs (stmt)
2753 && !gimple_has_side_effects (stmt)
2754 && (optimize || (decl && called_as_built_in (decl))))
2756 internal_fn ifn = replacement_internal_fn (stmt);
2757 if (ifn != IFN_LAST)
2759 expand_internal_call (ifn, stmt);
2760 return;
2764 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2766 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2767 builtin_p = decl && fndecl_built_in_p (decl);
2769 /* If this is not a builtin function, the function type through which the
2770 call is made may be different from the type of the function. */
2771 if (!builtin_p)
2772 CALL_EXPR_FN (exp)
2773 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2774 CALL_EXPR_FN (exp));
2776 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2777 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2779 for (i = 0; i < gimple_call_num_args (stmt); i++)
2781 tree arg = gimple_call_arg (stmt, i);
2782 gimple *def;
2783 /* TER addresses into arguments of builtin functions so we have a
2784 chance to infer more correct alignment information. See PR39954. */
2785 if (builtin_p
2786 && TREE_CODE (arg) == SSA_NAME
2787 && (def = get_gimple_for_ssa_name (arg))
2788 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2789 arg = gimple_assign_rhs1 (def);
2790 CALL_EXPR_ARG (exp, i) = arg;
2793 if (gimple_has_side_effects (stmt)
2794 /* ??? Downstream in expand_expr_real_1 we assume that expressions
2795 w/o side-effects do not throw so work around this here. */
2796 || stmt_could_throw_p (cfun, stmt))
2797 TREE_SIDE_EFFECTS (exp) = 1;
2799 if (gimple_call_nothrow_p (stmt))
2800 TREE_NOTHROW (exp) = 1;
2802 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2803 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2804 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2805 if (decl
2806 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2807 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2808 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2809 else
2810 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2811 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2812 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2813 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2815 /* Must come after copying location. */
2816 copy_warning (exp, stmt);
2818 /* Ensure RTL is created for debug args. */
2819 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2821 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2822 unsigned int ix;
2823 tree dtemp;
2825 if (debug_args)
2826 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2828 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2829 expand_debug_expr (dtemp);
2833 rtx_insn *before_call = get_last_insn ();
2834 lhs = gimple_call_lhs (stmt);
2835 if (lhs)
2836 expand_assignment (lhs, exp, false);
2837 else
2838 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2840 /* If the gimple call is an indirect call and has 'nocf_check'
2841 attribute find a generated CALL insn to mark it as no
2842 control-flow verification is needed. */
2843 if (gimple_call_nocf_check_p (stmt)
2844 && !gimple_call_fndecl (stmt))
2846 rtx_insn *last = get_last_insn ();
2847 while (!CALL_P (last)
2848 && last != before_call)
2849 last = PREV_INSN (last);
2851 if (last != before_call)
2852 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2855 mark_transaction_restart_calls (stmt);
2859 /* Generate RTL for an asm statement (explicit assembler code).
2860 STRING is a STRING_CST node containing the assembler code text,
2861 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2862 insn is volatile; don't optimize it. */
2864 static void
2865 expand_asm_loc (tree string, int vol, location_t locus)
2867 rtx body;
2869 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2870 ggc_strdup (TREE_STRING_POINTER (string)),
2871 locus);
2873 MEM_VOLATILE_P (body) = vol;
2875 /* Non-empty basic ASM implicitly clobbers memory. */
2876 if (TREE_STRING_LENGTH (string) != 0)
2878 rtx asm_op, clob;
2879 unsigned i, nclobbers;
2880 auto_vec<rtx> input_rvec, output_rvec;
2881 auto_vec<machine_mode> input_mode;
2882 auto_vec<const char *> constraints;
2883 auto_vec<rtx> use_rvec;
2884 auto_vec<rtx> clobber_rvec;
2885 HARD_REG_SET clobbered_regs;
2886 CLEAR_HARD_REG_SET (clobbered_regs);
2888 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2889 clobber_rvec.safe_push (clob);
2891 if (targetm.md_asm_adjust)
2892 targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
2893 constraints, use_rvec, clobber_rvec,
2894 clobbered_regs, locus);
2896 asm_op = body;
2897 nclobbers = clobber_rvec.length ();
2898 auto nuses = use_rvec.length ();
2899 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nuses + nclobbers));
2901 i = 0;
2902 XVECEXP (body, 0, i++) = asm_op;
2903 for (rtx use : use_rvec)
2904 XVECEXP (body, 0, i++) = gen_rtx_USE (VOIDmode, use);
2905 for (rtx clobber : clobber_rvec)
2906 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobber);
2909 emit_insn (body);
/* Return the number of times character C occurs in the NUL-terminated
   string S.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;

  for (; *s != '\0'; ++s)
    if (*s == c)
      ++count;

  return count;
}

2922 /* A subroutine of expand_asm_operands. Check that all operands have
2923 the same number of alternatives. Return true if so. */
2925 static bool
2926 check_operand_nalternatives (const vec<const char *> &constraints)
2928 unsigned len = constraints.length();
2929 if (len > 0)
2931 int nalternatives = n_occurrences (',', constraints[0]);
2933 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2935 error ("too many alternatives in %<asm%>");
2936 return false;
2939 for (unsigned i = 1; i < len; ++i)
2940 if (n_occurrences (',', constraints[i]) != nalternatives)
2942 error ("operand constraints for %<asm%> differ "
2943 "in number of alternatives");
2944 return false;
2947 return true;
2950 /* Check for overlap between registers marked in CLOBBERED_REGS and
2951 anything inappropriate in T. Emit error and return the register
2952 variable definition for error, NULL_TREE for ok. */
2954 static bool
2955 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs,
2956 location_t loc)
2958 /* Conflicts between asm-declared register variables and the clobber
2959 list are not allowed. */
2960 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2962 if (overlap)
2964 error_at (loc, "%<asm%> specifier for variable %qE conflicts with "
2965 "%<asm%> clobber list", DECL_NAME (overlap));
2967 /* Reset registerness to stop multiple errors emitted for a single
2968 variable. */
2969 DECL_REGISTER (overlap) = 0;
2970 return true;
2973 return false;
2976 /* Check that the given REGNO spanning NREGS is a valid
2977 asm clobber operand. Some HW registers cannot be
2978 saved/restored, hence they should not be clobbered by
2979 asm statements. */
2980 static bool
2981 asm_clobber_reg_is_valid (int regno, int nregs, const char *regname)
2983 bool is_valid = true;
2984 HARD_REG_SET regset;
2986 CLEAR_HARD_REG_SET (regset);
2988 add_range_to_hard_reg_set (&regset, regno, nregs);
2990 /* Clobbering the PIC register is an error. */
2991 if (PIC_OFFSET_TABLE_REGNUM != INVALID_REGNUM
2992 && overlaps_hard_reg_set_p (regset, Pmode, PIC_OFFSET_TABLE_REGNUM))
2994 /* ??? Diagnose during gimplification? */
2995 error ("PIC register clobbered by %qs in %<asm%>", regname);
2996 is_valid = false;
2998 else if (!in_hard_reg_set_p
2999 (accessible_reg_set, reg_raw_mode[regno], regno))
3001 /* ??? Diagnose during gimplification? */
3002 error ("the register %qs cannot be clobbered in %<asm%>"
3003 " for the current target", regname);
3004 is_valid = false;
3007 /* Clobbering the stack pointer register is deprecated. GCC expects
3008 the value of the stack pointer after an asm statement to be the same
3009 as it was before, so no asm can validly clobber the stack pointer in
3010 the usual sense. Adding the stack pointer to the clobber list has
3011 traditionally had some undocumented and somewhat obscure side-effects. */
3012 if (overlaps_hard_reg_set_p (regset, Pmode, STACK_POINTER_REGNUM))
3014 crtl->sp_is_clobbered_by_asm = true;
3015 if (warning (OPT_Wdeprecated, "listing the stack pointer register"
3016 " %qs in a clobber list is deprecated", regname))
3017 inform (input_location, "the value of the stack pointer after"
3018 " an %<asm%> statement must be the same as it was before"
3019 " the statement");
3022 return is_valid;
3025 /* Generate RTL for an asm statement with arguments.
3026 STRING is the instruction template.
3027 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
3028 Each output or input has an expression in the TREE_VALUE and
3029 a tree list in TREE_PURPOSE which in turn contains a constraint
3030 name in TREE_VALUE (or NULL_TREE) and a constraint string
3031 in TREE_PURPOSE.
3032 CLOBBERS is a list of STRING_CST nodes each naming a hard register
3033 that is clobbered by this insn.
3035 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
3036 should be the fallthru basic block of the asm goto.
3038 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
3039 Some elements of OUTPUTS may be replaced with trees representing temporary
3040 values. The caller should copy those temporary values to the originally
3041 specified lvalues.
3043 VOL nonzero means the insn is volatile; don't optimize it. */
3045 static void
3046 expand_asm_stmt (gasm *stmt)
3048 class save_input_location
3050 location_t old;
3052 public:
3053 explicit save_input_location(location_t where)
3055 old = input_location;
3056 input_location = where;
3059 ~save_input_location()
3061 input_location = old;
3065 location_t locus = gimple_location (stmt);
3067 if (gimple_asm_input_p (stmt))
3069 const char *s = gimple_asm_string (stmt);
3070 tree string = build_string (strlen (s), s);
3071 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
3072 return;
3075 /* There are some legacy diagnostics in here. */
3076 save_input_location s_i_l(locus);
3078 unsigned noutputs = gimple_asm_noutputs (stmt);
3079 unsigned ninputs = gimple_asm_ninputs (stmt);
3080 unsigned nlabels = gimple_asm_nlabels (stmt);
3081 unsigned i;
3082 bool error_seen = false;
3084 /* ??? Diagnose during gimplification? */
3085 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
3087 error_at (locus, "more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
3088 return;
3091 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
3092 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
3093 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
3095 /* Copy the gimple vectors into new vectors that we can manipulate. */
3097 output_tvec.safe_grow (noutputs, true);
3098 input_tvec.safe_grow (ninputs, true);
3099 constraints.safe_grow (noutputs + ninputs, true);
3101 for (i = 0; i < noutputs; ++i)
3103 tree t = gimple_asm_output_op (stmt, i);
3104 output_tvec[i] = TREE_VALUE (t);
3105 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3107 for (i = 0; i < ninputs; i++)
3109 tree t = gimple_asm_input_op (stmt, i);
3110 input_tvec[i] = TREE_VALUE (t);
3111 constraints[i + noutputs]
3112 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3115 /* ??? Diagnose during gimplification? */
3116 if (! check_operand_nalternatives (constraints))
3117 return;
3119 /* Count the number of meaningful clobbered registers, ignoring what
3120 we would ignore later. */
3121 auto_vec<rtx> clobber_rvec;
3122 HARD_REG_SET clobbered_regs;
3123 CLEAR_HARD_REG_SET (clobbered_regs);
3125 if (unsigned n = gimple_asm_nclobbers (stmt))
3127 clobber_rvec.reserve (n);
3128 for (i = 0; i < n; i++)
3130 tree t = gimple_asm_clobber_op (stmt, i);
3131 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
3132 int nregs, j;
3134 j = decode_reg_name_and_count (regname, &nregs);
3135 if (j < 0)
3137 if (j == -2)
3139 /* ??? Diagnose during gimplification? */
3140 error_at (locus, "unknown register name %qs in %<asm%>",
3141 regname);
3142 error_seen = true;
3144 else if (j == -4)
3146 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
3147 clobber_rvec.safe_push (x);
3149 else
3151 /* Otherwise we should have -1 == empty string
3152 or -3 == cc, which is not a register. */
3153 gcc_assert (j == -1 || j == -3);
3156 else
3157 for (int reg = j; reg < j + nregs; reg++)
3159 if (!asm_clobber_reg_is_valid (reg, nregs, regname))
3160 return;
3162 SET_HARD_REG_BIT (clobbered_regs, reg);
3163 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
3164 clobber_rvec.safe_push (x);
3169 /* First pass over inputs and outputs checks validity and sets
3170 mark_addressable if needed. */
3171 /* ??? Diagnose during gimplification? */
3173 for (i = 0; i < noutputs; ++i)
3175 tree val = output_tvec[i];
3176 tree type = TREE_TYPE (val);
3177 const char *constraint;
3178 bool is_inout;
3179 bool allows_reg;
3180 bool allows_mem;
3182 /* Try to parse the output constraint. If that fails, there's
3183 no point in going further. */
3184 constraint = constraints[i];
3185 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3186 &allows_mem, &allows_reg, &is_inout))
3187 return;
3189 /* If the output is a hard register, verify it doesn't conflict with
3190 any other operand's possible hard register use. */
3191 if (DECL_P (val)
3192 && REG_P (DECL_RTL (val))
3193 && HARD_REGISTER_P (DECL_RTL (val)))
3195 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3196 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3197 unsigned long match;
3199 /* Verify the other outputs do not use the same hard register. */
3200 for (j = i + 1; j < noutputs; ++j)
3201 if (DECL_P (output_tvec[j])
3202 && REG_P (DECL_RTL (output_tvec[j]))
3203 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3204 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3206 error_at (locus, "invalid hard register usage between output "
3207 "operands");
3208 error_seen = true;
3211 /* Verify matching constraint operands use the same hard register
3212 and that the non-matching constraint operands do not use the same
3213 hard register if the output is an early clobber operand. */
3214 for (j = 0; j < ninputs; ++j)
3215 if (DECL_P (input_tvec[j])
3216 && REG_P (DECL_RTL (input_tvec[j]))
3217 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3219 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
3220 switch (*constraints[j + noutputs])
3222 case '0': case '1': case '2': case '3': case '4':
3223 case '5': case '6': case '7': case '8': case '9':
3224 match = strtoul (constraints[j + noutputs], NULL, 10);
3225 break;
3226 default:
3227 match = ULONG_MAX;
3228 break;
3230 if (i == match
3231 && output_hregno != input_hregno)
3233 error_at (locus, "invalid hard register usage between "
3234 "output operand and matching constraint operand");
3235 error_seen = true;
3237 else if (early_clobber_p
3238 && i != match
3239 && output_hregno == input_hregno)
3241 error_at (locus, "invalid hard register usage between "
3242 "earlyclobber operand and input operand");
3243 error_seen = true;
3248 if (! allows_reg
3249 && (allows_mem
3250 || is_inout
3251 || (DECL_P (val)
3252 && REG_P (DECL_RTL (val))
3253 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3254 mark_addressable (val);
3257 for (i = 0; i < ninputs; ++i)
3259 bool allows_reg, allows_mem;
3260 const char *constraint;
3262 constraint = constraints[i + noutputs];
3263 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3264 constraints.address (),
3265 &allows_mem, &allows_reg))
3266 return;
3268 if (! allows_reg && allows_mem)
3269 mark_addressable (input_tvec[i]);
3272 /* Second pass evaluates arguments. */
3274 /* Make sure stack is consistent for asm goto. */
3275 if (nlabels > 0)
3276 do_pending_stack_adjust ();
3277 int old_generating_concat_p = generating_concat_p;
3279 /* Vector of RTX's of evaluated output operands. */
3280 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3281 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3282 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3284 output_rvec.safe_grow (noutputs, true);
3286 for (i = 0; i < noutputs; ++i)
3288 tree val = output_tvec[i];
3289 tree type = TREE_TYPE (val);
3290 bool is_inout, allows_reg, allows_mem, ok;
3291 rtx op;
3293 ok = parse_output_constraint (&constraints[i], i, ninputs,
3294 noutputs, &allows_mem, &allows_reg,
3295 &is_inout);
3296 gcc_assert (ok);
3298 /* If an output operand is not a decl or indirect ref and our constraint
3299 allows a register, make a temporary to act as an intermediate.
3300 Make the asm insn write into that, then we will copy it to
3301 the real output operand. Likewise for promoted variables. */
3303 generating_concat_p = 0;
3305 gcc_assert (TREE_CODE (val) != INDIRECT_REF);
3306 if (((TREE_CODE (val) == MEM_REF
3307 && TREE_CODE (TREE_OPERAND (val, 0)) != ADDR_EXPR)
3308 && allows_mem)
3309 || (DECL_P (val)
3310 && (allows_mem || REG_P (DECL_RTL (val)))
3311 && ! (REG_P (DECL_RTL (val))
3312 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3313 || ! allows_reg
3314 || is_inout
3315 || TREE_ADDRESSABLE (type)
3316 || (!tree_fits_poly_int64_p (TYPE_SIZE (type))
3317 && !known_size_p (max_int_size_in_bytes (type))))
3319 op = expand_expr (val, NULL_RTX, VOIDmode,
3320 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3321 if (MEM_P (op))
3322 op = validize_mem (op);
3324 if (! allows_reg && !MEM_P (op))
3326 error_at (locus, "output number %d not directly addressable", i);
3327 error_seen = true;
3329 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3330 || GET_CODE (op) == CONCAT)
3332 rtx old_op = op;
3333 op = gen_reg_rtx (GET_MODE (op));
3335 generating_concat_p = old_generating_concat_p;
3337 if (is_inout)
3338 emit_move_insn (op, old_op);
3340 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3341 emit_move_insn (old_op, op);
3342 after_rtl_seq = get_insns ();
3343 after_rtl_end = get_last_insn ();
3344 end_sequence ();
3347 else
3349 op = assign_temp (type, 0, 1);
3350 op = validize_mem (op);
3351 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3352 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3354 generating_concat_p = old_generating_concat_p;
3356 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3357 expand_assignment (val, make_tree (type, op), false);
3358 after_rtl_seq = get_insns ();
3359 after_rtl_end = get_last_insn ();
3360 end_sequence ();
3362 output_rvec[i] = op;
3364 if (is_inout)
3365 inout_opnum.safe_push (i);
3368 const char *str = gimple_asm_string (stmt);
3369 if (error_seen)
3371 ninputs = 0;
3372 noutputs = 0;
3373 inout_opnum.truncate (0);
3374 output_rvec.truncate (0);
3375 clobber_rvec.truncate (0);
3376 constraints.truncate (0);
3377 CLEAR_HARD_REG_SET (clobbered_regs);
3378 str = "";
3381 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3382 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3384 input_rvec.safe_grow (ninputs, true);
3385 input_mode.safe_grow (ninputs, true);
3387 generating_concat_p = 0;
3389 for (i = 0; i < ninputs; ++i)
3391 tree val = input_tvec[i];
3392 tree type = TREE_TYPE (val);
3393 bool allows_reg, allows_mem, ok;
3394 const char *constraint;
3395 rtx op;
3397 constraint = constraints[i + noutputs];
3398 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3399 constraints.address (),
3400 &allows_mem, &allows_reg);
3401 gcc_assert (ok);
3403 /* EXPAND_INITIALIZER will not generate code for valid initializer
3404 constants, but will still generate code for other types of operand.
3405 This is the behavior we want for constant constraints. */
3406 op = expand_expr (val, NULL_RTX, VOIDmode,
3407 allows_reg ? EXPAND_NORMAL
3408 : allows_mem ? EXPAND_MEMORY
3409 : EXPAND_INITIALIZER);
3411 /* Never pass a CONCAT to an ASM. */
3412 if (GET_CODE (op) == CONCAT)
3413 op = force_reg (GET_MODE (op), op);
3414 else if (MEM_P (op))
3415 op = validize_mem (op);
3417 if (asm_operand_ok (op, constraint, NULL) <= 0)
3419 if (allows_reg && TYPE_MODE (type) != BLKmode)
3420 op = force_reg (TYPE_MODE (type), op);
3421 else if (!allows_mem)
3422 warning_at (locus, 0, "%<asm%> operand %d probably does not match "
3423 "constraints", i + noutputs);
3424 else if (MEM_P (op))
3426 /* We won't recognize either volatile memory or memory
3427 with a queued address as available a memory_operand
3428 at this point. Ignore it: clearly this *is* a memory. */
3430 else
3431 gcc_unreachable ();
3433 input_rvec[i] = op;
3434 input_mode[i] = TYPE_MODE (type);
3437 /* For in-out operands, copy output rtx to input rtx. */
3438 unsigned ninout = inout_opnum.length ();
3439 for (i = 0; i < ninout; i++)
3441 int j = inout_opnum[i];
3442 rtx o = output_rvec[j];
3444 input_rvec.safe_push (o);
3445 input_mode.safe_push (GET_MODE (o));
3447 char buffer[16];
3448 sprintf (buffer, "%d", j);
3449 constraints.safe_push (ggc_strdup (buffer));
3451 ninputs += ninout;
3453 /* Sometimes we wish to automatically clobber registers across an asm.
3454 Case in point is when the i386 backend moved from cc0 to a hard reg --
3455 maintaining source-level compatibility means automatically clobbering
3456 the flags register. */
3457 rtx_insn *after_md_seq = NULL;
3458 auto_vec<rtx> use_rvec;
3459 if (targetm.md_asm_adjust)
3460 after_md_seq
3461 = targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
3462 constraints, use_rvec, clobber_rvec,
3463 clobbered_regs, locus);
3465 /* Do not allow the hook to change the output and input count,
3466 lest it mess up the operand numbering. */
3467 gcc_assert (output_rvec.length() == noutputs);
3468 gcc_assert (input_rvec.length() == ninputs);
3469 gcc_assert (constraints.length() == noutputs + ninputs);
3471 /* But it certainly can adjust the uses and clobbers. */
3472 unsigned nuses = use_rvec.length ();
3473 unsigned nclobbers = clobber_rvec.length ();
3475 /* Third pass checks for easy conflicts. */
3476 /* ??? Why are we doing this on trees instead of rtx. */
3478 bool clobber_conflict_found = 0;
3479 for (i = 0; i < noutputs; ++i)
3480 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs, locus))
3481 clobber_conflict_found = 1;
3482 for (i = 0; i < ninputs - ninout; ++i)
3483 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs, locus))
3484 clobber_conflict_found = 1;
3486 /* Make vectors for the expression-rtx, constraint strings,
3487 and named operands. */
3489 rtvec argvec = rtvec_alloc (ninputs);
3490 rtvec constraintvec = rtvec_alloc (ninputs);
3491 rtvec labelvec = rtvec_alloc (nlabels);
3493 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3494 : GET_MODE (output_rvec[0])),
3495 ggc_strdup (str),
3496 "", 0, argvec, constraintvec,
3497 labelvec, locus);
3498 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3500 for (i = 0; i < ninputs; ++i)
3502 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3503 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3504 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3505 constraints[i + noutputs],
3506 locus);
3509 /* Copy labels to the vector. */
3510 rtx_code_label *fallthru_label = NULL;
3511 if (nlabels > 0)
3513 basic_block fallthru_bb = NULL;
3514 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3515 if (fallthru)
3516 fallthru_bb = fallthru->dest;
3518 for (i = 0; i < nlabels; ++i)
3520 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3521 rtx_insn *r;
3522 /* If asm goto has any labels in the fallthru basic block, use
3523 a label that we emit immediately after the asm goto. Expansion
3524 may insert further instructions into the same basic block after
3525 asm goto and if we don't do this, insertion of instructions on
3526 the fallthru edge might misbehave. See PR58670. */
3527 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3529 if (fallthru_label == NULL_RTX)
3530 fallthru_label = gen_label_rtx ();
3531 r = fallthru_label;
3533 else
3534 r = label_rtx (label);
3535 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3539 /* Now, for each output, construct an rtx
3540 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3541 ARGVEC CONSTRAINTS OPNAMES))
3542 If there is more than one, put them inside a PARALLEL. */
3544 if (noutputs == 0 && nuses == 0 && nclobbers == 0)
3546 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3547 if (nlabels > 0)
3548 emit_jump_insn (body);
3549 else
3550 emit_insn (body);
3552 else if (noutputs == 1 && nuses == 0 && nclobbers == 0)
3554 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3555 if (nlabels > 0)
3556 emit_jump_insn (gen_rtx_SET (output_rvec[0], body));
3557 else
3558 emit_insn (gen_rtx_SET (output_rvec[0], body));
3560 else
3562 rtx obody = body;
3563 int num = noutputs;
3565 if (num == 0)
3566 num = 1;
3568 body = gen_rtx_PARALLEL (VOIDmode,
3569 rtvec_alloc (num + nuses + nclobbers));
3571 /* For each output operand, store a SET. */
3572 for (i = 0; i < noutputs; ++i)
3574 rtx src, o = output_rvec[i];
3575 if (i == 0)
3577 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3578 src = obody;
3580 else
3582 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3583 ASM_OPERANDS_TEMPLATE (obody),
3584 constraints[i], i, argvec,
3585 constraintvec, labelvec, locus);
3586 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3588 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3591 /* If there are no outputs (but there are some clobbers)
3592 store the bare ASM_OPERANDS into the PARALLEL. */
3593 if (i == 0)
3594 XVECEXP (body, 0, i++) = obody;
3596 /* Add the uses specified by the target hook. No checking should
3597 be needed since this doesn't come directly from user code. */
3598 for (rtx use : use_rvec)
3599 XVECEXP (body, 0, i++) = gen_rtx_USE (VOIDmode, use);
3601 /* Store (clobber REG) for each clobbered register specified. */
3602 for (unsigned j = 0; j < nclobbers; ++j)
3604 rtx clobbered_reg = clobber_rvec[j];
3606 /* Do sanity check for overlap between clobbers and respectively
3607 input and outputs that hasn't been handled. Such overlap
3608 should have been detected and reported above. */
3609 if (!clobber_conflict_found && REG_P (clobbered_reg))
3611 /* We test the old body (obody) contents to avoid
3612 tripping over the under-construction body. */
3613 for (unsigned k = 0; k < noutputs; ++k)
3614 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3615 internal_error ("%<asm%> clobber conflict with "
3616 "output operand");
3618 for (unsigned k = 0; k < ninputs - ninout; ++k)
3619 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3620 internal_error ("%<asm%> clobber conflict with "
3621 "input operand");
3624 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3627 if (nlabels > 0)
3628 emit_jump_insn (body);
3629 else
3630 emit_insn (body);
3633 generating_concat_p = old_generating_concat_p;
3635 if (fallthru_label)
3636 emit_label (fallthru_label);
3638 if (after_md_seq)
3639 emit_insn (after_md_seq);
3640 if (after_rtl_seq)
3642 if (nlabels == 0)
3643 emit_insn (after_rtl_seq);
3644 else
3646 edge e;
3647 edge_iterator ei;
3649 FOR_EACH_EDGE (e, ei, gimple_bb (stmt)->succs)
3651 start_sequence ();
3652 for (rtx_insn *curr = after_rtl_seq;
3653 curr != NULL_RTX;
3654 curr = NEXT_INSN (curr))
3655 emit_insn (copy_insn (PATTERN (curr)));
3656 rtx_insn *copy = get_insns ();
3657 end_sequence ();
3658 insert_insn_on_edge (copy, e);
3663 free_temp_slots ();
3664 crtl->has_asm_statement = 1;
3667 /* Emit code to jump to the address
3668 specified by the pointer expression EXP. */
3670 static void
3671 expand_computed_goto (tree exp)
3673 rtx x = expand_normal (exp);
3675 do_pending_stack_adjust ();
3676 emit_indirect_jump (x);
3679 /* Generate RTL code for a `goto' statement with target label LABEL.
3680 LABEL should be a LABEL_DECL tree node that was or will later be
3681 defined with `expand_label'. */
3683 static void
3684 expand_goto (tree label)
3686 if (flag_checking)
3688 /* Check for a nonlocal goto to a containing function. Should have
3689 gotten translated to __builtin_nonlocal_goto. */
3690 tree context = decl_function_context (label);
3691 gcc_assert (!context || context == current_function_decl);
3694 emit_jump (jump_target_rtx (label));
3697 /* Output a return with no value. */
3699 static void
3700 expand_null_return_1 (void)
3702 clear_pending_stack_adjust ();
3703 do_pending_stack_adjust ();
3704 emit_jump (return_label);
3707 /* Generate RTL to return from the current function, with no value.
3708 (That is, we do not do anything about returning any value.) */
3710 void
3711 expand_null_return (void)
3713 /* If this function was declared to return a value, but we
3714 didn't, clobber the return registers so that they are not
3715 propagated live to the rest of the function. */
3716 clobber_return_register ();
3718 expand_null_return_1 ();
3721 /* Generate RTL to return from the current function, with value VAL. */
3723 static void
3724 expand_value_return (rtx val)
3726 /* Copy the value to the return location unless it's already there. */
3728 tree decl = DECL_RESULT (current_function_decl);
3729 rtx return_reg = DECL_RTL (decl);
3730 if (return_reg != val)
3732 tree funtype = TREE_TYPE (current_function_decl);
3733 tree type = TREE_TYPE (decl);
3734 int unsignedp = TYPE_UNSIGNED (type);
3735 machine_mode old_mode = DECL_MODE (decl);
3736 machine_mode mode;
3737 if (DECL_BY_REFERENCE (decl))
3738 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3739 else
3740 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3742 if (mode != old_mode)
3744 /* Some ABIs require scalar floating point modes to be returned
3745 in a wider scalar integer mode. We need to explicitly
3746 reinterpret to an integer mode of the correct precision
3747 before extending to the desired result. */
3748 if (SCALAR_INT_MODE_P (mode)
3749 && SCALAR_FLOAT_MODE_P (old_mode)
3750 && known_gt (GET_MODE_SIZE (mode), GET_MODE_SIZE (old_mode)))
3751 val = convert_float_to_wider_int (mode, old_mode, val);
3752 else
3753 val = convert_modes (mode, old_mode, val, unsignedp);
3756 if (GET_CODE (return_reg) == PARALLEL)
3757 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3758 else
3759 emit_move_insn (return_reg, val);
3762 expand_null_return_1 ();
3765 /* Generate RTL to evaluate the expression RETVAL and return it
3766 from the current function. */
3768 static void
3769 expand_return (tree retval)
3771 rtx result_rtl;
3772 rtx val = 0;
3773 tree retval_rhs;
3775 /* If function wants no value, give it none. */
3776 if (VOID_TYPE_P (TREE_TYPE (TREE_TYPE (current_function_decl))))
3778 expand_normal (retval);
3779 expand_null_return ();
3780 return;
3783 if (retval == error_mark_node)
3785 /* Treat this like a return of no value from a function that
3786 returns a value. */
3787 expand_null_return ();
3788 return;
3790 else if ((TREE_CODE (retval) == MODIFY_EXPR
3791 || TREE_CODE (retval) == INIT_EXPR)
3792 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3793 retval_rhs = TREE_OPERAND (retval, 1);
3794 else
3795 retval_rhs = retval;
3797 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3799 /* If we are returning the RESULT_DECL, then the value has already
3800 been stored into it, so we don't have to do anything special. */
3801 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3802 expand_value_return (result_rtl);
3804 /* If the result is an aggregate that is being returned in one (or more)
3805 registers, load the registers here. */
3807 else if (retval_rhs != 0
3808 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3809 && REG_P (result_rtl))
3811 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3812 if (val)
3814 /* Use the mode of the result value on the return register. */
3815 PUT_MODE (result_rtl, GET_MODE (val));
3816 expand_value_return (val);
3818 else
3819 expand_null_return ();
3821 else if (retval_rhs != 0
3822 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3823 && (REG_P (result_rtl)
3824 || (GET_CODE (result_rtl) == PARALLEL)))
3826 /* Compute the return value into a temporary (usually a pseudo reg). */
3828 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3829 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3830 val = force_not_mem (val);
3831 expand_value_return (val);
3833 else
3835 /* No hard reg used; calculate value into hard return reg. */
3836 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3837 expand_value_return (result_rtl);
3841 /* Expand a clobber of LHS. If LHS is stored it in a multi-part
3842 register, tell the rtl optimizers that its value is no longer
3843 needed. */
3845 static void
3846 expand_clobber (tree lhs)
3848 if (DECL_P (lhs))
3850 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3851 if (decl_rtl && REG_P (decl_rtl))
3853 machine_mode decl_mode = GET_MODE (decl_rtl);
3854 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3855 REGMODE_NATURAL_SIZE (decl_mode)))
3856 emit_clobber (decl_rtl);
3861 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3862 STMT that doesn't require special handling for outgoing edges. That
3863 is no tailcalls and no GIMPLE_COND. */
3865 static void
3866 expand_gimple_stmt_1 (gimple *stmt)
3868 tree op0;
3870 set_curr_insn_location (gimple_location (stmt));
3872 switch (gimple_code (stmt))
3874 case GIMPLE_GOTO:
3875 op0 = gimple_goto_dest (stmt);
3876 if (TREE_CODE (op0) == LABEL_DECL)
3877 expand_goto (op0);
3878 else
3879 expand_computed_goto (op0);
3880 break;
3881 case GIMPLE_LABEL:
3882 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3883 break;
3884 case GIMPLE_NOP:
3885 case GIMPLE_PREDICT:
3886 break;
3887 case GIMPLE_SWITCH:
3889 gswitch *swtch = as_a <gswitch *> (stmt);
3890 if (gimple_switch_num_labels (swtch) == 1)
3891 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3892 else
3893 expand_case (swtch);
3895 break;
3896 case GIMPLE_ASM:
3897 expand_asm_stmt (as_a <gasm *> (stmt));
3898 break;
3899 case GIMPLE_CALL:
3900 expand_call_stmt (as_a <gcall *> (stmt));
3901 break;
3903 case GIMPLE_RETURN:
3905 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3907 /* If a return doesn't have a location, it very likely represents
3908 multiple user returns so we cannot let it inherit the location
3909 of the last statement of the previous basic block in RTL. */
3910 if (!gimple_has_location (stmt))
3911 set_curr_insn_location (cfun->function_end_locus);
3913 if (op0 && op0 != error_mark_node)
3915 tree result = DECL_RESULT (current_function_decl);
3917 /* If we are not returning the current function's RESULT_DECL,
3918 build an assignment to it. */
3919 if (op0 != result)
3921 /* I believe that a function's RESULT_DECL is unique. */
3922 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3924 /* ??? We'd like to use simply expand_assignment here,
3925 but this fails if the value is of BLKmode but the return
3926 decl is a register. expand_return has special handling
3927 for this combination, which eventually should move
3928 to common code. See comments there. Until then, let's
3929 build a modify expression :-/ */
3930 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3931 result, op0);
3935 if (!op0)
3936 expand_null_return ();
3937 else
3938 expand_return (op0);
3940 break;
3942 case GIMPLE_ASSIGN:
3944 gassign *assign_stmt = as_a <gassign *> (stmt);
3945 tree lhs = gimple_assign_lhs (assign_stmt);
3947 /* Tree expand used to fiddle with |= and &= of two bitfield
3948 COMPONENT_REFs here. This can't happen with gimple, the LHS
3949 of binary assigns must be a gimple reg. */
3951 if (TREE_CODE (lhs) != SSA_NAME
3952 || gimple_assign_rhs_class (assign_stmt) == GIMPLE_SINGLE_RHS)
3954 tree rhs = gimple_assign_rhs1 (assign_stmt);
3955 gcc_assert (gimple_assign_rhs_class (assign_stmt)
3956 == GIMPLE_SINGLE_RHS);
3957 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3958 /* Do not put locations on possibly shared trees. */
3959 && !is_gimple_min_invariant (rhs))
3960 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3961 if (TREE_CLOBBER_P (rhs))
3962 /* This is a clobber to mark the going out of scope for
3963 this LHS. */
3964 expand_clobber (lhs);
3965 else
3966 expand_assignment (lhs, rhs,
3967 gimple_assign_nontemporal_move_p (
3968 assign_stmt));
3970 else
3972 rtx target, temp;
3973 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3974 struct separate_ops ops;
3975 bool promoted = false;
3977 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3978 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3979 promoted = true;
3981 ops.code = gimple_assign_rhs_code (assign_stmt);
3982 ops.type = TREE_TYPE (lhs);
3983 switch (get_gimple_rhs_class (ops.code))
3985 case GIMPLE_TERNARY_RHS:
3986 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3987 /* Fallthru */
3988 case GIMPLE_BINARY_RHS:
3989 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3990 /* Fallthru */
3991 case GIMPLE_UNARY_RHS:
3992 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3993 break;
3994 default:
3995 gcc_unreachable ();
3997 ops.location = gimple_location (stmt);
3999 /* If we want to use a nontemporal store, force the value to
4000 register first. If we store into a promoted register,
4001 don't directly expand to target. */
4002 temp = nontemporal || promoted ? NULL_RTX : target;
4003 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
4004 EXPAND_NORMAL);
4006 if (temp == target)
4008 else if (promoted)
4010 int unsignedp = SUBREG_PROMOTED_SIGN (target);
4011 /* If TEMP is a VOIDmode constant, use convert_modes to make
4012 sure that we properly convert it. */
4013 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
4015 temp = convert_modes (GET_MODE (target),
4016 TYPE_MODE (ops.type),
4017 temp, unsignedp);
4018 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
4019 GET_MODE (target), temp, unsignedp);
4022 convert_move (SUBREG_REG (target), temp, unsignedp);
4024 else if (nontemporal && emit_storent_insn (target, temp))
4026 else
4028 temp = force_operand (temp, target);
4029 if (temp != target)
4030 emit_move_insn (target, temp);
4034 break;
4036 default:
4037 gcc_unreachable ();
4041 /* Expand one gimple statement STMT and return the last RTL instruction
4042 before any of the newly generated ones.
4044 In addition to generating the necessary RTL instructions this also
4045 sets REG_EH_REGION notes if necessary and sets the current source
4046 location for diagnostics. */
4048 static rtx_insn *
4049 expand_gimple_stmt (gimple *stmt)
4051 location_t saved_location = input_location;
4052 rtx_insn *last = get_last_insn ();
4053 int lp_nr;
4055 gcc_assert (cfun);
4057 /* We need to save and restore the current source location so that errors
4058 discovered during expansion are emitted with the right location. But
4059 it would be better if the diagnostic routines used the source location
4060 embedded in the tree nodes rather than globals. */
4061 if (gimple_has_location (stmt))
4062 input_location = gimple_location (stmt);
4064 expand_gimple_stmt_1 (stmt);
4066 /* Free any temporaries used to evaluate this statement. */
4067 free_temp_slots ();
4069 input_location = saved_location;
4071 /* Mark all insns that may trap. */
4072 lp_nr = lookup_stmt_eh_lp (stmt);
4073 if (lp_nr)
4075 rtx_insn *insn;
4076 for (insn = next_real_insn (last); insn;
4077 insn = next_real_insn (insn))
4079 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
4080 /* If we want exceptions for non-call insns, any
4081 may_trap_p instruction may throw. */
4082 && GET_CODE (PATTERN (insn)) != CLOBBER
4083 && GET_CODE (PATTERN (insn)) != USE
4084 && insn_could_throw_p (insn))
4085 make_reg_eh_region_note (insn, 0, lp_nr);
4089 return last;
4092 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
4093 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
4094 generated a tail call (something that might be denied by the ABI
4095 rules governing the call; see calls.cc).
4097 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
4098 can still reach the rest of BB. The case here is __builtin_sqrt,
4099 where the NaN result goes through the external function (with a
4100 tailcall) and the normal result happens via a sqrt instruction. */
4102 static basic_block
4103 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
4105 rtx_insn *last2, *last;
4106 edge e;
4107 edge_iterator ei;
4108 profile_probability probability;
4110 last2 = last = expand_gimple_stmt (stmt);
4112 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
4113 if (CALL_P (last) && SIBLING_CALL_P (last))
4114 goto found;
4116 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4118 *can_fallthru = true;
4119 return NULL;
4121 found:
4122 /* ??? Wouldn't it be better to just reset any pending stack adjust?
4123 Any instructions emitted here are about to be deleted. */
4124 do_pending_stack_adjust ();
4126 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
4127 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
4128 EH or abnormal edges, we shouldn't have created a tail call in
4129 the first place. So it seems to me we should just be removing
4130 all edges here, or redirecting the existing fallthru edge to
4131 the exit block. */
4133 probability = profile_probability::never ();
4135 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
4137 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
4139 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
4140 e->dest->count -= e->count ();
4141 probability += e->probability;
4142 remove_edge (e);
4144 else
4145 ei_next (&ei);
4148 /* This is somewhat ugly: the call_expr expander often emits instructions
4149 after the sibcall (to perform the function return). These confuse the
4150 find_many_sub_basic_blocks code, so we need to get rid of these. */
4151 last = NEXT_INSN (last);
4152 gcc_assert (BARRIER_P (last));
4154 *can_fallthru = false;
4155 while (NEXT_INSN (last))
4157 /* For instance an sqrt builtin expander expands if with
4158 sibcall in the then and label for `else`. */
4159 if (LABEL_P (NEXT_INSN (last)))
4161 *can_fallthru = true;
4162 break;
4164 delete_insn (NEXT_INSN (last));
4167 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
4168 | EDGE_SIBCALL);
4169 e->probability = probability;
4170 BB_END (bb) = last;
4171 update_bb_for_insn (bb);
4173 if (NEXT_INSN (last))
4175 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
4177 last = BB_END (bb);
4178 if (BARRIER_P (last))
4179 BB_END (bb) = PREV_INSN (last);
4182 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4184 return bb;
4187 /* Return the difference between the floor and the truncated result of
4188 a signed division by OP1 with remainder MOD. */
4189 static rtx
4190 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4192 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
4193 return gen_rtx_IF_THEN_ELSE
4194 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4195 gen_rtx_IF_THEN_ELSE
4196 (mode, gen_rtx_LT (BImode,
4197 gen_rtx_DIV (mode, op1, mod),
4198 const0_rtx),
4199 constm1_rtx, const0_rtx),
4200 const0_rtx);
4203 /* Return the difference between the ceil and the truncated result of
4204 a signed division by OP1 with remainder MOD. */
4205 static rtx
4206 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4208 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
4209 return gen_rtx_IF_THEN_ELSE
4210 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4211 gen_rtx_IF_THEN_ELSE
4212 (mode, gen_rtx_GT (BImode,
4213 gen_rtx_DIV (mode, op1, mod),
4214 const0_rtx),
4215 const1_rtx, const0_rtx),
4216 const0_rtx);
4219 /* Return the difference between the ceil and the truncated result of
4220 an unsigned division by OP1 with remainder MOD. */
4221 static rtx
4222 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
4224 /* (mod != 0 ? 1 : 0) */
4225 return gen_rtx_IF_THEN_ELSE
4226 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4227 const1_rtx, const0_rtx);
4230 /* Return the difference between the rounded and the truncated result
4231 of a signed division by OP1 with remainder MOD. Halfway cases are
4232 rounded away from zero, rather than to the nearest even number. */
4233 static rtx
4234 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4236 /* (abs (mod) >= abs (op1) - abs (mod)
4237 ? (op1 / mod > 0 ? 1 : -1)
4238 : 0) */
4239 return gen_rtx_IF_THEN_ELSE
4240 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
4241 gen_rtx_MINUS (mode,
4242 gen_rtx_ABS (mode, op1),
4243 gen_rtx_ABS (mode, mod))),
4244 gen_rtx_IF_THEN_ELSE
4245 (mode, gen_rtx_GT (BImode,
4246 gen_rtx_DIV (mode, op1, mod),
4247 const0_rtx),
4248 const1_rtx, constm1_rtx),
4249 const0_rtx);
4252 /* Return the difference between the rounded and the truncated result
4253 of a unsigned division by OP1 with remainder MOD. Halfway cases
4254 are rounded away from zero, rather than to the nearest even
4255 number. */
4256 static rtx
4257 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4259 /* (mod >= op1 - mod ? 1 : 0) */
4260 return gen_rtx_IF_THEN_ELSE
4261 (mode, gen_rtx_GE (BImode, mod,
4262 gen_rtx_MINUS (mode, op1, mod)),
4263 const1_rtx, const0_rtx);
4266 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4267 any rtl. */
4269 static rtx
4270 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4271 addr_space_t as)
4273 #ifndef POINTERS_EXTEND_UNSIGNED
4274 gcc_assert (mode == Pmode
4275 || mode == targetm.addr_space.address_mode (as));
4276 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4277 #else
4278 rtx temp;
4280 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
4282 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4283 return x;
4285 /* X must have some form of address mode already. */
4286 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
4287 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4288 x = lowpart_subreg (mode, x, xmode);
4289 else if (POINTERS_EXTEND_UNSIGNED > 0)
4290 x = gen_rtx_ZERO_EXTEND (mode, x);
4291 else if (!POINTERS_EXTEND_UNSIGNED)
4292 x = gen_rtx_SIGN_EXTEND (mode, x);
4293 else
4295 switch (GET_CODE (x))
4297 case SUBREG:
4298 if ((SUBREG_PROMOTED_VAR_P (x)
4299 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4300 || (GET_CODE (SUBREG_REG (x)) == PLUS
4301 && REG_P (XEXP (SUBREG_REG (x), 0))
4302 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4303 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4304 && GET_MODE (SUBREG_REG (x)) == mode)
4305 return SUBREG_REG (x);
4306 break;
4307 case LABEL_REF:
4308 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4309 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4310 return temp;
4311 case SYMBOL_REF:
4312 temp = shallow_copy_rtx (x);
4313 PUT_MODE (temp, mode);
4314 return temp;
4315 case CONST:
4316 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4317 if (temp)
4318 temp = gen_rtx_CONST (mode, temp);
4319 return temp;
4320 case PLUS:
4321 case MINUS:
4322 if (CONST_INT_P (XEXP (x, 1)))
4324 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4325 if (temp)
4326 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4328 break;
4329 default:
4330 break;
4332 /* Don't know how to express ptr_extend as operation in debug info. */
4333 return NULL;
4335 #endif /* POINTERS_EXTEND_UNSIGNED */
4337 return x;
4340 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4341 by avoid_deep_ter_for_debug. */
4343 static hash_map<tree, tree> *deep_ter_debug_map;
4345 /* Split too deep TER chains for debug stmts using debug temporaries. */
4347 static void
4348 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4350 use_operand_p use_p;
4351 ssa_op_iter iter;
4352 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4354 tree use = USE_FROM_PTR (use_p);
4355 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4356 continue;
4357 gimple *g = get_gimple_for_ssa_name (use);
4358 if (g == NULL)
4359 continue;
4360 if (depth > 6 && !stmt_ends_bb_p (g))
4362 if (deep_ter_debug_map == NULL)
4363 deep_ter_debug_map = new hash_map<tree, tree>;
4365 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4366 if (vexpr != NULL)
4367 continue;
4368 vexpr = build_debug_expr_decl (TREE_TYPE (use));
4369 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4370 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4371 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4372 avoid_deep_ter_for_debug (def_temp, 0);
4374 else
4375 avoid_deep_ter_for_debug (g, depth + 1);
4379 /* Return an RTX equivalent to the value of the parameter DECL. */
4381 static rtx
4382 expand_debug_parm_decl (tree decl)
4384 rtx incoming = DECL_INCOMING_RTL (decl);
4386 if (incoming
4387 && GET_MODE (incoming) != BLKmode
4388 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4389 || (MEM_P (incoming)
4390 && REG_P (XEXP (incoming, 0))
4391 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4393 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4395 #ifdef HAVE_window_save
4396 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4397 If the target machine has an explicit window save instruction, the
4398 actual entry value is the corresponding OUTGOING_REGNO instead. */
4399 if (REG_P (incoming)
4400 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4401 incoming
4402 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4403 OUTGOING_REGNO (REGNO (incoming)), 0);
4404 else if (MEM_P (incoming))
4406 rtx reg = XEXP (incoming, 0);
4407 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4409 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4410 incoming = replace_equiv_address_nv (incoming, reg);
4412 else
4413 incoming = copy_rtx (incoming);
4415 #endif
4417 ENTRY_VALUE_EXP (rtl) = incoming;
4418 return rtl;
4421 if (incoming
4422 && GET_MODE (incoming) != BLKmode
4423 && !TREE_ADDRESSABLE (decl)
4424 && MEM_P (incoming)
4425 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4426 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4427 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4428 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4429 return copy_rtx (incoming);
4431 return NULL_RTX;
4434 /* Return an RTX equivalent to the value of the tree expression EXP. */
4436 static rtx
4437 expand_debug_expr (tree exp)
4439 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4440 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4441 machine_mode inner_mode = VOIDmode;
4442 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4443 addr_space_t as;
4444 scalar_int_mode op0_mode, op1_mode, addr_mode;
4446 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4448 case tcc_expression:
4449 switch (TREE_CODE (exp))
4451 case COND_EXPR:
4452 case DOT_PROD_EXPR:
4453 case SAD_EXPR:
4454 case WIDEN_MULT_PLUS_EXPR:
4455 case WIDEN_MULT_MINUS_EXPR:
4456 goto ternary;
4458 case TRUTH_ANDIF_EXPR:
4459 case TRUTH_ORIF_EXPR:
4460 case TRUTH_AND_EXPR:
4461 case TRUTH_OR_EXPR:
4462 case TRUTH_XOR_EXPR:
4463 goto binary;
4465 case TRUTH_NOT_EXPR:
4466 goto unary;
4468 default:
4469 break;
4471 break;
4473 ternary:
4474 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4475 if (!op2)
4476 return NULL_RTX;
4477 /* Fall through. */
4479 binary:
4480 case tcc_binary:
4481 if (mode == BLKmode)
4482 return NULL_RTX;
4483 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4484 if (!op1)
4485 return NULL_RTX;
4486 switch (TREE_CODE (exp))
4488 case LSHIFT_EXPR:
4489 case RSHIFT_EXPR:
4490 case LROTATE_EXPR:
4491 case RROTATE_EXPR:
4492 case WIDEN_LSHIFT_EXPR:
4493 /* Ensure second operand isn't wider than the first one. */
4494 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4495 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4496 && (GET_MODE_UNIT_PRECISION (mode)
4497 < GET_MODE_PRECISION (op1_mode)))
4498 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4499 break;
4500 default:
4501 break;
4503 /* Fall through. */
4505 unary:
4506 case tcc_unary:
4507 if (mode == BLKmode)
4508 return NULL_RTX;
4509 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4510 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4511 if (!op0)
4512 return NULL_RTX;
4513 break;
4515 case tcc_comparison:
4516 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4517 goto binary;
4519 case tcc_type:
4520 case tcc_statement:
4521 gcc_unreachable ();
4523 case tcc_constant:
4524 case tcc_exceptional:
4525 case tcc_declaration:
4526 case tcc_reference:
4527 case tcc_vl_exp:
4528 break;
4531 switch (TREE_CODE (exp))
4533 case STRING_CST:
4534 if (!lookup_constant_def (exp))
4536 if (strlen (TREE_STRING_POINTER (exp)) + 1
4537 != (size_t) TREE_STRING_LENGTH (exp))
4538 return NULL_RTX;
4539 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4540 op0 = gen_rtx_MEM (BLKmode, op0);
4541 set_mem_attributes (op0, exp, 0);
4542 return op0;
4544 /* Fall through. */
4546 case INTEGER_CST:
4547 if (TREE_CODE (TREE_TYPE (exp)) == BITINT_TYPE
4548 && TYPE_MODE (TREE_TYPE (exp)) == BLKmode)
4549 return NULL;
4550 /* FALLTHRU */
4551 case REAL_CST:
4552 case FIXED_CST:
4553 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4554 return op0;
4556 case POLY_INT_CST:
4557 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4559 case COMPLEX_CST:
4560 gcc_assert (COMPLEX_MODE_P (mode));
4561 op0 = expand_debug_expr (TREE_REALPART (exp));
4562 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4563 return gen_rtx_CONCAT (mode, op0, op1);
4565 case DEBUG_EXPR_DECL:
4566 op0 = DECL_RTL_IF_SET (exp);
4568 if (op0)
4570 if (GET_MODE (op0) != mode)
4571 gcc_assert (VECTOR_TYPE_P (TREE_TYPE (exp)));
4572 else
4573 return op0;
4576 op0 = gen_rtx_DEBUG_EXPR (mode);
4577 DEBUG_EXPR_TREE_DECL (op0) = exp;
4578 SET_DECL_RTL (exp, op0);
4580 return op0;
4582 case VAR_DECL:
4583 case PARM_DECL:
4584 case FUNCTION_DECL:
4585 case LABEL_DECL:
4586 case CONST_DECL:
4587 case RESULT_DECL:
4588 op0 = DECL_RTL_IF_SET (exp);
4590 /* This decl was probably optimized away. */
4591 if (!op0
4592 /* At least label RTXen are sometimes replaced by
4593 NOTE_INSN_DELETED_LABEL. Any notes here are not
4594 handled by copy_rtx. */
4595 || NOTE_P (op0))
4597 if (!VAR_P (exp)
4598 || DECL_EXTERNAL (exp)
4599 || !TREE_STATIC (exp)
4600 || !DECL_NAME (exp)
4601 || DECL_HARD_REGISTER (exp)
4602 || DECL_IN_CONSTANT_POOL (exp)
4603 || mode == VOIDmode
4604 || symtab_node::get (exp) == NULL)
4605 return NULL;
4607 op0 = make_decl_rtl_for_debug (exp);
4608 if (!MEM_P (op0)
4609 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4610 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4611 return NULL;
4613 else if (VAR_P (exp)
4614 && is_global_var (exp)
4615 && symtab_node::get (exp) == NULL)
4616 return NULL;
4617 else
4618 op0 = copy_rtx (op0);
4620 if (GET_MODE (op0) == BLKmode
4621 /* If op0 is not BLKmode, but mode is, adjust_mode
4622 below would ICE. While it is likely a FE bug,
4623 try to be robust here. See PR43166. */
4624 || mode == BLKmode
4625 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4627 gcc_assert (MEM_P (op0));
4628 op0 = adjust_address_nv (op0, mode, 0);
4629 return op0;
4632 /* Fall through. */
4634 adjust_mode:
4635 case PAREN_EXPR:
4636 CASE_CONVERT:
4638 inner_mode = GET_MODE (op0);
4640 if (mode == inner_mode)
4641 return op0;
4643 if (inner_mode == VOIDmode)
4645 if (TREE_CODE (exp) == SSA_NAME)
4646 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4647 else
4648 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4649 if (mode == inner_mode)
4650 return op0;
4653 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4655 if (GET_MODE_UNIT_BITSIZE (mode)
4656 == GET_MODE_UNIT_BITSIZE (inner_mode))
4657 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4658 else if (GET_MODE_UNIT_BITSIZE (mode)
4659 < GET_MODE_UNIT_BITSIZE (inner_mode))
4660 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4661 else
4662 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4664 else if (FLOAT_MODE_P (mode))
4666 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4667 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4668 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4669 else
4670 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4672 else if (FLOAT_MODE_P (inner_mode))
4674 if (unsignedp)
4675 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4676 else
4677 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4679 else if (GET_MODE_UNIT_PRECISION (mode)
4680 == GET_MODE_UNIT_PRECISION (inner_mode))
4681 op0 = lowpart_subreg (mode, op0, inner_mode);
4682 else if (GET_MODE_UNIT_PRECISION (mode)
4683 < GET_MODE_UNIT_PRECISION (inner_mode))
4684 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4685 else if (UNARY_CLASS_P (exp)
4686 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4687 : unsignedp)
4688 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4689 else
4690 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4692 return op0;
4695 case MEM_REF:
4696 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4698 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4699 TREE_OPERAND (exp, 0),
4700 TREE_OPERAND (exp, 1));
4701 if (newexp)
4702 return expand_debug_expr (newexp);
4704 /* FALLTHROUGH */
4705 case INDIRECT_REF:
4706 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4707 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4708 if (!op0)
4709 return NULL;
4711 if (TREE_CODE (exp) == MEM_REF)
4713 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4714 || (GET_CODE (op0) == PLUS
4715 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4716 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4717 Instead just use get_inner_reference. */
4718 goto component_ref;
4720 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4721 poly_int64 offset;
4722 if (!op1 || !poly_int_rtx_p (op1, &offset))
4723 return NULL;
4725 op0 = plus_constant (inner_mode, op0, offset);
4728 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4730 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4731 op0, as);
4732 if (op0 == NULL_RTX)
4733 return NULL;
4735 op0 = gen_rtx_MEM (mode, op0);
4736 set_mem_attributes (op0, exp, 0);
4737 if (TREE_CODE (exp) == MEM_REF
4738 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4739 set_mem_expr (op0, NULL_TREE);
4740 set_mem_addr_space (op0, as);
4742 return op0;
4744 case TARGET_MEM_REF:
4745 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4746 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4747 return NULL;
4749 op0 = expand_debug_expr
4750 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4751 if (!op0)
4752 return NULL;
4754 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4755 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4756 op0, as);
4757 if (op0 == NULL_RTX)
4758 return NULL;
4760 op0 = gen_rtx_MEM (mode, op0);
4762 set_mem_attributes (op0, exp, 0);
4763 set_mem_addr_space (op0, as);
4765 return op0;
4767 component_ref:
4768 case ARRAY_REF:
4769 case ARRAY_RANGE_REF:
4770 case COMPONENT_REF:
4771 case BIT_FIELD_REF:
4772 case REALPART_EXPR:
4773 case IMAGPART_EXPR:
4774 case VIEW_CONVERT_EXPR:
4776 machine_mode mode1;
4777 poly_int64 bitsize, bitpos;
4778 tree offset;
4779 int reversep, volatilep = 0;
4780 tree tem
4781 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4782 &unsignedp, &reversep, &volatilep);
4783 rtx orig_op0;
4785 if (known_eq (bitsize, 0))
4786 return NULL;
4788 orig_op0 = op0 = expand_debug_expr (tem);
4790 if (!op0)
4791 return NULL;
4793 if (offset)
4795 machine_mode addrmode, offmode;
4797 if (!MEM_P (op0))
4798 return NULL;
4800 op0 = XEXP (op0, 0);
4801 addrmode = GET_MODE (op0);
4802 if (addrmode == VOIDmode)
4803 addrmode = Pmode;
4805 op1 = expand_debug_expr (offset);
4806 if (!op1)
4807 return NULL;
4809 offmode = GET_MODE (op1);
4810 if (offmode == VOIDmode)
4811 offmode = TYPE_MODE (TREE_TYPE (offset));
4813 if (addrmode != offmode)
4814 op1 = lowpart_subreg (addrmode, op1, offmode);
4816 /* Don't use offset_address here, we don't need a
4817 recognizable address, and we don't want to generate
4818 code. */
4819 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4820 op0, op1));
4823 if (MEM_P (op0))
4825 if (mode1 == VOIDmode)
4827 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4828 return NULL;
4829 /* Bitfield. */
4830 mode1 = smallest_int_mode_for_size (bitsize);
4832 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4833 if (maybe_ne (bytepos, 0))
4835 op0 = adjust_address_nv (op0, mode1, bytepos);
4836 bitpos = num_trailing_bits (bitpos);
4838 else if (known_eq (bitpos, 0)
4839 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4840 op0 = adjust_address_nv (op0, mode, 0);
4841 else if (GET_MODE (op0) != mode1)
4842 op0 = adjust_address_nv (op0, mode1, 0);
4843 else
4844 op0 = copy_rtx (op0);
4845 if (op0 == orig_op0)
4846 op0 = shallow_copy_rtx (op0);
4847 if (TREE_CODE (tem) != SSA_NAME)
4848 set_mem_attributes (op0, exp, 0);
4851 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4852 return op0;
4854 if (maybe_lt (bitpos, 0))
4855 return NULL;
4857 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4858 return NULL;
4860 poly_int64 bytepos;
4861 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4862 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4864 machine_mode opmode = GET_MODE (op0);
4866 if (opmode == VOIDmode)
4867 opmode = TYPE_MODE (TREE_TYPE (tem));
4869 /* This condition may hold if we're expanding the address
4870 right past the end of an array that turned out not to
4871 be addressable (i.e., the address was only computed in
4872 debug stmts). The gen_subreg below would rightfully
4873 crash, and the address doesn't really exist, so just
4874 drop it. */
4875 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4876 return NULL;
4878 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4879 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4882 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4883 && TYPE_UNSIGNED (TREE_TYPE (exp))
4884 ? SIGN_EXTRACT
4885 : ZERO_EXTRACT, mode,
4886 GET_MODE (op0) != VOIDmode
4887 ? GET_MODE (op0)
4888 : TYPE_MODE (TREE_TYPE (tem)),
4889 op0, gen_int_mode (bitsize, word_mode),
4890 gen_int_mode (bitpos, word_mode));
4893 case ABS_EXPR:
4894 case ABSU_EXPR:
4895 return simplify_gen_unary (ABS, mode, op0, mode);
4897 case NEGATE_EXPR:
4898 return simplify_gen_unary (NEG, mode, op0, mode);
4900 case BIT_NOT_EXPR:
4901 return simplify_gen_unary (NOT, mode, op0, mode);
4903 case FLOAT_EXPR:
4904 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4905 0)))
4906 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4907 inner_mode);
4909 case FIX_TRUNC_EXPR:
4910 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4911 inner_mode);
4913 case POINTER_PLUS_EXPR:
4914 /* For the rare target where pointers are not the same size as
4915 size_t, we need to check for mis-matched modes and correct
4916 the addend. */
4917 if (op0 && op1
4918 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4919 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4920 && op0_mode != op1_mode)
4922 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4923 /* If OP0 is a partial mode, then we must truncate, even
4924 if it has the same bitsize as OP1 as GCC's
4925 representation of partial modes is opaque. */
4926 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4927 && (GET_MODE_BITSIZE (op0_mode)
4928 == GET_MODE_BITSIZE (op1_mode))))
4929 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4930 else
4931 /* We always sign-extend, regardless of the signedness of
4932 the operand, because the operand is always unsigned
4933 here even if the original C expression is signed. */
4934 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4936 /* Fall through. */
4937 case PLUS_EXPR:
4938 return simplify_gen_binary (PLUS, mode, op0, op1);
4940 case MINUS_EXPR:
4941 case POINTER_DIFF_EXPR:
4942 return simplify_gen_binary (MINUS, mode, op0, op1);
4944 case MULT_EXPR:
4945 return simplify_gen_binary (MULT, mode, op0, op1);
4947 case RDIV_EXPR:
4948 case TRUNC_DIV_EXPR:
4949 case EXACT_DIV_EXPR:
4950 if (unsignedp)
4951 return simplify_gen_binary (UDIV, mode, op0, op1);
4952 else
4953 return simplify_gen_binary (DIV, mode, op0, op1);
4955 case TRUNC_MOD_EXPR:
4956 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4958 case FLOOR_DIV_EXPR:
4959 if (unsignedp)
4960 return simplify_gen_binary (UDIV, mode, op0, op1);
4961 else
4963 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4964 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4965 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4966 return simplify_gen_binary (PLUS, mode, div, adj);
4969 case FLOOR_MOD_EXPR:
4970 if (unsignedp)
4971 return simplify_gen_binary (UMOD, mode, op0, op1);
4972 else
4974 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4975 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4976 adj = simplify_gen_unary (NEG, mode,
4977 simplify_gen_binary (MULT, mode, adj, op1),
4978 mode);
4979 return simplify_gen_binary (PLUS, mode, mod, adj);
4982 case CEIL_DIV_EXPR:
4983 if (unsignedp)
4985 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4986 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4987 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4988 return simplify_gen_binary (PLUS, mode, div, adj);
4990 else
4992 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4993 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4994 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4995 return simplify_gen_binary (PLUS, mode, div, adj);
4998 case CEIL_MOD_EXPR:
4999 if (unsignedp)
5001 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5002 rtx adj = ceil_udiv_adjust (mode, mod, op1);
5003 adj = simplify_gen_unary (NEG, mode,
5004 simplify_gen_binary (MULT, mode, adj, op1),
5005 mode);
5006 return simplify_gen_binary (PLUS, mode, mod, adj);
5008 else
5010 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5011 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
5012 adj = simplify_gen_unary (NEG, mode,
5013 simplify_gen_binary (MULT, mode, adj, op1),
5014 mode);
5015 return simplify_gen_binary (PLUS, mode, mod, adj);
5018 case ROUND_DIV_EXPR:
5019 if (unsignedp)
5021 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
5022 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5023 rtx adj = round_udiv_adjust (mode, mod, op1);
5024 return simplify_gen_binary (PLUS, mode, div, adj);
5026 else
5028 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
5029 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5030 rtx adj = round_sdiv_adjust (mode, mod, op1);
5031 return simplify_gen_binary (PLUS, mode, div, adj);
5034 case ROUND_MOD_EXPR:
5035 if (unsignedp)
5037 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5038 rtx adj = round_udiv_adjust (mode, mod, op1);
5039 adj = simplify_gen_unary (NEG, mode,
5040 simplify_gen_binary (MULT, mode, adj, op1),
5041 mode);
5042 return simplify_gen_binary (PLUS, mode, mod, adj);
5044 else
5046 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5047 rtx adj = round_sdiv_adjust (mode, mod, op1);
5048 adj = simplify_gen_unary (NEG, mode,
5049 simplify_gen_binary (MULT, mode, adj, op1),
5050 mode);
5051 return simplify_gen_binary (PLUS, mode, mod, adj);
5054 case LSHIFT_EXPR:
5055 return simplify_gen_binary (ASHIFT, mode, op0, op1);
5057 case RSHIFT_EXPR:
5058 if (unsignedp)
5059 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
5060 else
5061 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
5063 case LROTATE_EXPR:
5064 return simplify_gen_binary (ROTATE, mode, op0, op1);
5066 case RROTATE_EXPR:
5067 return simplify_gen_binary (ROTATERT, mode, op0, op1);
5069 case MIN_EXPR:
5070 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
5072 case MAX_EXPR:
5073 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
5075 case BIT_AND_EXPR:
5076 case TRUTH_AND_EXPR:
5077 return simplify_gen_binary (AND, mode, op0, op1);
5079 case BIT_IOR_EXPR:
5080 case TRUTH_OR_EXPR:
5081 return simplify_gen_binary (IOR, mode, op0, op1);
5083 case BIT_XOR_EXPR:
5084 case TRUTH_XOR_EXPR:
5085 return simplify_gen_binary (XOR, mode, op0, op1);
5087 case TRUTH_ANDIF_EXPR:
5088 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
5090 case TRUTH_ORIF_EXPR:
5091 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
5093 case TRUTH_NOT_EXPR:
5094 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
5096 case LT_EXPR:
5097 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
5098 op0, op1);
5100 case LE_EXPR:
5101 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
5102 op0, op1);
5104 case GT_EXPR:
5105 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
5106 op0, op1);
5108 case GE_EXPR:
5109 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
5110 op0, op1);
5112 case EQ_EXPR:
5113 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
5115 case NE_EXPR:
5116 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
5118 case UNORDERED_EXPR:
5119 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
5121 case ORDERED_EXPR:
5122 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
5124 case UNLT_EXPR:
5125 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
5127 case UNLE_EXPR:
5128 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
5130 case UNGT_EXPR:
5131 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
5133 case UNGE_EXPR:
5134 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
5136 case UNEQ_EXPR:
5137 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
5139 case LTGT_EXPR:
5140 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
5142 case COND_EXPR:
5143 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
5145 case COMPLEX_EXPR:
5146 gcc_assert (COMPLEX_MODE_P (mode));
5147 if (GET_MODE (op0) == VOIDmode)
5148 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
5149 if (GET_MODE (op1) == VOIDmode)
5150 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
5151 return gen_rtx_CONCAT (mode, op0, op1);
5153 case CONJ_EXPR:
5154 if (GET_CODE (op0) == CONCAT)
5155 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
5156 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
5157 XEXP (op0, 1),
5158 GET_MODE_INNER (mode)));
5159 else
5161 scalar_mode imode = GET_MODE_INNER (mode);
5162 rtx re, im;
5164 if (MEM_P (op0))
5166 re = adjust_address_nv (op0, imode, 0);
5167 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
5169 else
5171 scalar_int_mode ifmode;
5172 scalar_int_mode ihmode;
5173 rtx halfsize;
5174 if (!int_mode_for_mode (mode).exists (&ifmode)
5175 || !int_mode_for_mode (imode).exists (&ihmode))
5176 return NULL;
5177 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
5178 re = op0;
5179 if (mode != ifmode)
5180 re = gen_rtx_SUBREG (ifmode, re, 0);
5181 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
5182 if (imode != ihmode)
5183 re = gen_rtx_SUBREG (imode, re, 0);
5184 im = copy_rtx (op0);
5185 if (mode != ifmode)
5186 im = gen_rtx_SUBREG (ifmode, im, 0);
5187 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
5188 if (imode != ihmode)
5189 im = gen_rtx_SUBREG (imode, im, 0);
5191 im = gen_rtx_NEG (imode, im);
5192 return gen_rtx_CONCAT (mode, re, im);
5195 case ADDR_EXPR:
5196 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
5197 if (!op0 || !MEM_P (op0))
5199 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
5200 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
5201 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
5202 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
5203 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
5204 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
5206 if (handled_component_p (TREE_OPERAND (exp, 0)))
5208 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
5209 bool reverse;
5210 tree decl
5211 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
5212 &bitsize, &maxsize, &reverse);
5213 if ((VAR_P (decl)
5214 || TREE_CODE (decl) == PARM_DECL
5215 || TREE_CODE (decl) == RESULT_DECL)
5216 && (!TREE_ADDRESSABLE (decl)
5217 || target_for_debug_bind (decl))
5218 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
5219 && known_gt (bitsize, 0)
5220 && known_eq (bitsize, maxsize))
5222 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
5223 return plus_constant (mode, base, byteoffset);
5227 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
5228 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
5229 == ADDR_EXPR)
5231 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5232 0));
5233 if (op0 != NULL
5234 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
5235 || (GET_CODE (op0) == PLUS
5236 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
5237 && CONST_INT_P (XEXP (op0, 1)))))
5239 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5240 1));
5241 poly_int64 offset;
5242 if (!op1 || !poly_int_rtx_p (op1, &offset))
5243 return NULL;
5245 return plus_constant (mode, op0, offset);
5249 return NULL;
5252 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
5253 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
5254 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
5256 return op0;
5258 case VECTOR_CST:
5260 unsigned HOST_WIDE_INT i, nelts;
5262 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
5263 return NULL;
5265 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5267 for (i = 0; i < nelts; ++i)
5269 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5270 if (!op1)
5271 return NULL;
5272 XVECEXP (op0, 0, i) = op1;
5275 return op0;
5278 case CONSTRUCTOR:
5279 if (TREE_CLOBBER_P (exp))
5280 return NULL;
5281 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5283 unsigned i;
5284 unsigned HOST_WIDE_INT nelts;
5285 tree val;
5287 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5288 goto flag_unsupported;
5290 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5292 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5294 op1 = expand_debug_expr (val);
5295 if (!op1)
5296 return NULL;
5297 XVECEXP (op0, 0, i) = op1;
5300 if (i < nelts)
5302 op1 = expand_debug_expr
5303 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5305 if (!op1)
5306 return NULL;
5308 for (; i < nelts; i++)
5309 XVECEXP (op0, 0, i) = op1;
5312 return op0;
5314 else
5315 goto flag_unsupported;
5317 case CALL_EXPR:
5318 /* ??? Maybe handle some builtins? */
5319 return NULL;
5321 case SSA_NAME:
5323 gimple *g = get_gimple_for_ssa_name (exp);
5324 if (g)
5326 tree t = NULL_TREE;
5327 if (deep_ter_debug_map)
5329 tree *slot = deep_ter_debug_map->get (exp);
5330 if (slot)
5331 t = *slot;
5333 if (t == NULL_TREE)
5334 t = gimple_assign_rhs_to_tree (g);
5335 op0 = expand_debug_expr (t);
5336 if (!op0)
5337 return NULL;
5339 else
5341 /* If this is a reference to an incoming value of
5342 parameter that is never used in the code or where the
5343 incoming value is never used in the code, use
5344 PARM_DECL's DECL_RTL if set. */
5345 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5346 && SSA_NAME_VAR (exp)
5347 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5348 && has_zero_uses (exp))
5350 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5351 if (op0)
5352 goto adjust_mode;
5353 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5354 if (op0)
5355 goto adjust_mode;
5358 int part = var_to_partition (SA.map, exp);
5360 if (part == NO_PARTITION)
5361 return NULL;
5363 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5365 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5367 goto adjust_mode;
5370 case ERROR_MARK:
5371 return NULL;
5373 /* Vector stuff. For most of the codes we don't have rtl codes. */
5374 case REALIGN_LOAD_EXPR:
5375 case VEC_COND_EXPR:
5376 case VEC_PACK_FIX_TRUNC_EXPR:
5377 case VEC_PACK_FLOAT_EXPR:
5378 case VEC_PACK_SAT_EXPR:
5379 case VEC_PACK_TRUNC_EXPR:
5380 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5381 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5382 case VEC_UNPACK_FLOAT_HI_EXPR:
5383 case VEC_UNPACK_FLOAT_LO_EXPR:
5384 case VEC_UNPACK_HI_EXPR:
5385 case VEC_UNPACK_LO_EXPR:
5386 case VEC_WIDEN_MULT_HI_EXPR:
5387 case VEC_WIDEN_MULT_LO_EXPR:
5388 case VEC_WIDEN_MULT_EVEN_EXPR:
5389 case VEC_WIDEN_MULT_ODD_EXPR:
5390 case VEC_WIDEN_LSHIFT_HI_EXPR:
5391 case VEC_WIDEN_LSHIFT_LO_EXPR:
5392 case VEC_PERM_EXPR:
5393 case VEC_DUPLICATE_EXPR:
5394 case VEC_SERIES_EXPR:
5395 case SAD_EXPR:
5396 return NULL;
5398 /* Misc codes. */
5399 case ADDR_SPACE_CONVERT_EXPR:
5400 case FIXED_CONVERT_EXPR:
5401 case OBJ_TYPE_REF:
5402 case WITH_SIZE_EXPR:
5403 case BIT_INSERT_EXPR:
5404 return NULL;
5406 case DOT_PROD_EXPR:
5407 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5408 && SCALAR_INT_MODE_P (mode))
5411 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5412 0)))
5413 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5414 inner_mode);
5416 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5417 1)))
5418 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5419 inner_mode);
5420 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5421 return simplify_gen_binary (PLUS, mode, op0, op2);
5423 return NULL;
5425 case WIDEN_MULT_EXPR:
5426 case WIDEN_MULT_PLUS_EXPR:
5427 case WIDEN_MULT_MINUS_EXPR:
5428 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5429 && SCALAR_INT_MODE_P (mode))
5431 inner_mode = GET_MODE (op0);
5432 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5433 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5434 else
5435 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5436 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5437 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5438 else
5439 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5440 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5441 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5442 return op0;
5443 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5444 return simplify_gen_binary (PLUS, mode, op0, op2);
5445 else
5446 return simplify_gen_binary (MINUS, mode, op2, op0);
5448 return NULL;
5450 case MULT_HIGHPART_EXPR:
5451 /* ??? Similar to the above. */
5452 return NULL;
5454 case WIDEN_SUM_EXPR:
5455 case WIDEN_LSHIFT_EXPR:
5456 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5457 && SCALAR_INT_MODE_P (mode))
5460 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5461 0)))
5462 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5463 inner_mode);
5464 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5465 ? ASHIFT : PLUS, mode, op0, op1);
5467 return NULL;
5469 default:
5470 flag_unsupported:
5471 if (flag_checking)
5473 debug_tree (exp);
5474 gcc_unreachable ();
5476 return NULL;
5480 /* Return an RTX equivalent to the source bind value of the tree expression
5481 EXP. */
5483 static rtx
5484 expand_debug_source_expr (tree exp)
5486 rtx op0 = NULL_RTX;
5487 machine_mode mode = VOIDmode, inner_mode;
5489 switch (TREE_CODE (exp))
5491 case VAR_DECL:
5492 if (DECL_ABSTRACT_ORIGIN (exp))
5493 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5494 break;
5495 case PARM_DECL:
5497 mode = DECL_MODE (exp);
5498 op0 = expand_debug_parm_decl (exp);
5499 if (op0)
5500 break;
5501 /* See if this isn't an argument that has been completely
5502 optimized out. */
5503 if (!DECL_RTL_SET_P (exp)
5504 && !DECL_INCOMING_RTL (exp)
5505 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5507 tree aexp = DECL_ORIGIN (exp);
5508 if (DECL_CONTEXT (aexp)
5509 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5511 vec<tree, va_gc> **debug_args;
5512 unsigned int ix;
5513 tree ddecl;
5514 debug_args = decl_debug_args_lookup (current_function_decl);
5515 if (debug_args != NULL)
5517 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5518 ix += 2)
5519 if (ddecl == aexp)
5520 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5524 break;
5526 default:
5527 break;
5530 if (op0 == NULL_RTX)
5531 return NULL_RTX;
5533 inner_mode = GET_MODE (op0);
5534 if (mode == inner_mode)
5535 return op0;
5537 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5539 if (GET_MODE_UNIT_BITSIZE (mode)
5540 == GET_MODE_UNIT_BITSIZE (inner_mode))
5541 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5542 else if (GET_MODE_UNIT_BITSIZE (mode)
5543 < GET_MODE_UNIT_BITSIZE (inner_mode))
5544 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5545 else
5546 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5548 else if (FLOAT_MODE_P (mode))
5549 gcc_unreachable ();
5550 else if (FLOAT_MODE_P (inner_mode))
5552 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5553 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5554 else
5555 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5557 else if (GET_MODE_UNIT_PRECISION (mode)
5558 == GET_MODE_UNIT_PRECISION (inner_mode))
5559 op0 = lowpart_subreg (mode, op0, inner_mode);
5560 else if (GET_MODE_UNIT_PRECISION (mode)
5561 < GET_MODE_UNIT_PRECISION (inner_mode))
5562 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5563 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5564 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5565 else
5566 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5568 return op0;
5571 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5572 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5573 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5575 static void
5576 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5578 rtx exp = *exp_p;
5580 if (exp == NULL_RTX)
5581 return;
5583 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5584 return;
5586 if (depth == 4)
5588 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5589 rtx dval = make_debug_expr_from_rtl (exp);
5591 /* Emit a debug bind insn before INSN. */
5592 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5593 DEBUG_EXPR_TREE_DECL (dval), exp,
5594 VAR_INIT_STATUS_INITIALIZED);
5596 emit_debug_insn_before (bind, insn);
5597 *exp_p = dval;
5598 return;
5601 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5602 int i, j;
5603 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5604 switch (*format_ptr++)
5606 case 'e':
5607 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5608 break;
5610 case 'E':
5611 case 'V':
5612 for (j = 0; j < XVECLEN (exp, i); j++)
5613 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5614 break;
5616 default:
5617 break;
5621 /* Expand the _LOCs in debug insns. We run this after expanding all
5622 regular insns, so that any variables referenced in the function
5623 will have their DECL_RTLs set. */
5625 static void
5626 expand_debug_locations (void)
5628 rtx_insn *insn;
5629 rtx_insn *last = get_last_insn ();
5630 int save_strict_alias = flag_strict_aliasing;
5632 /* New alias sets while setting up memory attributes cause
5633 -fcompare-debug failures, even though it doesn't bring about any
5634 codegen changes. */
5635 flag_strict_aliasing = 0;
5637 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5638 if (DEBUG_BIND_INSN_P (insn))
5640 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5641 rtx val;
5642 rtx_insn *prev_insn, *insn2;
5643 machine_mode mode;
5645 if (value == NULL_TREE)
5646 val = NULL_RTX;
5647 else
5649 if (INSN_VAR_LOCATION_STATUS (insn)
5650 == VAR_INIT_STATUS_UNINITIALIZED)
5651 val = expand_debug_source_expr (value);
5652 /* The avoid_deep_ter_for_debug function inserts
5653 debug bind stmts after SSA_NAME definition, with the
5654 SSA_NAME as the whole bind location. Disable temporarily
5655 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5656 being defined in this DEBUG_INSN. */
5657 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5659 tree *slot = deep_ter_debug_map->get (value);
5660 if (slot)
5662 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5663 *slot = NULL_TREE;
5664 else
5665 slot = NULL;
5667 val = expand_debug_expr (value);
5668 if (slot)
5669 *slot = INSN_VAR_LOCATION_DECL (insn);
5671 else
5672 val = expand_debug_expr (value);
5673 gcc_assert (last == get_last_insn ());
5676 if (!val)
5677 val = gen_rtx_UNKNOWN_VAR_LOC ();
5678 else
5680 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5682 gcc_assert (mode == GET_MODE (val)
5683 || (GET_MODE (val) == VOIDmode
5684 && (CONST_SCALAR_INT_P (val)
5685 || GET_CODE (val) == CONST_FIXED
5686 || GET_CODE (val) == LABEL_REF)));
5689 INSN_VAR_LOCATION_LOC (insn) = val;
5690 prev_insn = PREV_INSN (insn);
5691 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5692 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5695 flag_strict_aliasing = save_strict_alias;
5698 /* Performs swapping operands of commutative operations to expand
5699 the expensive one first. */
5701 static void
5702 reorder_operands (basic_block bb)
5704 unsigned int *lattice; /* Hold cost of each statement. */
5705 unsigned int i = 0, n = 0;
5706 gimple_stmt_iterator gsi;
5707 gimple_seq stmts;
5708 gimple *stmt;
5709 bool swap;
5710 tree op0, op1;
5711 ssa_op_iter iter;
5712 use_operand_p use_p;
5713 gimple *def0, *def1;
5715 /* Compute cost of each statement using estimate_num_insns. */
5716 stmts = bb_seq (bb);
5717 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5719 stmt = gsi_stmt (gsi);
5720 if (!is_gimple_debug (stmt))
5721 gimple_set_uid (stmt, n++);
5723 lattice = XNEWVEC (unsigned int, n);
5724 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5726 unsigned cost;
5727 stmt = gsi_stmt (gsi);
5728 if (is_gimple_debug (stmt))
5729 continue;
5730 cost = estimate_num_insns (stmt, &eni_size_weights);
5731 lattice[i] = cost;
5732 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5734 tree use = USE_FROM_PTR (use_p);
5735 gimple *def_stmt;
5736 if (TREE_CODE (use) != SSA_NAME)
5737 continue;
5738 def_stmt = get_gimple_for_ssa_name (use);
5739 if (!def_stmt)
5740 continue;
5741 lattice[i] += lattice[gimple_uid (def_stmt)];
5743 i++;
5744 if (!is_gimple_assign (stmt)
5745 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5746 continue;
5747 op0 = gimple_op (stmt, 1);
5748 op1 = gimple_op (stmt, 2);
5749 if (TREE_CODE (op0) != SSA_NAME
5750 || TREE_CODE (op1) != SSA_NAME)
5751 continue;
5752 /* Swap operands if the second one is more expensive. */
5753 def0 = get_gimple_for_ssa_name (op0);
5754 def1 = get_gimple_for_ssa_name (op1);
5755 if (!def1)
5756 continue;
5757 swap = false;
5758 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5759 swap = true;
5760 if (swap)
5762 if (dump_file && (dump_flags & TDF_DETAILS))
5764 fprintf (dump_file, "Swap operands in stmt:\n");
5765 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5766 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5767 def0 ? lattice[gimple_uid (def0)] : 0,
5768 lattice[gimple_uid (def1)]);
5770 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5771 gimple_assign_rhs2_ptr (stmt));
5774 XDELETE (lattice);
5777 /* Expand basic block BB from GIMPLE trees to RTL. */
5779 static basic_block
5780 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5782 gimple_stmt_iterator gsi;
5783 gimple_seq stmts;
5784 gimple *stmt = NULL;
5785 rtx_note *note = NULL;
5786 rtx_insn *last;
5787 edge e;
5788 edge_iterator ei;
5789 bool nondebug_stmt_seen = false;
5791 if (dump_file)
5792 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5793 bb->index);
5795 /* Note that since we are now transitioning from GIMPLE to RTL, we
5796 cannot use the gsi_*_bb() routines because they expect the basic
5797 block to be in GIMPLE, instead of RTL. Therefore, we need to
5798 access the BB sequence directly. */
5799 if (optimize)
5800 reorder_operands (bb);
5801 stmts = bb_seq (bb);
5802 bb->il.gimple.seq = NULL;
5803 bb->il.gimple.phi_nodes = NULL;
5804 rtl_profile_for_bb (bb);
5805 init_rtl_bb_info (bb);
5806 bb->flags |= BB_RTL;
5808 /* Remove the RETURN_EXPR if we may fall though to the exit
5809 instead. */
5810 gsi = gsi_last (stmts);
5811 if (!gsi_end_p (gsi)
5812 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5814 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5816 gcc_assert (single_succ_p (bb));
5817 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5819 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5820 && !gimple_return_retval (ret_stmt))
5822 gsi_remove (&gsi, false);
5823 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5827 gsi = gsi_start (stmts);
5828 if (!gsi_end_p (gsi))
5830 stmt = gsi_stmt (gsi);
5831 if (gimple_code (stmt) != GIMPLE_LABEL)
5832 stmt = NULL;
5835 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5837 if (stmt || elt)
5839 gcc_checking_assert (!note);
5840 last = get_last_insn ();
5842 if (stmt)
5844 expand_gimple_stmt (stmt);
5845 gsi_next (&gsi);
5848 if (elt)
5849 emit_label (*elt);
5851 BB_HEAD (bb) = NEXT_INSN (last);
5852 if (NOTE_P (BB_HEAD (bb)))
5853 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5854 gcc_assert (LABEL_P (BB_HEAD (bb)));
5855 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5857 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5859 else
5860 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5862 if (note)
5863 NOTE_BASIC_BLOCK (note) = bb;
5865 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5867 basic_block new_bb;
5869 stmt = gsi_stmt (gsi);
5870 if (!is_gimple_debug (stmt))
5871 nondebug_stmt_seen = true;
5873 /* If this statement is a non-debug one, and we generate debug
5874 insns, then this one might be the last real use of a TERed
5875 SSA_NAME, but where there are still some debug uses further
5876 down. Expanding the current SSA name in such further debug
5877 uses by their RHS might lead to wrong debug info, as coalescing
5878 might make the operands of such RHS be placed into the same
5879 pseudo as something else. Like so:
5880 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5881 use(a_1);
5882 a_2 = ...
5883 #DEBUG ... => a_1
5884 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5885 If we now would expand a_1 by it's RHS (a_0 + 1) in the debug use,
5886 the write to a_2 would actually have clobbered the place which
5887 formerly held a_0.
5889 So, instead of that, we recognize the situation, and generate
5890 debug temporaries at the last real use of TERed SSA names:
5891 a_1 = a_0 + 1;
5892 #DEBUG #D1 => a_1
5893 use(a_1);
5894 a_2 = ...
5895 #DEBUG ... => #D1
5897 if (MAY_HAVE_DEBUG_BIND_INSNS
5898 && SA.values
5899 && !is_gimple_debug (stmt))
5901 ssa_op_iter iter;
5902 tree op;
5903 gimple *def;
5905 location_t sloc = curr_insn_location ();
5907 /* Look for SSA names that have their last use here (TERed
5908 names always have only one real use). */
5909 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5910 if ((def = get_gimple_for_ssa_name (op)))
5912 imm_use_iterator imm_iter;
5913 use_operand_p use_p;
5914 bool have_debug_uses = false;
5916 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5918 if (gimple_debug_bind_p (USE_STMT (use_p)))
5920 have_debug_uses = true;
5921 break;
5925 if (have_debug_uses)
5927 /* OP is a TERed SSA name, with DEF its defining
5928 statement, and where OP is used in further debug
5929 instructions. Generate a debug temporary, and
5930 replace all uses of OP in debug insns with that
5931 temporary. */
5932 gimple *debugstmt;
5933 tree value = gimple_assign_rhs_to_tree (def);
5934 tree vexpr = build_debug_expr_decl (TREE_TYPE (value));
5935 rtx val;
5936 machine_mode mode;
5938 set_curr_insn_location (gimple_location (def));
5940 if (DECL_P (value))
5941 mode = DECL_MODE (value);
5942 else
5943 mode = TYPE_MODE (TREE_TYPE (value));
5944 /* FIXME: Is setting the mode really necessary? */
5945 SET_DECL_MODE (vexpr, mode);
5947 val = gen_rtx_VAR_LOCATION
5948 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5950 emit_debug_insn (val);
5952 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5954 if (!gimple_debug_bind_p (debugstmt))
5955 continue;
5957 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5958 SET_USE (use_p, vexpr);
5960 update_stmt (debugstmt);
5964 set_curr_insn_location (sloc);
5967 currently_expanding_gimple_stmt = stmt;
5969 /* Expand this statement, then evaluate the resulting RTL and
5970 fixup the CFG accordingly. */
5971 if (gimple_code (stmt) == GIMPLE_COND)
5973 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5974 if (new_bb)
5976 currently_expanding_gimple_stmt = NULL;
5977 return new_bb;
5980 else if (is_gimple_debug (stmt))
5982 location_t sloc = curr_insn_location ();
5983 gimple_stmt_iterator nsi = gsi;
5985 for (;;)
5987 tree var;
5988 tree value = NULL_TREE;
5989 rtx val = NULL_RTX;
5990 machine_mode mode;
5992 if (!gimple_debug_nonbind_marker_p (stmt))
5994 if (gimple_debug_bind_p (stmt))
5996 var = gimple_debug_bind_get_var (stmt);
5998 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5999 && TREE_CODE (var) != LABEL_DECL
6000 && !target_for_debug_bind (var))
6001 goto delink_debug_stmt;
6003 if (DECL_P (var) && !VECTOR_TYPE_P (TREE_TYPE (var)))
6004 mode = DECL_MODE (var);
6005 else
6006 mode = TYPE_MODE (TREE_TYPE (var));
6008 if (gimple_debug_bind_has_value_p (stmt))
6009 value = gimple_debug_bind_get_value (stmt);
6011 val = gen_rtx_VAR_LOCATION
6012 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
6014 else if (gimple_debug_source_bind_p (stmt))
6016 var = gimple_debug_source_bind_get_var (stmt);
6018 value = gimple_debug_source_bind_get_value (stmt);
6020 if (!VECTOR_TYPE_P (TREE_TYPE (var)))
6021 mode = DECL_MODE (var);
6022 else
6023 mode = TYPE_MODE (TREE_TYPE (var));
6025 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
6026 VAR_INIT_STATUS_UNINITIALIZED);
6028 else
6029 gcc_unreachable ();
6031 /* If this function was first compiled with markers
6032 enabled, but they're now disable (e.g. LTO), drop
6033 them on the floor. */
6034 else if (gimple_debug_nonbind_marker_p (stmt)
6035 && !MAY_HAVE_DEBUG_MARKER_INSNS)
6036 goto delink_debug_stmt;
6037 else if (gimple_debug_begin_stmt_p (stmt))
6038 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
6039 else if (gimple_debug_inline_entry_p (stmt))
6040 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
6041 else
6042 gcc_unreachable ();
6044 last = get_last_insn ();
6046 set_curr_insn_location (gimple_location (stmt));
6048 emit_debug_insn (val);
6050 if (dump_file && (dump_flags & TDF_DETAILS))
6052 /* We can't dump the insn with a TREE where an RTX
6053 is expected. */
6054 if (GET_CODE (val) == VAR_LOCATION)
6056 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
6057 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
6059 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6060 if (GET_CODE (val) == VAR_LOCATION)
6061 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
6064 delink_debug_stmt:
6065 /* In order not to generate too many debug temporaries,
6066 we delink all uses of debug statements we already expanded.
6067 Therefore debug statements between definition and real
6068 use of TERed SSA names will continue to use the SSA name,
6069 and not be replaced with debug temps. */
6070 delink_stmt_imm_use (stmt);
6072 gsi = nsi;
6073 gsi_next (&nsi);
6074 if (gsi_end_p (nsi))
6075 break;
6076 stmt = gsi_stmt (nsi);
6077 if (!is_gimple_debug (stmt))
6078 break;
6081 set_curr_insn_location (sloc);
6083 else
6085 gcall *call_stmt = dyn_cast <gcall *> (stmt);
6086 if (call_stmt
6087 && gimple_call_tail_p (call_stmt)
6088 && disable_tail_calls)
6089 gimple_call_set_tail (call_stmt, false);
6091 if (call_stmt && gimple_call_tail_p (call_stmt))
6093 bool can_fallthru;
6094 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
6095 if (new_bb)
6097 if (can_fallthru)
6098 bb = new_bb;
6099 else
6101 currently_expanding_gimple_stmt = NULL;
6102 return new_bb;
6106 else
6108 def_operand_p def_p;
6109 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
6111 if (def_p != NULL)
6113 /* Ignore this stmt if it is in the list of
6114 replaceable expressions. */
6115 if (SA.values
6116 && bitmap_bit_p (SA.values,
6117 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
6118 continue;
6120 last = expand_gimple_stmt (stmt);
6121 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6126 currently_expanding_gimple_stmt = NULL;
6128 /* Expand implicit goto and convert goto_locus. */
6129 FOR_EACH_EDGE (e, ei, bb->succs)
6131 if (e->goto_locus != UNKNOWN_LOCATION || !nondebug_stmt_seen)
6132 set_curr_insn_location (e->goto_locus);
6133 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
6135 emit_jump (label_rtx_for_bb (e->dest));
6136 e->flags &= ~EDGE_FALLTHRU;
6140 /* Expanded RTL can create a jump in the last instruction of block.
6141 This later might be assumed to be a jump to successor and break edge insertion.
6142 We need to insert dummy move to prevent this. PR41440. */
6143 if (single_succ_p (bb)
6144 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
6145 && (last = get_last_insn ())
6146 && (JUMP_P (last)
6147 || (DEBUG_INSN_P (last)
6148 && JUMP_P (prev_nondebug_insn (last)))))
6150 rtx dummy = gen_reg_rtx (SImode);
6151 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
6154 do_pending_stack_adjust ();
6156 /* Find the block tail. The last insn in the block is the insn
6157 before a barrier and/or table jump insn. */
6158 last = get_last_insn ();
6159 if (BARRIER_P (last))
6160 last = PREV_INSN (last);
6161 if (JUMP_TABLE_DATA_P (last))
6162 last = PREV_INSN (PREV_INSN (last));
6163 if (BARRIER_P (last))
6164 last = PREV_INSN (last);
6165 BB_END (bb) = last;
6167 update_bb_for_insn (bb);
6169 return bb;
6173 /* Create a basic block for initialization code. */
6175 static basic_block
6176 construct_init_block (void)
6178 basic_block init_block, first_block;
6179 edge e = NULL;
6180 int flags;
6182 /* Multiple entry points not supported yet. */
6183 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
6184 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
6185 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
6186 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6187 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6189 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
6191 /* When entry edge points to first basic block, we don't need jump,
6192 otherwise we have to jump into proper target. */
6193 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
6195 tree label = gimple_block_label (e->dest);
6197 emit_jump (jump_target_rtx (label));
6198 flags = 0;
6200 else
6201 flags = EDGE_FALLTHRU;
6203 init_block = create_basic_block (NEXT_INSN (get_insns ()),
6204 get_last_insn (),
6205 ENTRY_BLOCK_PTR_FOR_FN (cfun));
6206 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
6207 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6208 if (e)
6210 first_block = e->dest;
6211 redirect_edge_succ (e, init_block);
6212 make_single_succ_edge (init_block, first_block, flags);
6214 else
6215 make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6216 EDGE_FALLTHRU);
6218 update_bb_for_insn (init_block);
6219 return init_block;
6222 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
6223 found in the block tree. */
6225 static void
6226 set_block_levels (tree block, int level)
6228 while (block)
6230 BLOCK_NUMBER (block) = level;
6231 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
6232 block = BLOCK_CHAIN (block);
6236 /* Create a block containing landing pads and similar stuff. */
6238 static void
6239 construct_exit_block (void)
6241 rtx_insn *head = get_last_insn ();
6242 rtx_insn *end;
6243 basic_block exit_block;
6244 edge e, e2;
6245 unsigned ix;
6246 edge_iterator ei;
6247 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
6248 rtx_insn *orig_end = BB_END (prev_bb);
6250 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
6252 /* Make sure the locus is set to the end of the function, so that
6253 epilogue line numbers and warnings are set properly. */
6254 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
6255 input_location = cfun->function_end_locus;
6257 /* Generate rtl for function exit. */
6258 expand_function_end ();
6260 end = get_last_insn ();
6261 if (head == end)
6262 return;
6263 /* While emitting the function end we could move end of the last basic
6264 block. */
6265 BB_END (prev_bb) = orig_end;
6266 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
6267 head = NEXT_INSN (head);
6268 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
6269 bb count counting will be confused. Any instructions before that
6270 label are emitted for the case where PREV_BB falls through into the
6271 exit block, so append those instructions to prev_bb in that case. */
6272 if (NEXT_INSN (head) != return_label)
6274 while (NEXT_INSN (head) != return_label)
6276 if (!NOTE_P (NEXT_INSN (head)))
6277 BB_END (prev_bb) = NEXT_INSN (head);
6278 head = NEXT_INSN (head);
6281 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6282 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6283 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6285 ix = 0;
6286 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6288 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6289 if (!(e->flags & EDGE_ABNORMAL))
6290 redirect_edge_succ (e, exit_block);
6291 else
6292 ix++;
6295 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6296 EDGE_FALLTHRU);
6297 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6298 if (e2 != e)
6300 exit_block->count -= e2->count ();
6302 update_bb_for_insn (exit_block);
6305 /* Helper function for discover_nonconstant_array_refs.
6306 Look for ARRAY_REF nodes with non-constant indexes and mark them
6307 addressable. */
6309 static tree
6310 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6311 void *data)
6313 tree t = *tp;
6314 bitmap forced_stack_vars = (bitmap)((walk_stmt_info *)data)->info;
6316 if (IS_TYPE_OR_DECL_P (t))
6317 *walk_subtrees = 0;
6318 else if (REFERENCE_CLASS_P (t) && TREE_THIS_VOLATILE (t))
6320 t = get_base_address (t);
6321 if (t && DECL_P (t)
6322 && DECL_MODE (t) != BLKmode
6323 && !TREE_ADDRESSABLE (t))
6324 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6325 *walk_subtrees = 0;
6327 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6329 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6330 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6331 && (!TREE_OPERAND (t, 2)
6332 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6333 || (TREE_CODE (t) == COMPONENT_REF
6334 && (!TREE_OPERAND (t,2)
6335 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6336 || TREE_CODE (t) == BIT_FIELD_REF
6337 || TREE_CODE (t) == REALPART_EXPR
6338 || TREE_CODE (t) == IMAGPART_EXPR
6339 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6340 || CONVERT_EXPR_P (t))
6341 t = TREE_OPERAND (t, 0);
6343 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6345 t = get_base_address (t);
6346 if (t && DECL_P (t)
6347 && DECL_MODE (t) != BLKmode
6348 && !TREE_ADDRESSABLE (t))
6349 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6352 *walk_subtrees = 0;
6354 /* References of size POLY_INT_CST to a fixed-size object must go
6355 through memory. It's more efficient to force that here than
6356 to create temporary slots on the fly.
6357 RTL expansion expectes TARGET_MEM_REF to always address actual memory. */
6358 else if (TREE_CODE (t) == TARGET_MEM_REF
6359 || (TREE_CODE (t) == MEM_REF
6360 && TYPE_SIZE (TREE_TYPE (t))
6361 && POLY_INT_CST_P (TYPE_SIZE (TREE_TYPE (t)))))
6363 tree base = get_base_address (t);
6364 if (base
6365 && DECL_P (base)
6366 && !TREE_ADDRESSABLE (base)
6367 && DECL_MODE (base) != BLKmode
6368 && GET_MODE_SIZE (DECL_MODE (base)).is_constant ())
6369 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6370 *walk_subtrees = 0;
6373 return NULL_TREE;
6376 /* If there's a chance to get a pseudo for t then if it would be of float mode
6377 and the actual access is via an integer mode (lowered memcpy or similar
6378 access) then avoid the register expansion if the mode likely is not storage
6379 suitable for raw bits processing (like XFmode on i?86). */
6381 static void
6382 avoid_type_punning_on_regs (tree t, bitmap forced_stack_vars)
6384 machine_mode access_mode = TYPE_MODE (TREE_TYPE (t));
6385 if (access_mode != BLKmode
6386 && !SCALAR_INT_MODE_P (access_mode))
6387 return;
6388 tree base = get_base_address (t);
6389 if (DECL_P (base)
6390 && !TREE_ADDRESSABLE (base)
6391 && FLOAT_MODE_P (DECL_MODE (base))
6392 && maybe_lt (GET_MODE_PRECISION (DECL_MODE (base)),
6393 GET_MODE_BITSIZE (GET_MODE_INNER (DECL_MODE (base))))
6394 /* Double check in the expensive way we really would get a pseudo. */
6395 && use_register_for_decl (base))
6396 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6399 /* RTL expansion is not able to compile array references with variable
6400 offsets for arrays stored in single register. Discover such
6401 expressions and mark variables as addressable to avoid this
6402 scenario. */
6404 static void
6405 discover_nonconstant_array_refs (bitmap forced_stack_vars)
6407 basic_block bb;
6408 gimple_stmt_iterator gsi;
6410 walk_stmt_info wi = {};
6411 wi.info = forced_stack_vars;
6412 FOR_EACH_BB_FN (bb, cfun)
6413 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6415 gimple *stmt = gsi_stmt (gsi);
6416 if (!is_gimple_debug (stmt))
6418 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, &wi);
6419 gcall *call = dyn_cast <gcall *> (stmt);
6420 if (call && gimple_call_internal_p (call))
6422 tree cand = NULL_TREE;
6423 switch (gimple_call_internal_fn (call))
6425 case IFN_LOAD_LANES:
6426 /* The source must be a MEM. */
6427 cand = gimple_call_arg (call, 0);
6428 break;
6429 case IFN_STORE_LANES:
6430 /* The destination must be a MEM. */
6431 cand = gimple_call_lhs (call);
6432 break;
6433 default:
6434 break;
6436 if (cand)
6437 cand = get_base_address (cand);
6438 if (cand
6439 && DECL_P (cand)
6440 && use_register_for_decl (cand))
6441 bitmap_set_bit (forced_stack_vars, DECL_UID (cand));
6443 if (gimple_vdef (stmt))
6445 tree t = gimple_get_lhs (stmt);
6446 if (t && REFERENCE_CLASS_P (t))
6447 avoid_type_punning_on_regs (t, forced_stack_vars);
6453 /* This function sets crtl->args.internal_arg_pointer to a virtual
6454 register if DRAP is needed. Local register allocator will replace
6455 virtual_incoming_args_rtx with the virtual register. */
6457 static void
6458 expand_stack_alignment (void)
6460 rtx drap_rtx;
6461 unsigned int preferred_stack_boundary;
6463 if (! SUPPORTS_STACK_ALIGNMENT)
6464 return;
6466 if (cfun->calls_alloca
6467 || cfun->has_nonlocal_label
6468 || crtl->has_nonlocal_goto)
6469 crtl->need_drap = true;
6471 /* Call update_stack_boundary here again to update incoming stack
6472 boundary. It may set incoming stack alignment to a different
6473 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6474 use the minimum incoming stack alignment to check if it is OK
6475 to perform sibcall optimization since sibcall optimization will
6476 only align the outgoing stack to incoming stack boundary. */
6477 if (targetm.calls.update_stack_boundary)
6478 targetm.calls.update_stack_boundary ();
6480 /* The incoming stack frame has to be aligned at least at
6481 parm_stack_boundary. */
6482 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6484 /* Update crtl->stack_alignment_estimated and use it later to align
6485 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6486 exceptions since callgraph doesn't collect incoming stack alignment
6487 in this case. */
6488 if (cfun->can_throw_non_call_exceptions
6489 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6490 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6491 else
6492 preferred_stack_boundary = crtl->preferred_stack_boundary;
6493 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6494 crtl->stack_alignment_estimated = preferred_stack_boundary;
6495 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6496 crtl->stack_alignment_needed = preferred_stack_boundary;
6498 gcc_assert (crtl->stack_alignment_needed
6499 <= crtl->stack_alignment_estimated);
6501 crtl->stack_realign_needed
6502 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6503 crtl->stack_realign_tried = crtl->stack_realign_needed;
6505 crtl->stack_realign_processed = true;
6507 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6508 alignment. */
6509 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6510 drap_rtx = targetm.calls.get_drap_rtx ();
6512 /* stack_realign_drap and drap_rtx must match. */
6513 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6515 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6516 if (drap_rtx != NULL)
6518 crtl->args.internal_arg_pointer = drap_rtx;
6520 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6521 needed. */
6522 fixup_tail_calls ();
6527 static void
6528 expand_main_function (void)
6530 #if (defined(INVOKE__main) \
6531 || (!defined(HAS_INIT_SECTION) \
6532 && !defined(INIT_SECTION_ASM_OP) \
6533 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6534 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6535 #endif
6539 /* Expand code to initialize the stack_protect_guard. This is invoked at
6540 the beginning of a function to be protected. */
6542 static void
6543 stack_protect_prologue (void)
6545 tree guard_decl = targetm.stack_protect_guard ();
6546 rtx x, y;
6548 crtl->stack_protect_guard_decl = guard_decl;
6549 x = expand_normal (crtl->stack_protect_guard);
6551 if (targetm.have_stack_protect_combined_set () && guard_decl)
6553 gcc_assert (DECL_P (guard_decl));
6554 y = DECL_RTL (guard_decl);
6556 /* Allow the target to compute address of Y and copy it to X without
6557 leaking Y into a register. This combined address + copy pattern
6558 allows the target to prevent spilling of any intermediate results by
6559 splitting it after register allocator. */
6560 if (rtx_insn *insn = targetm.gen_stack_protect_combined_set (x, y))
6562 emit_insn (insn);
6563 return;
6567 if (guard_decl)
6568 y = expand_normal (guard_decl);
6569 else
6570 y = const0_rtx;
6572 /* Allow the target to copy from Y to X without leaking Y into a
6573 register. */
6574 if (targetm.have_stack_protect_set ())
6575 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6577 emit_insn (insn);
6578 return;
6581 /* Otherwise do a straight move. */
6582 emit_move_insn (x, y);
6585 /* Translate the intermediate representation contained in the CFG
6586 from GIMPLE trees to RTL.
6588 We do conversion per basic block and preserve/update the tree CFG.
6589 This implies we have to do some magic as the CFG can simultaneously
6590 consist of basic blocks containing RTL and GIMPLE trees. This can
6591 confuse the CFG hooks, so be careful to not manipulate CFG during
6592 the expansion. */
6594 namespace {
6596 const pass_data pass_data_expand =
6598 RTL_PASS, /* type */
6599 "expand", /* name */
6600 OPTGROUP_NONE, /* optinfo_flags */
6601 TV_EXPAND, /* tv_id */
6602 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6603 | PROP_gimple_lcx
6604 | PROP_gimple_lvec
6605 | PROP_gimple_lva), /* properties_required */
6606 PROP_rtl, /* properties_provided */
6607 ( PROP_ssa | PROP_gimple ), /* properties_destroyed */
6608 0, /* todo_flags_start */
6609 0, /* todo_flags_finish */
6612 class pass_expand : public rtl_opt_pass
6614 public:
6615 pass_expand (gcc::context *ctxt)
6616 : rtl_opt_pass (pass_data_expand, ctxt)
6619 /* opt_pass methods: */
6620 unsigned int execute (function *) final override;
6622 }; // class pass_expand
6624 unsigned int
6625 pass_expand::execute (function *fun)
6627 basic_block bb, init_block;
6628 edge_iterator ei;
6629 edge e;
6630 rtx_insn *var_seq, *var_ret_seq;
6631 unsigned i;
6633 timevar_push (TV_OUT_OF_SSA);
6634 rewrite_out_of_ssa (&SA);
6635 timevar_pop (TV_OUT_OF_SSA);
6636 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6638 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6640 gimple_stmt_iterator gsi;
6641 FOR_EACH_BB_FN (bb, cfun)
6642 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6643 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6644 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6647 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6648 auto_bitmap forced_stack_vars;
6649 discover_nonconstant_array_refs (forced_stack_vars);
6651 /* Make sure all values used by the optimization passes have sane
6652 defaults. */
6653 reg_renumber = 0;
6655 /* Some backends want to know that we are expanding to RTL. */
6656 currently_expanding_to_rtl = 1;
6657 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6658 free_dominance_info (CDI_DOMINATORS);
6660 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6662 insn_locations_init ();
6663 if (!DECL_IS_UNDECLARED_BUILTIN (current_function_decl))
6665 /* Eventually, all FEs should explicitly set function_start_locus. */
6666 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6667 set_curr_insn_location
6668 (DECL_SOURCE_LOCATION (current_function_decl));
6669 else
6670 set_curr_insn_location (fun->function_start_locus);
6672 else
6673 set_curr_insn_location (UNKNOWN_LOCATION);
6674 prologue_location = curr_insn_location ();
6676 #ifdef INSN_SCHEDULING
6677 init_sched_attrs ();
6678 #endif
6680 /* Make sure first insn is a note even if we don't want linenums.
6681 This makes sure the first insn will never be deleted.
6682 Also, final expects a note to appear there. */
6683 emit_note (NOTE_INSN_DELETED);
6685 targetm.expand_to_rtl_hook ();
6686 crtl->init_stack_alignment ();
6687 fun->cfg->max_jumptable_ents = 0;
6689 /* Resovle the function section. Some targets, like ARM EABI rely on knowledge
6690 of the function section at exapnsion time to predict distance of calls. */
6691 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6693 /* Expand the variables recorded during gimple lowering. */
6694 timevar_push (TV_VAR_EXPAND);
6695 start_sequence ();
6697 var_ret_seq = expand_used_vars (forced_stack_vars);
6699 var_seq = get_insns ();
6700 end_sequence ();
6701 timevar_pop (TV_VAR_EXPAND);
6703 /* Honor stack protection warnings. */
6704 if (warn_stack_protect)
6706 if (fun->calls_alloca)
6707 warning (OPT_Wstack_protector,
6708 "stack protector not protecting local variables: "
6709 "variable length buffer");
6710 if (has_short_buffer && !crtl->stack_protect_guard)
6711 warning (OPT_Wstack_protector,
6712 "stack protector not protecting function: "
6713 "all local arrays are less than %d bytes long",
6714 (int) param_ssp_buffer_size);
6717 /* Temporarily mark PARM_DECLs and RESULT_DECLs we need to expand to
6718 memory addressable so expand_function_start can emit the required
6719 copies. */
6720 auto_vec<tree, 16> marked_parms;
6721 for (tree parm = DECL_ARGUMENTS (current_function_decl); parm;
6722 parm = DECL_CHAIN (parm))
6723 if (!TREE_ADDRESSABLE (parm)
6724 && bitmap_bit_p (forced_stack_vars, DECL_UID (parm)))
6726 TREE_ADDRESSABLE (parm) = 1;
6727 marked_parms.safe_push (parm);
6729 if (DECL_RESULT (current_function_decl)
6730 && !TREE_ADDRESSABLE (DECL_RESULT (current_function_decl))
6731 && bitmap_bit_p (forced_stack_vars,
6732 DECL_UID (DECL_RESULT (current_function_decl))))
6734 TREE_ADDRESSABLE (DECL_RESULT (current_function_decl)) = 1;
6735 marked_parms.safe_push (DECL_RESULT (current_function_decl));
6738 /* Set up parameters and prepare for return, for the function. */
6739 expand_function_start (current_function_decl);
6741 /* Clear TREE_ADDRESSABLE again. */
6742 while (!marked_parms.is_empty ())
6743 TREE_ADDRESSABLE (marked_parms.pop ()) = 0;
6745 /* If we emitted any instructions for setting up the variables,
6746 emit them before the FUNCTION_START note. */
6747 if (var_seq)
6749 emit_insn_before (var_seq, parm_birth_insn);
6751 /* In expand_function_end we'll insert the alloca save/restore
6752 before parm_birth_insn. We've just insertted an alloca call.
6753 Adjust the pointer to match. */
6754 parm_birth_insn = var_seq;
6757 /* Now propagate the RTL assignment of each partition to the
6758 underlying var of each SSA_NAME. */
6759 tree name;
6761 FOR_EACH_SSA_NAME (i, name, cfun)
6763 /* We might have generated new SSA names in
6764 update_alias_info_with_stack_vars. They will have a NULL
6765 defining statements, and won't be part of the partitioning,
6766 so ignore those. */
6767 if (!SSA_NAME_DEF_STMT (name))
6768 continue;
6770 adjust_one_expanded_partition_var (name);
6773 /* Clean up RTL of variables that straddle across multiple
6774 partitions, and check that the rtl of any PARM_DECLs that are not
6775 cleaned up is that of their default defs. */
6776 FOR_EACH_SSA_NAME (i, name, cfun)
6778 int part;
6780 /* We might have generated new SSA names in
6781 update_alias_info_with_stack_vars. They will have a NULL
6782 defining statements, and won't be part of the partitioning,
6783 so ignore those. */
6784 if (!SSA_NAME_DEF_STMT (name))
6785 continue;
6786 part = var_to_partition (SA.map, name);
6787 if (part == NO_PARTITION)
6788 continue;
6790 /* If this decl was marked as living in multiple places, reset
6791 this now to NULL. */
6792 tree var = SSA_NAME_VAR (name);
6793 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6794 SET_DECL_RTL (var, NULL);
6795 /* Check that the pseudos chosen by assign_parms are those of
6796 the corresponding default defs. */
6797 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6798 && (TREE_CODE (var) == PARM_DECL
6799 || TREE_CODE (var) == RESULT_DECL))
6801 rtx in = DECL_RTL_IF_SET (var);
6802 gcc_assert (in);
6803 rtx out = SA.partition_to_pseudo[part];
6804 gcc_assert (in == out);
6806 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6807 those expected by debug backends for each parm and for
6808 the result. This is particularly important for stabs,
6809 whose register elimination from parm's DECL_RTL may cause
6810 -fcompare-debug differences as SET_DECL_RTL changes reg's
6811 attrs. So, make sure the RTL already has the parm as the
6812 EXPR, so that it won't change. */
6813 SET_DECL_RTL (var, NULL_RTX);
6814 if (MEM_P (in))
6815 set_mem_attributes (in, var, true);
6816 SET_DECL_RTL (var, in);
6820 /* If this function is `main', emit a call to `__main'
6821 to run global initializers, etc. */
6822 if (DECL_NAME (current_function_decl)
6823 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6824 && DECL_FILE_SCOPE_P (current_function_decl))
6825 expand_main_function ();
6827 /* Initialize the stack_protect_guard field. This must happen after the
6828 call to __main (if any) so that the external decl is initialized. */
6829 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6830 stack_protect_prologue ();
6832 expand_phi_nodes (&SA);
6834 /* Release any stale SSA redirection data. */
6835 redirect_edge_var_map_empty ();
6837 /* Register rtl specific functions for cfg. */
6838 rtl_register_cfg_hooks ();
6840 init_block = construct_init_block ();
6842 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6843 remaining edges later. */
6844 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6845 e->flags &= ~EDGE_EXECUTABLE;
6847 /* If the function has too many markers, drop them while expanding. */
6848 if (cfun->debug_marker_count
6849 >= param_max_debug_marker_count)
6850 cfun->debug_nonbind_markers = false;
6852 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6853 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6854 next_bb)
6855 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6857 if (MAY_HAVE_DEBUG_BIND_INSNS)
6858 expand_debug_locations ();
6860 if (deep_ter_debug_map)
6862 delete deep_ter_debug_map;
6863 deep_ter_debug_map = NULL;
6866 /* Free stuff we no longer need after GIMPLE optimizations. */
6867 free_dominance_info (CDI_DOMINATORS);
6868 free_dominance_info (CDI_POST_DOMINATORS);
6869 delete_tree_cfg_annotations (fun);
6871 timevar_push (TV_OUT_OF_SSA);
6872 finish_out_of_ssa (&SA);
6873 timevar_pop (TV_OUT_OF_SSA);
6875 timevar_push (TV_POST_EXPAND);
6876 /* We are no longer in SSA form. */
6877 fun->gimple_df->in_ssa_p = false;
6878 loops_state_clear (LOOP_CLOSED_SSA);
6880 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6881 conservatively to true until they are all profile aware. */
6882 delete lab_rtx_for_bb;
6883 free_histograms (fun);
6885 construct_exit_block ();
6886 insn_locations_finalize ();
6888 if (var_ret_seq)
6890 rtx_insn *after = return_label;
6891 rtx_insn *next = NEXT_INSN (after);
6892 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6893 after = next;
6894 emit_insn_after (var_ret_seq, after);
6897 if (hwasan_sanitize_stack_p ())
6898 hwasan_maybe_emit_frame_base_init ();
6900 /* Zap the tree EH table. */
6901 set_eh_throw_stmt_table (fun, NULL);
6903 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6904 split edges which edge insertions might do. */
6905 rebuild_jump_labels (get_insns ());
6907 /* If we have a single successor to the entry block, put the pending insns
6908 after parm birth, but before NOTE_INSNS_FUNCTION_BEG. */
6909 if (single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6911 edge e = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (fun));
6912 if (e->insns.r)
6914 rtx_insn *insns = e->insns.r;
6915 e->insns.r = NULL;
6916 rebuild_jump_labels_chain (insns);
6917 if (NOTE_P (parm_birth_insn)
6918 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6919 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6920 else
6921 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6925 /* Otherwise, as well as for other edges, take the usual way. */
6926 commit_edge_insertions ();
6928 /* We're done expanding trees to RTL. */
6929 currently_expanding_to_rtl = 0;
6931 flush_mark_addressable_queue ();
6933 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6934 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6936 edge e;
6937 edge_iterator ei;
6938 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6940 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6941 e->flags &= ~EDGE_EXECUTABLE;
6943 /* At the moment not all abnormal edges match the RTL
6944 representation. It is safe to remove them here as
6945 find_many_sub_basic_blocks will rediscover them.
6946 In the future we should get this fixed properly. */
6947 if ((e->flags & EDGE_ABNORMAL)
6948 && !(e->flags & EDGE_SIBCALL))
6949 remove_edge (e);
6950 else
6951 ei_next (&ei);
6955 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6956 bitmap_ones (blocks);
6957 find_many_sub_basic_blocks (blocks);
6958 purge_all_dead_edges ();
6960 /* After initial rtl generation, call back to finish generating
6961 exception support code. We need to do this before cleaning up
6962 the CFG as the code does not expect dead landing pads. */
6963 if (fun->eh->region_tree != NULL)
6964 finish_eh_generation ();
6966 /* Call expand_stack_alignment after finishing all
6967 updates to crtl->preferred_stack_boundary. */
6968 expand_stack_alignment ();
6970 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6971 function. */
6972 if (crtl->tail_call_emit)
6973 fixup_tail_calls ();
6975 HOST_WIDE_INT patch_area_size, patch_area_entry;
6976 parse_and_check_patch_area (flag_patchable_function_entry, false,
6977 &patch_area_size, &patch_area_entry);
6979 tree patchable_function_entry_attr
6980 = lookup_attribute ("patchable_function_entry",
6981 DECL_ATTRIBUTES (cfun->decl));
6982 if (patchable_function_entry_attr)
6984 tree pp_val = TREE_VALUE (patchable_function_entry_attr);
6985 tree patchable_function_entry_value1 = TREE_VALUE (pp_val);
6987 patch_area_size = tree_to_uhwi (patchable_function_entry_value1);
6988 patch_area_entry = 0;
6989 if (TREE_CHAIN (pp_val) != NULL_TREE)
6991 tree patchable_function_entry_value2
6992 = TREE_VALUE (TREE_CHAIN (pp_val));
6993 patch_area_entry = tree_to_uhwi (patchable_function_entry_value2);
6997 if (patch_area_entry > patch_area_size)
6999 if (patch_area_size > 0)
7000 warning (OPT_Wattributes,
7001 "patchable function entry %wu exceeds size %wu",
7002 patch_area_entry, patch_area_size);
7003 patch_area_entry = 0;
7006 crtl->patch_area_size = patch_area_size;
7007 crtl->patch_area_entry = patch_area_entry;
7009 /* BB subdivision may have created basic blocks that are only reachable
7010 from unlikely bbs but not marked as such in the profile. */
7011 if (optimize)
7012 propagate_unlikely_bbs_forward ();
7014 /* Remove unreachable blocks, otherwise we cannot compute dominators
7015 which are needed for loop state verification. As a side-effect
7016 this also compacts blocks.
7017 ??? We cannot remove trivially dead insns here as for example
7018 the DRAP reg on i?86 is not magically live at this point.
7019 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
7020 cleanup_cfg (CLEANUP_NO_INSN_DEL);
7022 checking_verify_flow_info ();
7024 /* Initialize pseudos allocated for hard registers. */
7025 emit_initial_value_sets ();
7027 /* And finally unshare all RTL. */
7028 unshare_all_rtl ();
7030 /* There's no need to defer outputting this function any more; we
7031 know we want to output it. */
7032 DECL_DEFER_OUTPUT (current_function_decl) = 0;
7034 /* Now that we're done expanding trees to RTL, we shouldn't have any
7035 more CONCATs anywhere. */
7036 generating_concat_p = 0;
7038 if (dump_file)
7040 fprintf (dump_file,
7041 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
7042 /* And the pass manager will dump RTL for us. */
7045 /* If we're emitting a nested function, make sure its parent gets
7046 emitted as well. Doing otherwise confuses debug info. */
7048 tree parent;
7049 for (parent = DECL_CONTEXT (current_function_decl);
7050 parent != NULL_TREE;
7051 parent = get_containing_scope (parent))
7052 if (TREE_CODE (parent) == FUNCTION_DECL)
7053 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
7056 TREE_ASM_WRITTEN (current_function_decl) = 1;
7058 /* After expanding, the return labels are no longer needed. */
7059 return_label = NULL;
7060 naked_return_label = NULL;
7062 /* After expanding, the tm_restart map is no longer needed. */
7063 if (fun->gimple_df->tm_restart)
7064 fun->gimple_df->tm_restart = NULL;
7066 /* Tag the blocks with a depth number so that change_scope can find
7067 the common parent easily. */
7068 set_block_levels (DECL_INITIAL (fun->decl), 0);
7069 default_rtl_profile ();
7071 /* For -dx discard loops now, otherwise IL verify in clean_state will
7072 ICE. */
7073 if (rtl_dump_and_exit)
7075 cfun->curr_properties &= ~PROP_loops;
7076 loop_optimizer_finalize ();
7079 timevar_pop (TV_POST_EXPAND);
7081 return 0;
7084 } // anon namespace
7086 rtl_opt_pass *
7087 make_pass_expand (gcc::context *ctxt)
7089 return new pass_expand (ctxt);