c++: trait patch tweak
[official-gcc.git] / gcc / cfgexpand.cc
blobb860be8bb77b84357a439e6b25734e285fd8b418
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2023 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "tree-inline.h"
65 #include "value-prof.h"
66 #include "tree-ssa-live.h"
67 #include "tree-outof-ssa.h"
68 #include "cfgloop.h"
69 #include "insn-attr.h" /* For INSN_SCHEDULING. */
70 #include "stringpool.h"
71 #include "attribs.h"
72 #include "asan.h"
73 #include "tree-ssa-address.h"
74 #include "output.h"
75 #include "builtins.h"
76 #include "opts.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
/* Forward declarations of file-local helpers; their definitions are not
   part of the portion of the file shown here. */
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 switch (gimple_assign_rhs_class (stmt))
109 case GIMPLE_TERNARY_RHS:
110 t = build3 (gimple_assign_rhs_code (stmt),
111 TREE_TYPE (gimple_assign_lhs (stmt)),
112 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt),
113 gimple_assign_rhs3 (stmt));
114 break;
115 case GIMPLE_BINARY_RHS:
116 t = build2 (gimple_assign_rhs_code (stmt),
117 TREE_TYPE (gimple_assign_lhs (stmt)),
118 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt));
119 break;
120 case GIMPLE_UNARY_RHS:
121 t = build1 (gimple_assign_rhs_code (stmt),
122 TREE_TYPE (gimple_assign_lhs (stmt)),
123 gimple_assign_rhs1 (stmt));
124 break;
125 case GIMPLE_SINGLE_RHS:
127 t = gimple_assign_rhs1 (stmt);
128 /* Avoid modifying this tree in place below. */
129 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
130 && gimple_location (stmt) != EXPR_LOCATION (t))
131 || (gimple_block (stmt) && currently_expanding_to_rtl
132 && EXPR_P (t)))
133 t = copy_node (t);
134 break;
136 default:
137 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
/* Default to 1 when nothing else has defined STACK_ALIGNMENT_NEEDED. */
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
/* For an SSA_NAME X yield SSA_NAME_VAR (X), otherwise X itself.  Users in
   this file test the result against NULL before relying on it.  Note that
   X is evaluated more than once. */
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 class stack_var
310 public:
311 /* The Variable. */
312 tree decl;
314 /* Initially, the size of the variable. Later, the size of the partition,
315 if this variable becomes it's partition's representative. */
316 poly_uint64 size;
318 /* The *byte* alignment required for this variable. Or as, with the
319 size, the alignment for this partition. */
320 unsigned int alignb;
322 /* The partition representative. */
323 size_t representative;
325 /* The next stack variable in the partition, or EOC. */
326 size_t next;
328 /* The numbers of conflicting stack variables. */
329 bitmap conflicts;
/* End-of-chain marker stored in stack_var::next. */
332 #define EOC ((size_t)-1)
334 /* We have an array of such objects while deciding allocation.
   stack_vars_alloc is the number of elements allocated for the array,
   stack_vars_num the number of elements in use, and decl_to_stack_part
   maps each recorded variable to its index in the array. */
335 static class stack_var *stack_vars;
336 static size_t stack_vars_alloc;
337 static size_t stack_vars_num;
338 static hash_map<tree, size_t> *decl_to_stack_part;
340 /* Conflict bitmaps go on this obstack. This allows us to destroy
341 all of them in one big sweep. */
342 static bitmap_obstack stack_var_bitmap_obstack;
344 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
345 is non-decreasing. */
346 static size_t *stack_vars_sorted;
348 /* The phase of the stack frame. This is the known misalignment of
349 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
350 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
351 static int frame_phase;
353 /* Used during expand_used_vars to remember if we saw any decls for
354 which we'd like to enable stack smashing protection. */
355 static bool has_protected_decls;
357 /* Used during expand_used_vars. Remember if we saw a character buffer
358 smaller than our cutoff threshold. Used for -Wstack-protector. */
359 static bool has_short_buffer;
361 /* Compute the byte alignment to use for DECL. Ignore alignment
362 we can't do with expected alignment of the stack boundary. */
364 static unsigned int
365 align_local_variable (tree decl, bool really_expand)
367 unsigned int align;
369 if (TREE_CODE (decl) == SSA_NAME)
371 tree type = TREE_TYPE (decl);
372 machine_mode mode = TYPE_MODE (type);
374 align = TYPE_ALIGN (type);
375 if (mode != BLKmode
376 && align < GET_MODE_ALIGNMENT (mode))
377 align = GET_MODE_ALIGNMENT (mode);
379 else
380 align = LOCAL_DECL_ALIGNMENT (decl);
382 if (hwasan_sanitize_stack_p ())
383 align = MAX (align, (unsigned) HWASAN_TAG_GRANULE_SIZE * BITS_PER_UNIT);
385 if (TREE_CODE (decl) != SSA_NAME && really_expand)
386 /* Don't change DECL_ALIGN when called from estimated_stack_frame_size.
387 That is done before IPA and could bump alignment based on host
388 backend even for offloaded code which wants different
389 LOCAL_DECL_ALIGNMENT. */
390 SET_DECL_ALIGN (decl, align);
392 return align / BITS_PER_UNIT;
395 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
396 down otherwise. Return truncated BASE value. */
398 static inline unsigned HOST_WIDE_INT
399 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
401 return align_up ? (base + align - 1) & -align : base & -align;
404 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
405 Return the frame offset. */
407 static poly_int64
408 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
410 poly_int64 offset, new_frame_offset;
412 if (FRAME_GROWS_DOWNWARD)
414 new_frame_offset
415 = aligned_lower_bound (frame_offset - frame_phase - size,
416 align) + frame_phase;
417 offset = new_frame_offset;
419 else
421 new_frame_offset
422 = aligned_upper_bound (frame_offset - frame_phase,
423 align) + frame_phase;
424 offset = new_frame_offset;
425 new_frame_offset += size;
427 frame_offset = new_frame_offset;
429 if (frame_offset_overflow (frame_offset, cfun->decl))
430 frame_offset = offset = 0;
432 return offset;
435 /* Ensure that the stack is aligned to ALIGN bytes.
436 Return the new frame offset. */
437 static poly_int64
438 align_frame_offset (unsigned HOST_WIDE_INT align)
440 return alloc_stack_frame_space (0, align);
443 /* Accumulate DECL into STACK_VARS. */
445 static void
446 add_stack_var (tree decl, bool really_expand)
448 class stack_var *v;
450 if (stack_vars_num >= stack_vars_alloc)
452 if (stack_vars_alloc)
453 stack_vars_alloc = stack_vars_alloc * 3 / 2;
454 else
455 stack_vars_alloc = 32;
456 stack_vars
457 = XRESIZEVEC (class stack_var, stack_vars, stack_vars_alloc);
459 if (!decl_to_stack_part)
460 decl_to_stack_part = new hash_map<tree, size_t>;
462 v = &stack_vars[stack_vars_num];
463 decl_to_stack_part->put (decl, stack_vars_num);
465 v->decl = decl;
466 tree size = TREE_CODE (decl) == SSA_NAME
467 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
468 : DECL_SIZE_UNIT (decl);
469 v->size = tree_to_poly_uint64 (size);
470 /* Ensure that all variables have size, so that &a != &b for any two
471 variables that are simultaneously live. */
472 if (known_eq (v->size, 0U))
473 v->size = 1;
474 v->alignb = align_local_variable (decl, really_expand);
475 /* An alignment of zero can mightily confuse us later. */
476 gcc_assert (v->alignb != 0);
478 /* All variables are initially in their own partition. */
479 v->representative = stack_vars_num;
480 v->next = EOC;
482 /* All variables initially conflict with no other. */
483 v->conflicts = NULL;
485 /* Ensure that this decl doesn't get put onto the list twice. */
486 set_rtl (decl, pc_rtx);
488 stack_vars_num++;
491 /* Make the decls associated with luid's X and Y conflict. */
493 static void
494 add_stack_var_conflict (size_t x, size_t y)
496 class stack_var *a = &stack_vars[x];
497 class stack_var *b = &stack_vars[y];
498 if (x == y)
499 return;
500 if (!a->conflicts)
501 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
502 if (!b->conflicts)
503 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
504 bitmap_set_bit (a->conflicts, y);
505 bitmap_set_bit (b->conflicts, x);
508 /* Check whether the decls associated with luid's X and Y conflict. */
510 static bool
511 stack_var_conflict_p (size_t x, size_t y)
513 class stack_var *a = &stack_vars[x];
514 class stack_var *b = &stack_vars[y];
515 if (x == y)
516 return false;
517 /* Partitions containing an SSA name result from gimple registers
518 with things like unsupported modes. They are top-level and
519 hence conflict with everything else. */
520 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
521 return true;
523 if (!a->conflicts || !b->conflicts)
524 return false;
525 return bitmap_bit_p (a->conflicts, y);
528 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
529 enter its partition number into bitmap DATA. */
531 static bool
532 visit_op (gimple *, tree op, tree, void *data)
534 bitmap active = (bitmap)data;
535 op = get_base_address (op);
536 if (op
537 && DECL_P (op)
538 && DECL_RTL_IF_SET (op) == pc_rtx)
540 size_t *v = decl_to_stack_part->get (op);
541 if (v)
542 bitmap_set_bit (active, *v);
544 return false;
547 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
548 record conflicts between it and all currently active other partitions
549 from bitmap DATA. */
551 static bool
552 visit_conflict (gimple *, tree op, tree, void *data)
554 bitmap active = (bitmap)data;
555 op = get_base_address (op);
556 if (op
557 && DECL_P (op)
558 && DECL_RTL_IF_SET (op) == pc_rtx)
560 size_t *v = decl_to_stack_part->get (op);
561 if (v && bitmap_set_bit (active, *v))
563 size_t num = *v;
564 bitmap_iterator bi;
565 unsigned i;
566 gcc_assert (num < stack_vars_num);
567 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
568 add_stack_var_conflict (num, i);
571 return false;
574 /* Helper routine for add_scope_conflicts, calculating the active partitions
575 at the end of BB, leaving the result in WORK. We're called to generate
576 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
577 liveness. */
579 static void
580 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
582 edge e;
583 edge_iterator ei;
584 gimple_stmt_iterator gsi;
585 walk_stmt_load_store_addr_fn visit;
587 bitmap_clear (work);
588 FOR_EACH_EDGE (e, ei, bb->preds)
589 bitmap_ior_into (work, (bitmap)e->src->aux);
591 visit = visit_op;
593 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
595 gimple *stmt = gsi_stmt (gsi);
596 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
598 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
600 gimple *stmt = gsi_stmt (gsi);
602 if (gimple_clobber_p (stmt))
604 tree lhs = gimple_assign_lhs (stmt);
605 size_t *v;
606 /* Nested function lowering might introduce LHSs
607 that are COMPONENT_REFs. */
608 if (!VAR_P (lhs))
609 continue;
610 if (DECL_RTL_IF_SET (lhs) == pc_rtx
611 && (v = decl_to_stack_part->get (lhs)))
612 bitmap_clear_bit (work, *v);
614 else if (!is_gimple_debug (stmt))
616 if (for_conflict
617 && visit == visit_op)
619 /* If this is the first real instruction in this BB we need
620 to add conflicts for everything live at this point now.
621 Unlike classical liveness for named objects we can't
622 rely on seeing a def/use of the names we're interested in.
623 There might merely be indirect loads/stores. We'd not add any
624 conflicts for such partitions. */
625 bitmap_iterator bi;
626 unsigned i;
627 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
629 class stack_var *a = &stack_vars[i];
630 if (!a->conflicts)
631 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
632 bitmap_ior_into (a->conflicts, work);
634 visit = visit_conflict;
636 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
641 /* Generate stack partition conflicts between all partitions that are
642 simultaneously live. */
644 static void
645 add_scope_conflicts (void)
647 basic_block bb;
648 bool changed;
649 bitmap work = BITMAP_ALLOC (NULL);
650 int *rpo;
651 int n_bbs;
653 /* We approximate the live range of a stack variable by taking the first
654 mention of its name as starting point(s), and by the end-of-scope
655 death clobber added by gimplify as ending point(s) of the range.
656 This overapproximates in the case we for instance moved an address-taken
657 operation upward, without also moving a dereference to it upwards.
658 But it's conservatively correct as a variable never can hold values
659 before its name is mentioned at least once.
661 We then do a mostly classical bitmap liveness algorithm. */
663 FOR_ALL_BB_FN (bb, cfun)
664 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
666 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
667 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
669 changed = true;
670 while (changed)
672 int i;
673 changed = false;
674 for (i = 0; i < n_bbs; i++)
676 bitmap active;
677 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
678 active = (bitmap)bb->aux;
679 add_scope_conflicts_1 (bb, work, false);
680 if (bitmap_ior_into (active, work))
681 changed = true;
685 FOR_EACH_BB_FN (bb, cfun)
686 add_scope_conflicts_1 (bb, work, true);
688 free (rpo);
689 BITMAP_FREE (work);
690 FOR_ALL_BB_FN (bb, cfun)
691 BITMAP_FREE (bb->aux);
694 /* A subroutine of partition_stack_vars. A comparison function for qsort,
695 sorting an array of indices by the properties of the object. */
697 static int
698 stack_var_cmp (const void *a, const void *b)
700 size_t ia = *(const size_t *)a;
701 size_t ib = *(const size_t *)b;
702 unsigned int aligna = stack_vars[ia].alignb;
703 unsigned int alignb = stack_vars[ib].alignb;
704 poly_int64 sizea = stack_vars[ia].size;
705 poly_int64 sizeb = stack_vars[ib].size;
706 tree decla = stack_vars[ia].decl;
707 tree declb = stack_vars[ib].decl;
708 bool largea, largeb;
709 unsigned int uida, uidb;
711 /* Primary compare on "large" alignment. Large comes first. */
712 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
713 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
714 if (largea != largeb)
715 return (int)largeb - (int)largea;
717 /* Secondary compare on size, decreasing */
718 int diff = compare_sizes_for_sort (sizeb, sizea);
719 if (diff != 0)
720 return diff;
722 /* Tertiary compare on true alignment, decreasing. */
723 if (aligna < alignb)
724 return -1;
725 if (aligna > alignb)
726 return 1;
728 /* Final compare on ID for sort stability, increasing.
729 Two SSA names are compared by their version, SSA names come before
730 non-SSA names, and two normal decls are compared by their DECL_UID. */
731 if (TREE_CODE (decla) == SSA_NAME)
733 if (TREE_CODE (declb) == SSA_NAME)
734 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
735 else
736 return -1;
738 else if (TREE_CODE (declb) == SSA_NAME)
739 return 1;
740 else
741 uida = DECL_UID (decla), uidb = DECL_UID (declb);
742 if (uida < uidb)
743 return 1;
744 if (uida > uidb)
745 return -1;
746 return 0;
/* Hash map keyed by an integer UID whose values are partition bitmaps.
   In this file it is filled with DECL_PT_UID keys, each mapped to the
   bitmap of the partition that decl belongs to. */
749 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
750 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
752 /* If the points-to solution *PI points to variables that are in a partition
753 together with other variables add all partition members to the pointed-to
754 variables bitmap. */
756 static void
757 add_partitioned_vars_to_ptset (struct pt_solution *pt,
758 part_hashmap *decls_to_partitions,
759 hash_set<bitmap> *visited, bitmap temp)
761 bitmap_iterator bi;
762 unsigned i;
763 bitmap *part;
765 if (pt->anything
766 || pt->vars == NULL
767 /* The pointed-to vars bitmap is shared, it is enough to
768 visit it once. */
769 || visited->add (pt->vars))
770 return;
772 bitmap_clear (temp);
774 /* By using a temporary bitmap to store all members of the partitions
775 we have to add we make sure to visit each of the partitions only
776 once. */
777 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
778 if ((!temp
779 || !bitmap_bit_p (temp, i))
780 && (part = decls_to_partitions->get (i)))
781 bitmap_ior_into (temp, *part);
782 if (!bitmap_empty_p (temp))
783 bitmap_ior_into (pt->vars, temp);
786 /* Update points-to sets based on partition info, so we can use them on RTL.
787 The bitmaps representing stack partitions will be saved until expand,
788 where partitioned decls used as bases in memory expressions will be
789 rewritten. */
791 static void
792 update_alias_info_with_stack_vars (void)
794 part_hashmap *decls_to_partitions = NULL;
795 size_t i, j;
796 tree var = NULL_TREE;
798 for (i = 0; i < stack_vars_num; i++)
800 bitmap part = NULL;
801 tree name;
802 struct ptr_info_def *pi;
804 /* Not interested in partitions with single variable. */
805 if (stack_vars[i].representative != i
806 || stack_vars[i].next == EOC)
807 continue;
809 if (!decls_to_partitions)
811 decls_to_partitions = new part_hashmap;
812 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
815 /* Create an SSA_NAME that points to the partition for use
816 as base during alias-oracle queries on RTL for bases that
817 have been partitioned. */
818 if (var == NULL_TREE)
819 var = create_tmp_var (ptr_type_node);
820 name = make_ssa_name (var);
822 /* Create bitmaps representing partitions. They will be used for
823 points-to sets later, so use GGC alloc. */
824 part = BITMAP_GGC_ALLOC ();
825 for (j = i; j != EOC; j = stack_vars[j].next)
827 tree decl = stack_vars[j].decl;
828 unsigned int uid = DECL_PT_UID (decl);
829 bitmap_set_bit (part, uid);
830 decls_to_partitions->put (uid, part);
831 cfun->gimple_df->decls_to_pointers->put (decl, name);
832 if (TREE_ADDRESSABLE (decl))
833 TREE_ADDRESSABLE (name) = 1;
836 /* Make the SSA name point to all partition members. */
837 pi = get_ptr_info (name);
838 pt_solution_set (&pi->pt, part, false);
841 /* Make all points-to sets that contain one member of a partition
842 contain all members of the partition. */
843 if (decls_to_partitions)
845 unsigned i;
846 tree name;
847 hash_set<bitmap> visited;
848 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
850 FOR_EACH_SSA_NAME (i, name, cfun)
852 struct ptr_info_def *pi;
854 if (POINTER_TYPE_P (TREE_TYPE (name))
855 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
856 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
857 &visited, temp);
860 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
861 decls_to_partitions, &visited, temp);
862 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped_return,
863 decls_to_partitions, &visited, temp);
864 delete decls_to_partitions;
865 BITMAP_FREE (temp);
869 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
870 partitioning algorithm. Partitions A and B are known to be non-conflicting.
871 Merge them into a single partition A. */
873 static void
874 union_stack_vars (size_t a, size_t b)
876 class stack_var *vb = &stack_vars[b];
877 bitmap_iterator bi;
878 unsigned u;
880 gcc_assert (stack_vars[b].next == EOC);
881 /* Add B to A's partition. */
882 stack_vars[b].next = stack_vars[a].next;
883 stack_vars[b].representative = a;
884 stack_vars[a].next = b;
886 /* Make sure A is big enough to hold B. */
887 stack_vars[a].size = upper_bound (stack_vars[a].size, stack_vars[b].size);
889 /* Update the required alignment of partition A to account for B. */
890 if (stack_vars[a].alignb < stack_vars[b].alignb)
891 stack_vars[a].alignb = stack_vars[b].alignb;
893 /* Update the interference graph and merge the conflicts. */
894 if (vb->conflicts)
896 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
897 add_stack_var_conflict (a, stack_vars[u].representative);
898 BITMAP_FREE (vb->conflicts);
902 /* A subroutine of expand_used_vars. Binpack the variables into
903 partitions constrained by the interference graph. The overall
904 algorithm used is as follows:
906 Sort the objects by size in descending order.
907 For each object A {
908 S = size(A)
909 O = 0
910 loop {
911 Look for the largest non-conflicting object B with size <= S.
912 UNION (A, B)
917 static void
918 partition_stack_vars (void)
920 size_t si, sj, n = stack_vars_num;
922 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
923 for (si = 0; si < n; ++si)
924 stack_vars_sorted[si] = si;
926 if (n == 1)
927 return;
929 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
931 for (si = 0; si < n; ++si)
933 size_t i = stack_vars_sorted[si];
934 unsigned int ialign = stack_vars[i].alignb;
935 poly_int64 isize = stack_vars[i].size;
937 /* Ignore objects that aren't partition representatives. If we
938 see a var that is not a partition representative, it must
939 have been merged earlier. */
940 if (stack_vars[i].representative != i)
941 continue;
943 for (sj = si + 1; sj < n; ++sj)
945 size_t j = stack_vars_sorted[sj];
946 unsigned int jalign = stack_vars[j].alignb;
947 poly_int64 jsize = stack_vars[j].size;
949 /* Ignore objects that aren't partition representatives. */
950 if (stack_vars[j].representative != j)
951 continue;
953 /* Do not mix objects of "small" (supported) alignment
954 and "large" (unsupported) alignment. */
955 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
956 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
957 break;
959 /* For Address Sanitizer do not mix objects with different
960 sizes, as the shorter vars wouldn't be adequately protected.
961 Don't do that for "large" (unsupported) alignment objects,
962 those aren't protected anyway. */
963 if (asan_sanitize_stack_p ()
964 && maybe_ne (isize, jsize)
965 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
966 break;
968 /* Ignore conflicting objects. */
969 if (stack_var_conflict_p (i, j))
970 continue;
972 /* UNION the objects, placing J at OFFSET. */
973 union_stack_vars (i, j);
977 update_alias_info_with_stack_vars ();
980 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
982 static void
983 dump_stack_var_partition (void)
985 size_t si, i, j, n = stack_vars_num;
987 for (si = 0; si < n; ++si)
989 i = stack_vars_sorted[si];
991 /* Skip variables that aren't partition representatives, for now. */
992 if (stack_vars[i].representative != i)
993 continue;
995 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
996 print_dec (stack_vars[i].size, dump_file);
997 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
999 for (j = i; j != EOC; j = stack_vars[j].next)
1001 fputc ('\t', dump_file);
1002 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
1004 fputc ('\n', dump_file);
1008 /* Assign rtl to DECL at BASE + OFFSET. */
1010 static void
1011 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
1012 poly_int64 offset)
1014 unsigned align;
1015 rtx x;
1017 /* If this fails, we've overflowed the stack frame. Error nicely? */
1018 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
1020 if (hwasan_sanitize_stack_p ())
1021 x = targetm.memtag.add_tag (base, offset,
1022 hwasan_current_frame_tag ());
1023 else
1024 x = plus_constant (Pmode, base, offset);
1026 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
1027 ? TYPE_MODE (TREE_TYPE (decl))
1028 : DECL_MODE (decl), x);
1030 /* Set alignment we actually gave this decl if it isn't an SSA name.
1031 If it is we generate stack slots only accidentally so it isn't as
1032 important, we'll simply set the alignment directly on the MEM. */
1034 if (stack_vars_base_reg_p (base))
1035 offset -= frame_phase;
1036 align = known_alignment (offset);
1037 align *= BITS_PER_UNIT;
1038 if (align == 0 || align > base_align)
1039 align = base_align;
1041 if (TREE_CODE (decl) != SSA_NAME)
1043 /* One would think that we could assert that we're not decreasing
1044 alignment here, but (at least) the i386 port does exactly this
1045 via the MINIMUM_ALIGNMENT hook. */
1047 SET_DECL_ALIGN (decl, align);
1048 DECL_USER_ALIGN (decl) = 0;
1051 set_rtl (decl, x);
1053 set_mem_align (x, align);
1056 class stack_vars_data
1058 public:
1059 /* Vector of offset pairs, always end of some padding followed
1060 by start of the padding that needs Address Sanitizer protection.
1061 The vector is in reversed, highest offset pairs come first. */
1062 auto_vec<HOST_WIDE_INT> asan_vec;
1064 /* Vector of partition representative decls in between the paddings. */
1065 auto_vec<tree> asan_decl_vec;
1067 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1068 rtx asan_base;
1070 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1071 unsigned int asan_alignb;
1074 /* A subroutine of expand_used_vars. Give each partition representative
1075 a unique location within the stack frame. Update each partition member
1076 with that location.

   PRED, when non-NULL, selects which partitions are laid out by this call;
   it is invoked with the stack_vars index of the partition representative.
   Partitions whose alignment exceeds MAX_SUPPORTED_STACK_ALIGNMENT are only
   handled when PRED is NULL.

   DATA collects the Address Sanitizer bookkeeping (offset pairs,
   representative decls, base register and alignment).  It is only accessed
   when asan_sanitize_stack_p () holds and PRED is non-NULL. */
1077 static void
1078 expand_stack_vars (bool (*pred) (size_t), class stack_vars_data *data)
1080 size_t si, i, j, n = stack_vars_num;
1081 poly_uint64 large_size = 0, large_alloc = 0;
1082 rtx large_base = NULL;
1083 rtx large_untagged_base = NULL;
1084 unsigned large_align = 0;
1085 bool large_allocation_done = false;
1086 tree decl;
1088 /* Determine if there are any variables requiring "large" alignment.
1089 Since these are dynamically allocated, we only process these if
1090 no predicate involved. */
1091 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1092 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1094 /* Find the total size of these variables. */
1095 for (si = 0; si < n; ++si)
1097 unsigned alignb;
1099 i = stack_vars_sorted[si];
1100 alignb = stack_vars[i].alignb;
1102 /* All "large" alignment decls come before all "small" alignment
1103 decls, but "large" alignment decls are not sorted based on
1104 their alignment. Increase large_align to track the largest
1105 required alignment. */
1106 if ((alignb * BITS_PER_UNIT) > large_align)
1107 large_align = alignb * BITS_PER_UNIT;
1109 /* Stop when we get to the first decl with "small" alignment. */
1110 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1111 break;
1113 /* Skip variables that aren't partition representatives. */
1114 if (stack_vars[i].representative != i)
1115 continue;
1117 /* Skip variables that have already had rtl assigned. See also
1118 add_stack_var where we perpetrate this pc_rtx hack. */
1119 decl = stack_vars[i].decl;
1120 if (TREE_CODE (decl) == SSA_NAME
1121 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1122 : DECL_RTL (decl) != pc_rtx)
1123 continue;
1125 large_size = aligned_upper_bound (large_size, alignb);
1126 large_size += stack_vars[i].size;
/* Main pass: walk the sorted variables and give every eligible partition
   representative a base, a base alignment and an offset, then propagate
   that location to all members of its partition. */
1130 for (si = 0; si < n; ++si)
1132 rtx base;
1133 unsigned base_align, alignb;
1134 poly_int64 offset = 0;
1136 i = stack_vars_sorted[si];
1138 /* Skip variables that aren't partition representatives, for now. */
1139 if (stack_vars[i].representative != i)
1140 continue;
1142 /* Skip variables that have already had rtl assigned. See also
1143 add_stack_var where we perpetrate this pc_rtx hack. */
1144 decl = stack_vars[i].decl;
1145 if (TREE_CODE (decl) == SSA_NAME
1146 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1147 : DECL_RTL (decl) != pc_rtx)
1148 continue;
1150 /* Check the predicate to see whether this variable should be
1151 allocated in this pass. */
1152 if (pred && !pred (i))
1153 continue;
1155 base = (hwasan_sanitize_stack_p ()
1156 ? hwasan_frame_base ()
1157 : virtual_stack_vars_rtx);
1158 alignb = stack_vars[i].alignb;
1159 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1161 poly_int64 hwasan_orig_offset;
1162 if (hwasan_sanitize_stack_p ())
1164 /* There must be no tag granule "shared" between different
1165 objects. This means that no HWASAN_TAG_GRANULE_SIZE byte
1166 chunk can have more than one object in it.
1168 We ensure this by forcing the end of the last bit of data to
1169 be aligned to HWASAN_TAG_GRANULE_SIZE bytes here, and setting
1170 the start of each variable to be aligned to
1171 HWASAN_TAG_GRANULE_SIZE bytes in `align_local_variable`.
1173 We can't align just one of the start or end, since there are
1174 untagged things stored on the stack which we do not align to
1175 HWASAN_TAG_GRANULE_SIZE bytes. If we only aligned the start
1176 or the end of tagged objects then untagged objects could end
1177 up sharing the first granule of a tagged object or sharing the
1178 last granule of a tagged object respectively. */
1179 hwasan_orig_offset = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1180 gcc_assert (stack_vars[i].alignb >= HWASAN_TAG_GRANULE_SIZE);
1182 /* ASAN description strings don't yet have a syntax for expressing
1183 polynomial offsets. */
1184 HOST_WIDE_INT prev_offset;
1185 if (asan_sanitize_stack_p ()
1186 && pred
1187 && frame_offset.is_constant (&prev_offset)
1188 && stack_vars[i].size.is_constant ())
1190 if (data->asan_vec.is_empty ())
1192 align_frame_offset (ASAN_RED_ZONE_SIZE);
1193 prev_offset = frame_offset.to_constant ();
1195 prev_offset = align_base (prev_offset,
1196 ASAN_MIN_RED_ZONE_SIZE,
1197 !FRAME_GROWS_DOWNWARD);
1198 tree repr_decl = NULL_TREE;
1199 unsigned HOST_WIDE_INT size
1200 = asan_var_and_redzone_size (stack_vars[i].size.to_constant ());
1201 if (data->asan_vec.is_empty ())
1202 size = MAX (size, ASAN_RED_ZONE_SIZE);
1204 unsigned HOST_WIDE_INT alignment = MAX (alignb,
1205 ASAN_MIN_RED_ZONE_SIZE);
1206 offset = alloc_stack_frame_space (size, alignment);
1208 data->asan_vec.safe_push (prev_offset);
1209 /* Allocating a constant amount of space from a constant
1210 starting offset must give a constant result. */
1211 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1212 .to_constant ());
1213 /* Find best representative of the partition.
1214 Prefer those with DECL_NAME, even better
1215 satisfying asan_protect_stack_decl predicate. */
1216 for (j = i; j != EOC; j = stack_vars[j].next)
1217 if (asan_protect_stack_decl (stack_vars[j].decl)
1218 && DECL_NAME (stack_vars[j].decl))
1220 repr_decl = stack_vars[j].decl;
1221 break;
1223 else if (repr_decl == NULL_TREE
1224 && DECL_P (stack_vars[j].decl)
1225 && DECL_NAME (stack_vars[j].decl))
1226 repr_decl = stack_vars[j].decl;
1227 if (repr_decl == NULL_TREE)
1228 repr_decl = stack_vars[i].decl;
1229 data->asan_decl_vec.safe_push (repr_decl);
1231 /* Make sure a representative is unpoisoned if another
1232 variable in the partition is handled by
1233 use-after-scope sanitization. */
1234 if (asan_handled_variables != NULL
1235 && !asan_handled_variables->contains (repr_decl))
1237 for (j = i; j != EOC; j = stack_vars[j].next)
1238 if (asan_handled_variables->contains (stack_vars[j].decl))
1239 break;
1240 if (j != EOC)
1241 asan_handled_variables->add (repr_decl);
1244 data->asan_alignb = MAX (data->asan_alignb, alignb);
1245 if (data->asan_base == NULL)
1246 data->asan_base = gen_reg_rtx (Pmode);
1247 base = data->asan_base;
1249 if (!STRICT_ALIGNMENT)
1250 base_align = crtl->max_used_stack_slot_alignment;
1251 else
1252 base_align = MAX (crtl->max_used_stack_slot_alignment,
1253 GET_MODE_ALIGNMENT (SImode)
1254 << ASAN_SHADOW_SHIFT);
1256 else
1258 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1259 base_align = crtl->max_used_stack_slot_alignment;
1261 if (hwasan_sanitize_stack_p ())
1263 /* Align again since the point of this alignment is to handle
1264 the "end" of the object (i.e. smallest address after the
1265 stack object). For FRAME_GROWS_DOWNWARD that requires
1266 aligning the stack before allocating, but for a frame that
1267 grows upwards that requires aligning the stack after
1268 allocation.
1270 Use `frame_offset` to record the offset value rather than
1271 `offset` since the `frame_offset` describes the extent
1272 allocated for this particular variable while `offset`
1273 describes the address that this variable starts at. */
1274 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1275 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1276 hwasan_orig_offset, frame_offset);
1280 else
1282 /* Large alignment is only processed in the last pass. */
1283 if (pred)
1284 continue;
1286 /* If there were any variables requiring "large" alignment, allocate
1287 space. */
1288 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1290 poly_int64 loffset;
1291 rtx large_allocsize;
1293 large_allocsize = gen_int_mode (large_size, Pmode);
1294 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1295 loffset = alloc_stack_frame_space
1296 (rtx_to_poly_int64 (large_allocsize),
1297 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1298 large_base = get_dynamic_stack_base (loffset, large_align, base);
1299 large_allocation_done = true;
1302 gcc_assert (large_base != NULL);
1303 large_alloc = aligned_upper_bound (large_alloc, alignb);
1304 offset = large_alloc;
1305 large_alloc += stack_vars[i].size;
1306 if (hwasan_sanitize_stack_p ())
1308 /* An object with a large alignment requirement means that the
1309 alignment requirement is greater than the required alignment
1310 for tags. */
1311 if (!large_untagged_base)
1312 large_untagged_base
1313 = targetm.memtag.untagged_pointer (large_base, NULL_RTX);
1314 /* Ensure the end of the variable is also aligned correctly. */
1315 poly_int64 align_again
1316 = aligned_upper_bound (large_alloc, HWASAN_TAG_GRANULE_SIZE);
1317 /* For large allocations we always allocate a chunk of space
1318 (which is addressed by large_untagged_base/large_base) and
1319 then use positive offsets from that. Hence the farthest
1320 offset is `align_again` and the nearest offset from the base
1321 is `offset`. */
1322 hwasan_record_stack_var (large_untagged_base, large_base,
1323 offset, align_again);
1326 base = large_base;
1327 base_align = large_align;
1330 /* Create rtl for each variable based on their location within the
1331 partition. */
1332 for (j = i; j != EOC; j = stack_vars[j].next)
1334 expand_one_stack_var_at (stack_vars[j].decl,
1335 base, base_align, offset);
1337 if (hwasan_sanitize_stack_p ())
1338 hwasan_increment_frame_tag ();
/* The space handed out to "large" alignment variables in the main pass
   must match the total computed for them at the top of the function
   (both stay zero when PRED is non-NULL). */
1341 gcc_assert (known_eq (large_alloc, large_size));
1344 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1345 static poly_uint64
1346 account_stack_vars (void)
1348 size_t si, j, i, n = stack_vars_num;
1349 poly_uint64 size = 0;
1351 for (si = 0; si < n; ++si)
1353 i = stack_vars_sorted[si];
1355 /* Skip variables that aren't partition representatives, for now. */
1356 if (stack_vars[i].representative != i)
1357 continue;
1359 size += stack_vars[i].size;
1360 for (j = i; j != EOC; j = stack_vars[j].next)
1361 set_rtl (stack_vars[j].decl, NULL);
1363 return size;
1366 /* Record the RTL assignment X for the default def of PARM. */
1368 extern void
1369 set_parm_rtl (tree parm, rtx x)
1371 gcc_assert (TREE_CODE (parm) == PARM_DECL
1372 || TREE_CODE (parm) == RESULT_DECL);
1374 if (x && !MEM_P (x))
1376 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1377 TYPE_MODE (TREE_TYPE (parm)),
1378 TYPE_ALIGN (TREE_TYPE (parm)));
1380 /* If the variable alignment is very large we'll dynamicaly
1381 allocate it, which means that in-frame portion is just a
1382 pointer. ??? We've got a pseudo for sure here, do we
1383 actually dynamically allocate its spilling area if needed?
1384 ??? Isn't it a problem when Pmode alignment also exceeds
1385 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1386 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1387 align = GET_MODE_ALIGNMENT (Pmode);
1389 record_alignment_for_reg_var (align);
1392 tree ssa = ssa_default_def (cfun, parm);
1393 if (!ssa)
1394 return set_rtl (parm, x);
1396 int part = var_to_partition (SA.map, ssa);
1397 gcc_assert (part != NO_PARTITION);
1399 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1400 gcc_assert (changed);
1402 set_rtl (ssa, x);
1403 gcc_assert (DECL_RTL (parm) == x);
1406 /* A subroutine of expand_one_var. Called to immediately assign rtl
1407 to a variable to be allocated in the stack frame. */
1409 static void
1410 expand_one_stack_var_1 (tree var)
1412 poly_uint64 size;
1413 poly_int64 offset;
1414 unsigned byte_align;
1416 if (TREE_CODE (var) == SSA_NAME)
1418 tree type = TREE_TYPE (var);
1419 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1421 else
1422 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1424 byte_align = align_local_variable (var, true);
1426 /* We handle highly aligned variables in expand_stack_vars. */
1427 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1429 rtx base;
1430 if (hwasan_sanitize_stack_p ())
1432 /* Allocate zero bytes to align the stack. */
1433 poly_int64 hwasan_orig_offset
1434 = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1435 offset = alloc_stack_frame_space (size, byte_align);
1436 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1437 base = hwasan_frame_base ();
1438 /* Use `frame_offset` to automatically account for machines where the
1439 frame grows upwards.
1441 `offset` will always point to the "start" of the stack object, which
1442 will be the smallest address, for ! FRAME_GROWS_DOWNWARD this is *not*
1443 the "furthest" offset from the base delimiting the current stack
1444 object. `frame_offset` will always delimit the extent that the frame.
1446 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1447 hwasan_orig_offset, frame_offset);
1449 else
1451 offset = alloc_stack_frame_space (size, byte_align);
1452 base = virtual_stack_vars_rtx;
1455 expand_one_stack_var_at (var, base,
1456 crtl->max_used_stack_slot_alignment, offset);
1458 if (hwasan_sanitize_stack_p ())
1459 hwasan_increment_frame_tag ();
1462 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1463 already assigned some MEM. */
1465 static void
1466 expand_one_stack_var (tree var)
1468 if (TREE_CODE (var) == SSA_NAME)
1470 int part = var_to_partition (SA.map, var);
1471 if (part != NO_PARTITION)
1473 rtx x = SA.partition_to_pseudo[part];
1474 gcc_assert (x);
1475 gcc_assert (MEM_P (x));
1476 return;
1480 return expand_one_stack_var_1 (var);
1483 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1484 that will reside in a hard register. */
1486 static void
1487 expand_one_hard_reg_var (tree var)
1489 rest_of_decl_compilation (var, 0, 0);
1492 /* Record the alignment requirements of some variable assigned to a
1493 pseudo. */
1495 static void
1496 record_alignment_for_reg_var (unsigned int align)
1498 if (SUPPORTS_STACK_ALIGNMENT
1499 && crtl->stack_alignment_estimated < align)
1501 /* stack_alignment_estimated shouldn't change after stack
1502 realign decision made */
1503 gcc_assert (!crtl->stack_realign_processed);
1504 crtl->stack_alignment_estimated = align;
1507 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1508 So here we only make sure stack_alignment_needed >= align. */
1509 if (crtl->stack_alignment_needed < align)
1510 crtl->stack_alignment_needed = align;
1511 if (crtl->max_used_stack_slot_alignment < align)
1512 crtl->max_used_stack_slot_alignment = align;
1515 /* Create RTL for an SSA partition. */
1517 static void
1518 expand_one_ssa_partition (tree var)
1520 int part = var_to_partition (SA.map, var);
1521 gcc_assert (part != NO_PARTITION);
1523 if (SA.partition_to_pseudo[part])
1524 return;
1526 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1527 TYPE_MODE (TREE_TYPE (var)),
1528 TYPE_ALIGN (TREE_TYPE (var)));
1530 /* If the variable alignment is very large we'll dynamicaly allocate
1531 it, which means that in-frame portion is just a pointer. */
1532 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1533 align = GET_MODE_ALIGNMENT (Pmode);
1535 record_alignment_for_reg_var (align);
1537 if (!use_register_for_decl (var))
1539 if (defer_stack_allocation (var, true))
1540 add_stack_var (var, true);
1541 else
1542 expand_one_stack_var_1 (var);
1543 return;
1546 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1547 rtx x = gen_reg_rtx (reg_mode);
1549 set_rtl (var, x);
1551 /* For a promoted variable, X will not be used directly but wrapped in a
1552 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1553 will assume that its upper bits can be inferred from its lower bits.
1554 Therefore, if X isn't initialized on every path from the entry, then
1555 we must do it manually in order to fulfill the above assumption. */
1556 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1557 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1558 emit_move_insn (x, CONST0_RTX (reg_mode));
1561 /* Record the association between the RTL generated for partition PART
1562 and the underlying variable of the SSA_NAME VAR. */
1564 static void
1565 adjust_one_expanded_partition_var (tree var)
1567 if (!var)
1568 return;
1570 tree decl = SSA_NAME_VAR (var);
1572 int part = var_to_partition (SA.map, var);
1573 if (part == NO_PARTITION)
1574 return;
1576 rtx x = SA.partition_to_pseudo[part];
1578 gcc_assert (x);
1580 set_rtl (var, x);
1582 if (!REG_P (x))
1583 return;
1585 /* Note if the object is a user variable. */
1586 if (decl && !DECL_ARTIFICIAL (decl))
1587 mark_user_reg (x);
1589 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1590 mark_reg_pointer (x, get_pointer_alignment (var));
1593 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1594 that will reside in a pseudo register. */
1596 static void
1597 expand_one_register_var (tree var)
1599 if (TREE_CODE (var) == SSA_NAME)
1601 int part = var_to_partition (SA.map, var);
1602 if (part != NO_PARTITION)
1604 rtx x = SA.partition_to_pseudo[part];
1605 gcc_assert (x);
1606 gcc_assert (REG_P (x));
1607 return;
1609 gcc_unreachable ();
1612 tree decl = var;
1613 tree type = TREE_TYPE (decl);
1614 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1615 rtx x = gen_reg_rtx (reg_mode);
1617 set_rtl (var, x);
1619 /* Note if the object is a user variable. */
1620 if (!DECL_ARTIFICIAL (decl))
1621 mark_user_reg (x);
1623 if (POINTER_TYPE_P (type))
1624 mark_reg_pointer (x, get_pointer_alignment (var));
1627 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1628 has some associated error, e.g. its type is error-mark. We just need
1629 to pick something that won't crash the rest of the compiler. */
1631 static void
1632 expand_one_error_var (tree var)
1634 machine_mode mode = DECL_MODE (var);
1635 rtx x;
1637 if (mode == BLKmode)
1638 x = gen_rtx_MEM (BLKmode, const0_rtx);
1639 else if (mode == VOIDmode)
1640 x = const0_rtx;
1641 else
1642 x = gen_reg_rtx (mode);
1644 SET_DECL_RTL (var, x);
1647 /* A subroutine of expand_one_var. VAR is a variable that will be
1648 allocated to the local stack frame. Return true if we wish to
1649 add VAR to STACK_VARS so that it will be coalesced with other
1650 variables. Return false to allocate VAR immediately.
1652 This function is used to reduce the number of variables considered
1653 for coalescing, which reduces the size of the quadratic problem. */
1655 static bool
1656 defer_stack_allocation (tree var, bool toplevel)
1658 tree size_unit = TREE_CODE (var) == SSA_NAME
1659 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1660 : DECL_SIZE_UNIT (var);
1661 poly_uint64 size;
1663 /* Whether the variable is small enough for immediate allocation not to be
1664 a problem with regard to the frame size. */
1665 bool smallish
1666 = (poly_int_tree_p (size_unit, &size)
1667 && (estimated_poly_value (size)
1668 < param_min_size_for_stack_sharing));
1670 /* If stack protection is enabled, *all* stack variables must be deferred,
1671 so that we can re-order the strings to the top of the frame.
1672 Similarly for Address Sanitizer. */
1673 if (flag_stack_protect || asan_sanitize_stack_p ())
1674 return true;
1676 unsigned int align = TREE_CODE (var) == SSA_NAME
1677 ? TYPE_ALIGN (TREE_TYPE (var))
1678 : DECL_ALIGN (var);
1680 /* We handle "large" alignment via dynamic allocation. We want to handle
1681 this extra complication in only one place, so defer them. */
1682 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1683 return true;
1685 bool ignored = TREE_CODE (var) == SSA_NAME
1686 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1687 : DECL_IGNORED_P (var);
1689 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1690 might be detached from their block and appear at toplevel when we reach
1691 here. We want to coalesce them with variables from other blocks when
1692 the immediate contribution to the frame size would be noticeable. */
1693 if (toplevel && optimize > 0 && ignored && !smallish)
1694 return true;
1696 /* Variables declared in the outermost scope automatically conflict
1697 with every other variable. The only reason to want to defer them
1698 at all is that, after sorting, we can more efficiently pack
1699 small variables in the stack frame. Continue to defer at -O2. */
1700 if (toplevel && optimize < 2)
1701 return false;
1703 /* Without optimization, *most* variables are allocated from the
1704 stack, which makes the quadratic problem large exactly when we
1705 want compilation to proceed as quickly as possible. On the
1706 other hand, we don't want the function's stack frame size to
1707 get completely out of hand. So we avoid adding scalars and
1708 "small" aggregates to the list at all. */
1709 if (optimize == 0 && smallish)
1710 return false;
1712 return true;
1715 /* A subroutine of expand_used_vars. Expand one variable according to
1716 its flavor. Variables to be placed on the stack are not actually
1717 expanded yet, merely recorded.
1718 When REALLY_EXPAND is false, only add stack values to be allocated.
1719 Return stack usage this variable is supposed to take.
1722 static poly_uint64
1723 expand_one_var (tree var, bool toplevel, bool really_expand,
1724 bitmap forced_stack_var = NULL)
1726 unsigned int align = BITS_PER_UNIT;
1727 tree origvar = var;
1729 var = SSAVAR (var);
1731 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1733 if (is_global_var (var))
1734 return 0;
1736 /* Because we don't know if VAR will be in register or on stack,
1737 we conservatively assume it will be on stack even if VAR is
1738 eventually put into register after RA pass. For non-automatic
1739 variables, which won't be on stack, we collect alignment of
1740 type and ignore user specified alignment. Similarly for
1741 SSA_NAMEs for which use_register_for_decl returns true. */
1742 if (TREE_STATIC (var)
1743 || DECL_EXTERNAL (var)
1744 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1745 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1746 TYPE_MODE (TREE_TYPE (var)),
1747 TYPE_ALIGN (TREE_TYPE (var)));
1748 else if (DECL_HAS_VALUE_EXPR_P (var)
1749 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1750 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1751 or variables which were assigned a stack slot already by
1752 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1753 changed from the offset chosen to it. */
1754 align = crtl->stack_alignment_estimated;
1755 else
1756 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1758 /* If the variable alignment is very large we'll dynamicaly allocate
1759 it, which means that in-frame portion is just a pointer. */
1760 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1761 align = GET_MODE_ALIGNMENT (Pmode);
1764 record_alignment_for_reg_var (align);
1766 poly_uint64 size;
1767 if (TREE_CODE (origvar) == SSA_NAME)
1769 gcc_assert (!VAR_P (var)
1770 || (!DECL_EXTERNAL (var)
1771 && !DECL_HAS_VALUE_EXPR_P (var)
1772 && !TREE_STATIC (var)
1773 && TREE_TYPE (var) != error_mark_node
1774 && !DECL_HARD_REGISTER (var)
1775 && really_expand));
1777 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1779 else if (DECL_EXTERNAL (var))
1781 else if (DECL_HAS_VALUE_EXPR_P (var))
1783 else if (TREE_STATIC (var))
1785 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1787 else if (TREE_TYPE (var) == error_mark_node)
1789 if (really_expand)
1790 expand_one_error_var (var);
1792 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1794 if (really_expand)
1796 expand_one_hard_reg_var (var);
1797 if (!DECL_HARD_REGISTER (var))
1798 /* Invalid register specification. */
1799 expand_one_error_var (var);
1802 else if (use_register_for_decl (var)
1803 && (!forced_stack_var
1804 || !bitmap_bit_p (forced_stack_var, DECL_UID (var))))
1806 if (really_expand)
1807 expand_one_register_var (origvar);
1809 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1810 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1812 /* Reject variables which cover more than half of the address-space. */
1813 if (really_expand)
1815 if (DECL_NONLOCAL_FRAME (var))
1816 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1817 "total size of local objects is too large");
1818 else
1819 error_at (DECL_SOURCE_LOCATION (var),
1820 "size of variable %q+D is too large", var);
1821 expand_one_error_var (var);
1824 else if (defer_stack_allocation (var, toplevel))
1825 add_stack_var (origvar, really_expand);
1826 else
1828 if (really_expand)
1830 if (lookup_attribute ("naked",
1831 DECL_ATTRIBUTES (current_function_decl)))
1832 error ("cannot allocate stack for variable %q+D, naked function",
1833 var);
1835 expand_one_stack_var (origvar);
1837 return size;
1839 return 0;
1842 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1843 expanding variables. Those variables that can be put into registers
1844 are allocated pseudos; those that can't are put on the stack.
1846 TOPLEVEL is true if this is the outermost BLOCK. */
1848 static void
1849 expand_used_vars_for_block (tree block, bool toplevel, bitmap forced_stack_vars)
1851 tree t;
1853 /* Expand all variables at this level. */
1854 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1855 if (TREE_USED (t)
1856 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1857 || !DECL_NONSHAREABLE (t)))
1858 expand_one_var (t, toplevel, true, forced_stack_vars);
1860 /* Expand all variables at containing levels. */
1861 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1862 expand_used_vars_for_block (t, false, forced_stack_vars);
1865 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1866 and clear TREE_USED on all local variables. */
1868 static void
1869 clear_tree_used (tree block)
1871 tree t;
1873 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1874 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1875 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1876 || !DECL_NONSHAREABLE (t))
1877 TREE_USED (t) = 0;
1879 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1880 clear_tree_used (t);
1883 /* Examine TYPE and determine a bit mask of the following features. */
1885 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1886 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1887 #define SPCT_HAS_ARRAY 4
1888 #define SPCT_HAS_AGGREGATE 8
1890 static unsigned int
1891 stack_protect_classify_type (tree type)
1893 unsigned int ret = 0;
1894 tree t;
1896 switch (TREE_CODE (type))
1898 case ARRAY_TYPE:
1899 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1900 if (t == char_type_node
1901 || t == signed_char_type_node
1902 || t == unsigned_char_type_node)
1904 unsigned HOST_WIDE_INT max = param_ssp_buffer_size;
1905 unsigned HOST_WIDE_INT len;
1907 if (!TYPE_SIZE_UNIT (type)
1908 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1909 len = max;
1910 else
1911 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1913 if (len < max)
1914 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1915 else
1916 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1918 else
1919 ret = SPCT_HAS_ARRAY;
1920 break;
1922 case UNION_TYPE:
1923 case QUAL_UNION_TYPE:
1924 case RECORD_TYPE:
1925 ret = SPCT_HAS_AGGREGATE;
1926 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1927 if (TREE_CODE (t) == FIELD_DECL)
1928 ret |= stack_protect_classify_type (TREE_TYPE (t));
1929 break;
1931 default:
1932 break;
1935 return ret;
1938 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1939 part of the local stack frame. Remember if we ever return nonzero for
1940 any variable in this function. The return value is the phase number in
1941 which the variable should be allocated. */
1943 static int
1944 stack_protect_decl_phase (tree decl)
1946 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1947 int ret = 0;
1949 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1950 has_short_buffer = true;
1952 tree attribs = DECL_ATTRIBUTES (current_function_decl);
1953 if (!lookup_attribute ("no_stack_protector", attribs)
1954 && (flag_stack_protect == SPCT_FLAG_ALL
1955 || flag_stack_protect == SPCT_FLAG_STRONG
1956 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1957 && lookup_attribute ("stack_protect", attribs))))
1959 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1960 && !(bits & SPCT_HAS_AGGREGATE))
1961 ret = 1;
1962 else if (bits & SPCT_HAS_ARRAY)
1963 ret = 2;
1965 else
1966 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1968 if (ret)
1969 has_protected_decls = true;
1971 return ret;
1974 /* Two helper routines that check for phase 1 and phase 2. These are used
1975 as callbacks for expand_stack_vars. */
1977 static bool
1978 stack_protect_decl_phase_1 (size_t i)
1980 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1983 static bool
1984 stack_protect_decl_phase_2 (size_t i)
1986 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1989 /* And helper function that checks for asan phase (with stack protector
1990 it is phase 3). This is used as callback for expand_stack_vars.
1991 Returns true if any of the vars in the partition need to be protected. */
1993 static bool
1994 asan_decl_phase_3 (size_t i)
1996 while (i != EOC)
1998 if (asan_protect_stack_decl (stack_vars[i].decl))
1999 return true;
2000 i = stack_vars[i].next;
2002 return false;
2005 /* Ensure that variables in different stack protection phases conflict
2006 so that they are not merged and share the same stack slot.
2007 Return true if there are any address taken variables. */
2009 static bool
2010 add_stack_protection_conflicts (void)
2012 size_t i, j, n = stack_vars_num;
2013 unsigned char *phase;
2014 bool ret = false;
2016 phase = XNEWVEC (unsigned char, n);
2017 for (i = 0; i < n; ++i)
2019 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
2020 if (TREE_ADDRESSABLE (stack_vars[i].decl))
2021 ret = true;
2024 for (i = 0; i < n; ++i)
2026 unsigned char ph_i = phase[i];
2027 for (j = i + 1; j < n; ++j)
2028 if (ph_i != phase[j])
2029 add_stack_var_conflict (i, j);
2032 XDELETEVEC (phase);
2033 return ret;
2036 /* Create a decl for the guard at the top of the stack frame. */
2038 static void
2039 create_stack_guard (void)
2041 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
2042 VAR_DECL, NULL, ptr_type_node);
2043 TREE_THIS_VOLATILE (guard) = 1;
2044 TREE_USED (guard) = 1;
2045 expand_one_stack_var (guard);
2046 crtl->stack_protect_guard = guard;
2049 /* Prepare for expanding variables. */
2050 static void
2051 init_vars_expansion (void)
2053 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
2054 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
2056 /* A map from decl to stack partition. */
2057 decl_to_stack_part = new hash_map<tree, size_t>;
2059 /* Initialize local stack smashing state. */
2060 has_protected_decls = false;
2061 has_short_buffer = false;
2062 if (hwasan_sanitize_stack_p ())
2063 hwasan_record_frame_init ();
2066 /* Free up stack variable graph data. */
2067 static void
2068 fini_vars_expansion (void)
2070 bitmap_obstack_release (&stack_var_bitmap_obstack);
2071 if (stack_vars)
2072 XDELETEVEC (stack_vars);
2073 if (stack_vars_sorted)
2074 XDELETEVEC (stack_vars_sorted);
2075 stack_vars = NULL;
2076 stack_vars_sorted = NULL;
2077 stack_vars_alloc = stack_vars_num = 0;
2078 delete decl_to_stack_part;
2079 decl_to_stack_part = NULL;
2082 /* Make a fair guess for the size of the stack frame of the function
2083 in NODE. This doesn't have to be exact, the result is only used in
2084 the inline heuristics. So we don't want to run the full stack var
2085 packing algorithm (which is quadratic in the number of stack vars).
2086 Instead, we calculate the total size of all stack vars. This turns
2087 out to be a pretty fair estimate -- packing of stack vars doesn't
2088 happen very often. */
2090 HOST_WIDE_INT
2091 estimated_stack_frame_size (struct cgraph_node *node)
2093 poly_int64 size = 0;
2094 size_t i;
2095 tree var;
2096 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2098 push_cfun (fn);
2100 init_vars_expansion ();
2102 FOR_EACH_LOCAL_DECL (fn, i, var)
2103 if (auto_var_in_fn_p (var, fn->decl))
2104 size += expand_one_var (var, true, false);
2106 if (stack_vars_num > 0)
2108 /* Fake sorting the stack vars for account_stack_vars (). */
2109 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
2110 for (i = 0; i < stack_vars_num; ++i)
2111 stack_vars_sorted[i] = i;
2112 size += account_stack_vars ();
2115 fini_vars_expansion ();
2116 pop_cfun ();
2117 return estimated_poly_value (size);
2120 /* Check if the current function has calls that use a return slot. */
2122 static bool
2123 stack_protect_return_slot_p ()
2125 basic_block bb;
2127 FOR_ALL_BB_FN (bb, cfun)
2128 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2129 !gsi_end_p (gsi); gsi_next (&gsi))
2131 gimple *stmt = gsi_stmt (gsi);
2132 /* This assumes that calls to internal-only functions never
2133 use a return slot. */
2134 if (is_gimple_call (stmt)
2135 && !gimple_call_internal_p (stmt)
2136 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2137 gimple_call_fndecl (stmt)))
2138 return true;
2140 return false;
2143 /* Expand all variables used in the function. */
/* FORCED_STACK_VARS is passed through unchanged to expand_one_var and
   expand_used_vars_for_block.  The return value is VAR_END_SEQ, which is
   only assigned by the ASan/HWASan emit helpers called below and is
   otherwise NULL.  */
2145 static rtx_insn *
2146 expand_used_vars (bitmap forced_stack_vars)
2148 tree var, outer_block = DECL_INITIAL (current_function_decl);
2149 auto_vec<tree> maybe_local_decls;
2150 rtx_insn *var_end_seq = NULL;
2151 unsigned i;
2152 unsigned len;
2153 bool gen_stack_protect_signal = false;
2155 /* Compute the phase of the stack frame for this function. */
2157 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2158 int off = targetm.starting_frame_offset () % align;
2159 frame_phase = off ? align - off : 0;
2162 /* Set TREE_USED on all variables in the local_decls. */
2163 FOR_EACH_LOCAL_DECL (cfun, i, var)
2164 TREE_USED (var) = 1;
2165 /* Clear TREE_USED on all variables associated with a block scope. */
2166 clear_tree_used (DECL_INITIAL (current_function_decl));
2168 init_vars_expansion ();
2170 if (targetm.use_pseudo_pic_reg ())
2171 pic_offset_table_rtx = gen_reg_rtx (Pmode);
/* Expand every SSA partition except those recorded in
   SA.partitions_for_parm_default_defs.  */
2173 for (i = 0; i < SA.map->num_partitions; i++)
2175 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2176 continue;
2178 tree var = partition_to_var (SA.map, i);
2180 gcc_assert (!virtual_operand_p (var));
2182 expand_one_ssa_partition (var);
/* In SPCT_FLAG_STRONG mode a call that uses a return slot is by itself
   enough to request a stack guard (see the switch further down).  */
2185 if (flag_stack_protect == SPCT_FLAG_STRONG)
2186 gen_stack_protect_signal = stack_protect_return_slot_p ();
2188 /* At this point all variables on the local_decls with TREE_USED
2189 set are not associated with any block scope. Lay them out. */
/* Remember the current length: the add_local_decl calls inside the loop
   append past this point, and block_remove (0, len) afterwards drops the
   first LEN entries.  */
2191 len = vec_safe_length (cfun->local_decls);
2192 FOR_EACH_LOCAL_DECL (cfun, i, var)
2194 bool expand_now = false;
2196 /* Expanded above already. */
2197 if (is_gimple_reg (var))
2199 TREE_USED (var) = 0;
2200 goto next;
2202 /* We didn't set a block for static or extern because it's hard
2203 to tell the difference between a global variable (re)declared
2204 in a local scope, and one that's really declared there to
2205 begin with. And it doesn't really matter much, since we're
2206 not giving them stack space. Expand them now. */
2207 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2208 expand_now = true;
2210 /* Expand variables not associated with any block now. Those created by
2211 the optimizers could be live anywhere in the function. Those that
2212 could possibly have been scoped originally and detached from their
2213 block will have their allocation deferred so we coalesce them with
2214 others when optimization is enabled. */
2215 else if (TREE_USED (var))
2216 expand_now = true;
2218 /* Finally, mark all variables on the list as used. We'll use
2219 this in a moment when we expand those associated with scopes. */
2220 TREE_USED (var) = 1;
2222 if (expand_now)
2223 expand_one_var (var, true, true, forced_stack_vars);
2225 next:
2226 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2228 rtx rtl = DECL_RTL_IF_SET (var);
2230 /* Keep artificial non-ignored vars in cfun->local_decls
2231 chain until instantiate_decls. */
2232 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2233 add_local_decl (cfun, var);
2234 else if (rtl == NULL_RTX)
2235 /* If rtl isn't set yet, which can happen e.g. with
2236 -fstack-protector, retry before returning from this
2237 function. */
2238 maybe_local_decls.safe_push (var);
2242 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2244 +-----------------+-----------------+
2245 | ...processed... | ...duplicates...|
2246 +-----------------+-----------------+
2248 +-- LEN points here.
2250 We just want the duplicates, as those are the artificial
2251 non-ignored vars that we want to keep until instantiate_decls.
2252 Move them down and truncate the array. */
2253 if (!vec_safe_is_empty (cfun->local_decls))
2254 cfun->local_decls->block_remove (0, len);
2256 /* At this point, all variables within the block tree with TREE_USED
2257 set are actually used by the optimized function. Lay them out. */
2258 expand_used_vars_for_block (outer_block, true, forced_stack_vars);
2260 tree attribs = DECL_ATTRIBUTES (current_function_decl);
2261 if (stack_vars_num > 0)
2263 bool has_addressable_vars = false;
2265 add_scope_conflicts ();
2267 /* If stack protection is enabled, we don't share space between
2268 vulnerable data and non-vulnerable data. */
2269 if (flag_stack_protect != 0
2270 && !lookup_attribute ("no_stack_protector", attribs)
2271 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2272 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2273 && lookup_attribute ("stack_protect", attribs))))
2274 has_addressable_vars = add_stack_protection_conflicts ();
2276 if (flag_stack_protect == SPCT_FLAG_STRONG && has_addressable_vars)
2277 gen_stack_protect_signal = true;
2279 /* Now that we have collected all stack variables, and have computed a
2280 minimal interference graph, attempt to save some stack space. */
2281 partition_stack_vars ();
2282 if (dump_file)
2283 dump_stack_var_partition ();
/* Decide whether to create the stack guard, based on the protection mode
   and on the function's attributes.  */
2287 if (!lookup_attribute ("no_stack_protector", attribs))
2288 switch (flag_stack_protect)
2290 case SPCT_FLAG_ALL:
2291 create_stack_guard ();
2292 break;
2294 case SPCT_FLAG_STRONG:
2295 if (gen_stack_protect_signal
2296 || cfun->calls_alloca
2297 || has_protected_decls
2298 || lookup_attribute ("stack_protect", attribs))
2299 create_stack_guard ();
2300 break;
2302 case SPCT_FLAG_DEFAULT:
2303 if (cfun->calls_alloca
2304 || has_protected_decls
2305 || lookup_attribute ("stack_protect", attribs))
2306 create_stack_guard ();
2307 break;
2309 case SPCT_FLAG_EXPLICIT:
2310 if (lookup_attribute ("stack_protect", attribs))
2311 create_stack_guard ();
2312 break;
2314 default:
2315 break;
2318 /* Assign rtl to each variable based on these partitions. */
2319 if (stack_vars_num > 0)
2321 class stack_vars_data data;
2323 data.asan_base = NULL_RTX;
2324 data.asan_alignb = 0;
2326 /* Reorder decls to be protected by iterating over the variables
2327 array multiple times, and allocating out of each phase in turn. */
2328 /* ??? We could probably integrate this into the qsort we did
2329 earlier, such that we naturally see these variables first,
2330 and thus naturally allocate things in the right order. */
2331 if (has_protected_decls)
2333 /* Phase 1 contains only character arrays. */
2334 expand_stack_vars (stack_protect_decl_phase_1, &data);
2336 /* Phase 2 contains other kinds of arrays. */
2337 if (!lookup_attribute ("no_stack_protector", attribs)
2338 && (flag_stack_protect == SPCT_FLAG_ALL
2339 || flag_stack_protect == SPCT_FLAG_STRONG
2340 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2341 && lookup_attribute ("stack_protect", attribs))))
2342 expand_stack_vars (stack_protect_decl_phase_2, &data);
2345 if (asan_sanitize_stack_p ())
2346 /* Phase 3, any partitions that need asan protection
2347 in addition to phase 1 and 2. */
2348 expand_stack_vars (asan_decl_phase_3, &data);
2350 /* ASAN description strings don't yet have a syntax for expressing
2351 polynomial offsets. */
2352 HOST_WIDE_INT prev_offset;
2353 if (!data.asan_vec.is_empty ()
2354 && frame_offset.is_constant (&prev_offset))
2356 HOST_WIDE_INT offset, sz, redzonesz;
2357 redzonesz = ASAN_RED_ZONE_SIZE;
2358 sz = data.asan_vec[0] - prev_offset;
/* When the recorded alignment exceeds the default red zone (but is at
   most 4096) and SZ is large enough, grow the red zone so that SZ plus
   the red zone is a multiple of that alignment.  */
2359 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2360 && data.asan_alignb <= 4096
2361 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2362 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2363 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2364 /* Allocating a constant amount of space from a constant
2365 starting offset must give a constant result. */
2366 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2367 .to_constant ());
2368 data.asan_vec.safe_push (prev_offset);
2369 data.asan_vec.safe_push (offset);
2370 /* Leave space for alignment if STRICT_ALIGNMENT. */
2371 if (STRICT_ALIGNMENT)
2372 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2373 << ASAN_SHADOW_SHIFT)
2374 / BITS_PER_UNIT, 1);
2376 var_end_seq
2377 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2378 data.asan_base,
2379 data.asan_alignb,
2380 data.asan_vec.address (),
2381 data.asan_decl_vec.address (),
2382 data.asan_vec.length ());
/* NOTE(review): a NULL predicate presumably selects every partition not
   expanded by the phases above -- confirm against expand_stack_vars.  */
2385 expand_stack_vars (NULL, &data);
2388 if (hwasan_sanitize_stack_p ())
2389 hwasan_emit_prologue ();
2390 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2391 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2392 virtual_stack_vars_rtx,
2393 var_end_seq);
2394 else if (hwasan_sanitize_allocas_p () && cfun->calls_alloca)
2395 /* When using out-of-line instrumentation we only want to emit one function
2396 call for clearing the tags in a region of shadow stack. When there are
2397 alloca calls in this frame we want to emit a call using the
2398 virtual_stack_dynamic_rtx, but when not we use the hwasan_frame_extent
2399 rtx we created in expand_stack_vars. */
2400 var_end_seq = hwasan_emit_untag_frame (virtual_stack_dynamic_rtx,
2401 virtual_stack_vars_rtx);
2402 else if (hwasan_sanitize_stack_p ())
2403 /* If no variables were stored on the stack, `hwasan_get_frame_extent`
2404 will return NULL_RTX and hence `hwasan_emit_untag_frame` will return
2405 NULL (i.e. an empty sequence). */
2406 var_end_seq = hwasan_emit_untag_frame (hwasan_get_frame_extent (),
2407 virtual_stack_vars_rtx);
2409 fini_vars_expansion ();
2411 /* If there were any artificial non-ignored vars without rtl
2412 found earlier, see if deferred stack allocation hasn't assigned
2413 rtl to them. */
2414 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2416 rtx rtl = DECL_RTL_IF_SET (var);
2418 /* Keep artificial non-ignored vars in cfun->local_decls
2419 chain until instantiate_decls. */
2420 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2421 add_local_decl (cfun, var);
2424 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2425 if (STACK_ALIGNMENT_NEEDED)
2427 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2428 if (FRAME_GROWS_DOWNWARD)
2429 frame_offset = aligned_lower_bound (frame_offset, align);
2430 else
2431 frame_offset = aligned_upper_bound (frame_offset, align);
2434 return var_end_seq;
2438 /* If we need to produce a detailed dump, print the tree representation
2439 for STMT to the dump file. SINCE is the last RTX after which the RTL
2440 generated for STMT should have been appended. */
2442 static void
2443 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2445 if (dump_file && (dump_flags & TDF_DETAILS))
2447 fprintf (dump_file, "\n;; ");
2448 print_gimple_stmt (dump_file, stmt, 0,
2449 TDF_SLIM | (dump_flags & TDF_LINENO));
2450 fprintf (dump_file, "\n");
2452 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2456 /* Maps the blocks that do not contain tree labels to rtx labels. */
/* Looked up and filled in lazily by label_rtx_for_bb.  */
2458 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2460 /* Returns the label_rtx expression for a label starting basic block BB. */
2462 static rtx_code_label *
2463 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2465 if (bb->flags & BB_RTL)
2466 return block_label (bb);
2468 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2469 if (elt)
2470 return *elt;
2472 /* Find the tree label if it is present. */
2473 gimple_stmt_iterator gsi = gsi_start_bb (bb);
2474 glabel *lab_stmt;
2475 if (!gsi_end_p (gsi)
2476 && (lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi)))
2477 && !DECL_NONLOCAL (gimple_label_label (lab_stmt)))
2478 return jump_target_rtx (gimple_label_label (lab_stmt));
2480 rtx_code_label *l = gen_label_rtx ();
2481 lab_rtx_for_bb->put (bb, l);
2482 return l;
2486 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2487 of a basic block where we just expanded the conditional at the end,
2488 possibly clean up the CFG and instruction sequence. LAST is the
2489 last instruction before the just emitted jump sequence. */
/* Nothing is done unless the last emitted insn is a barrier.  In that
   case E is removed and every jump between LAST and the final
   unconditional jump is deleted.  */
2491 static void
2492 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2494 /* Special case: when jumpif decides that the condition is
2495 trivial it emits an unconditional jump (and the necessary
2496 barrier). But we still have two edges, the fallthru one is
2497 wrong. purge_dead_edges would clean this up later. Unfortunately
2498 we have to insert insns (and split edges) before
2499 find_many_sub_basic_blocks and hence before purge_dead_edges.
2500 But splitting edges might create new blocks which depend on the
2501 fact that if there are two edges there's no barrier. So the
2502 barrier would get lost and verify_flow_info would ICE. Instead
2503 of auditing all edge splitters to care for the barrier (which
2504 normally isn't there in a cleaned CFG), fix it here. */
2505 if (BARRIER_P (get_last_insn ()))
2507 rtx_insn *insn;
2508 remove_edge (e);
2509 /* Now, we have a single successor block, if we have insns to
2510 insert on the remaining edge we potentially will insert
2511 it at the end of this block (if the dest block isn't feasible)
2512 in order to avoid splitting the edge. This insertion will take
2513 place in front of the last jump. But we might have emitted
2514 multiple jumps (conditional and one unconditional) to the
2515 same destination. Inserting in front of the last one then
2516 is a problem. See PR 40021. We fix this by deleting all
2517 jumps except the last unconditional one. */
2518 insn = PREV_INSN (get_last_insn ());
2519 /* Make sure we have an unconditional jump. Otherwise we're
2520 confused. */
2521 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
/* Walk backwards from the insn before that final jump until LAST is
   reached.  INSN is moved to its predecessor first and the candidate is
   then examined as NEXT_INSN (insn).  A jump that is not a conditional
   jump must be followed by a barrier, which is deleted with it.  */
2522 for (insn = PREV_INSN (insn); insn != last;)
2524 insn = PREV_INSN (insn);
2525 if (JUMP_P (NEXT_INSN (insn)))
2527 if (!any_condjump_p (NEXT_INSN (insn)))
2529 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2530 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2532 delete_insn (NEXT_INSN (insn));
2538 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2539 Returns a new basic block if we've terminated the current basic
2540 block and created a new one. */
/* BB is the block that ends in STMT.  NULL is returned in the two cases
   where one of the successors is BB->next_bb and can simply fall through;
   otherwise the newly created block holding the jump to the false
   destination is returned.  */
2542 static basic_block
2543 expand_gimple_cond (basic_block bb, gcond *stmt)
2545 basic_block new_bb, dest;
2546 edge true_edge;
2547 edge false_edge;
2548 rtx_insn *last2, *last;
2549 enum tree_code code;
2550 tree op0, op1;
2552 code = gimple_cond_code (stmt);
2553 op0 = gimple_cond_lhs (stmt);
2554 op1 = gimple_cond_rhs (stmt);
2555 /* We're sometimes presented with such code:
2556 D.123_1 = x < y;
2557 if (D.123_1 != 0)
2559 This would expand to two comparisons which then later might
2560 be cleaned up by combine. But some pattern matchers like if-conversion
2561 work better when there's only one compare, so make up for this
2562 here as special exception if TER would have made the same change. */
2563 if (SA.values
2564 && TREE_CODE (op0) == SSA_NAME
2565 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2566 && TREE_CODE (op1) == INTEGER_CST
2567 && ((gimple_cond_code (stmt) == NE_EXPR
2568 && integer_zerop (op1))
2569 || (gimple_cond_code (stmt) == EQ_EXPR
2570 && integer_onep (op1)))
2571 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2573 gimple *second = SSA_NAME_DEF_STMT (op0);
2574 if (gimple_code (second) == GIMPLE_ASSIGN)
2576 enum tree_code code2 = gimple_assign_rhs_code (second);
/* The defining statement is itself a comparison: jump on it directly.  */
2577 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2579 code = code2;
2580 op0 = gimple_assign_rhs1 (second);
2581 op1 = gimple_assign_rhs2 (second);
2583 /* If jumps are cheap and the target does not support conditional
2584 compare, turn some more codes into jumpy sequences. */
2585 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2586 && targetm.gen_ccmp_first == NULL)
2588 if ((code2 == BIT_AND_EXPR
2589 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2590 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2591 || code2 == TRUTH_AND_EXPR)
2593 code = TRUTH_ANDIF_EXPR;
2594 op0 = gimple_assign_rhs1 (second);
2595 op1 = gimple_assign_rhs2 (second);
2597 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2599 code = TRUTH_ORIF_EXPR;
2600 op0 = gimple_assign_rhs1 (second);
2601 op1 = gimple_assign_rhs2 (second);
2607 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2608 into (x - C2) * C3 < C4. */
2609 if ((code == EQ_EXPR || code == NE_EXPR)
2610 && TREE_CODE (op0) == SSA_NAME
2611 && TREE_CODE (op1) == INTEGER_CST)
2612 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2614 /* Optimize (x - y) < 0 into x < y if x - y has undefined overflow. */
2615 if (!TYPE_UNSIGNED (TREE_TYPE (op0))
2616 && (code == LT_EXPR || code == LE_EXPR
2617 || code == GT_EXPR || code == GE_EXPR)
2618 && integer_zerop (op1)
2619 && TREE_CODE (op0) == SSA_NAME)
2620 maybe_optimize_sub_cmp_0 (code, &op0, &op1);
/* LAST2 keeps the insn preceding everything emitted for STMT (used for the
   dump at the end); LAST is reassigned in the two-jump case below.  */
2622 last2 = last = get_last_insn ();
2624 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2625 set_curr_insn_location (gimple_location (stmt));
2627 /* These flags have no purpose in RTL land. */
2628 true_edge->flags &= ~EDGE_TRUE_VALUE;
2629 false_edge->flags &= ~EDGE_FALSE_VALUE;
2631 /* We can either have a pure conditional jump with one fallthru edge or
2632 two-way jump that needs to be decomposed into two basic blocks. */
/* False destination is the next block: jump when true, fall through
   otherwise.  */
2633 if (false_edge->dest == bb->next_bb)
2635 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2636 true_edge->probability);
2637 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2638 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2639 set_curr_insn_location (true_edge->goto_locus);
2640 false_edge->flags |= EDGE_FALLTHRU;
2641 maybe_cleanup_end_of_block (false_edge, last);
2642 return NULL;
/* True destination is the next block: jump when false, fall through
   otherwise.  */
2644 if (true_edge->dest == bb->next_bb)
2646 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2647 false_edge->probability);
2648 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2649 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2650 set_curr_insn_location (false_edge->goto_locus);
2651 true_edge->flags |= EDGE_FALLTHRU;
2652 maybe_cleanup_end_of_block (true_edge, last);
2653 return NULL;
/* Neither destination is the next block: emit a conditional jump to the
   true destination followed by an unconditional jump to the false one,
   and place the latter in a new basic block.  */
2656 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2657 true_edge->probability);
2658 last = get_last_insn ();
2659 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2660 set_curr_insn_location (false_edge->goto_locus);
2661 emit_jump (label_rtx_for_bb (false_edge->dest));
/* BB now ends at the last insn of the conditional jump sequence, not
   counting a trailing barrier.  */
2663 BB_END (bb) = last;
2664 if (BARRIER_P (BB_END (bb)))
2665 BB_END (bb) = PREV_INSN (BB_END (bb));
2666 update_bb_for_insn (bb);
2668 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2669 dest = false_edge->dest;
2670 redirect_edge_succ (false_edge, new_bb);
2671 false_edge->flags |= EDGE_FALLTHRU;
2672 new_bb->count = false_edge->count ();
2673 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2674 add_bb_to_loop (new_bb, loop);
/* If BB was the latch of a loop headed by DEST, the new block now takes
   that role.  */
2675 if (loop->latch == bb
2676 && loop->header == dest)
2677 loop->latch = new_bb;
2678 make_single_succ_edge (new_bb, dest, 0);
2679 if (BARRIER_P (BB_END (new_bb)))
2680 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2681 update_bb_for_insn (new_bb);
2683 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2685 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2687 set_curr_insn_location (true_edge->goto_locus);
2688 true_edge->goto_locus = curr_insn_location ();
2691 return new_bb;
2694 /* Mark all calls that can have a transaction restart. */
2696 static void
2697 mark_transaction_restart_calls (gimple *stmt)
2699 struct tm_restart_node dummy;
2700 tm_restart_node **slot;
2702 if (!cfun->gimple_df->tm_restart)
2703 return;
2705 dummy.stmt = stmt;
2706 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2707 if (slot)
2709 struct tm_restart_node *n = *slot;
2710 tree list = n->label_or_list;
2711 rtx_insn *insn;
2713 for (insn = next_real_insn (get_last_insn ());
2714 !CALL_P (insn);
2715 insn = next_real_insn (insn))
2716 continue;
2718 if (TREE_CODE (list) == LABEL_DECL)
2719 add_reg_note (insn, REG_TM, label_rtx (list));
2720 else
2721 for (; list ; list = TREE_CHAIN (list))
2722 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2726 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2727 statement STMT. */
/* Internal calls, and built-in calls that can be replaced by an internal
   function, are handed to expand_internal_call.  Every other call is
   rebuilt as a CALL_EXPR tree and expanded through expand_assignment (when
   there is a lhs) or expand_expr.  */
2729 static void
2730 expand_call_stmt (gcall *stmt)
2732 tree exp, decl, lhs;
2733 bool builtin_p;
2734 size_t i;
2736 if (gimple_call_internal_p (stmt))
2738 expand_internal_call (stmt);
2739 return;
2742 /* If this is a call to a built-in function and it has no effect other
2743 than setting the lhs, try to implement it using an internal function
2744 instead. */
2745 decl = gimple_call_fndecl (stmt);
2746 if (gimple_call_lhs (stmt)
2747 && !gimple_has_side_effects (stmt)
2748 && (optimize || (decl && called_as_built_in (decl))))
2750 internal_fn ifn = replacement_internal_fn (stmt);
2751 if (ifn != IFN_LAST)
2753 expand_internal_call (ifn, stmt);
2754 return;
/* NOTE(review): the operand count is the argument count plus three,
   presumably for the fixed leading operands of a CALL_EXPR -- confirm
   against the CALL_EXPR definition.  */
2758 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2760 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2761 builtin_p = decl && fndecl_built_in_p (decl);
2763 /* If this is not a builtin function, the function type through which the
2764 call is made may be different from the type of the function. */
2765 if (!builtin_p)
2766 CALL_EXPR_FN (exp)
2767 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2768 CALL_EXPR_FN (exp));
2770 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2771 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2773 for (i = 0; i < gimple_call_num_args (stmt); i++)
2775 tree arg = gimple_call_arg (stmt, i);
2776 gimple *def;
2777 /* TER addresses into arguments of builtin functions so we have a
2778 chance to infer more correct alignment information. See PR39954. */
2779 if (builtin_p
2780 && TREE_CODE (arg) == SSA_NAME
2781 && (def = get_gimple_for_ssa_name (arg))
2782 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2783 arg = gimple_assign_rhs1 (def);
2784 CALL_EXPR_ARG (exp, i) = arg;
2787 if (gimple_has_side_effects (stmt)
2788 /* ??? Downstream in expand_expr_real_1 we assume that expressions
2789 w/o side-effects do not throw so work around this here. */
2790 || stmt_could_throw_p (cfun, stmt))
2791 TREE_SIDE_EFFECTS (exp) = 1;
2793 if (gimple_call_nothrow_p (stmt))
2794 TREE_NOTHROW (exp) = 1;
/* Copy the remaining per-call flags from the gimple call to the tree.  */
2796 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2797 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2798 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
/* Calls to alloca built-ins get CALL_ALLOCA_FOR_VAR_P; all other calls
   get CALL_FROM_THUNK_P instead.  */
2799 if (decl
2800 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2801 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2802 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2803 else
2804 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2805 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2806 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2807 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2809 /* Must come after copying location. */
2810 copy_warning (exp, stmt);
2812 /* Ensure RTL is created for debug args. */
2813 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2815 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2816 unsigned int ix;
2817 tree dtemp;
/* Only the odd-indexed entries of the vector are visited; each must be a
   DEBUG_EXPR_DECL.  */
2819 if (debug_args)
2820 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2822 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2823 expand_debug_expr (dtemp);
/* Remember the last insn emitted so far so that the backward search for
   the CALL insn below knows where to stop.  */
2827 rtx_insn *before_call = get_last_insn ();
2828 lhs = gimple_call_lhs (stmt);
2829 if (lhs)
2830 expand_assignment (lhs, exp, false);
2831 else
2832 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2834 /* If the gimple call is an indirect call and has 'nocf_check'
2835 attribute find a generated CALL insn to mark it as no
2836 control-flow verification is needed. */
2837 if (gimple_call_nocf_check_p (stmt)
2838 && !gimple_call_fndecl (stmt))
2840 rtx_insn *last = get_last_insn ();
2841 while (!CALL_P (last)
2842 && last != before_call)
2843 last = PREV_INSN (last);
2845 if (last != before_call)
2846 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2849 mark_transaction_restart_calls (stmt);
2853 /* Generate RTL for an asm statement (explicit assembler code).
2854 STRING is a STRING_CST node containing the assembler code text,
2855 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2856 insn is volatile; don't optimize it. */
2858 static void
2859 expand_asm_loc (tree string, int vol, location_t locus)
2861 rtx body;
2863 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2864 ggc_strdup (TREE_STRING_POINTER (string)),
2865 locus);
2867 MEM_VOLATILE_P (body) = vol;
2869 /* Non-empty basic ASM implicitly clobbers memory. */
2870 if (TREE_STRING_LENGTH (string) != 0)
2872 rtx asm_op, clob;
2873 unsigned i, nclobbers;
2874 auto_vec<rtx> input_rvec, output_rvec;
2875 auto_vec<machine_mode> input_mode;
2876 auto_vec<const char *> constraints;
2877 auto_vec<rtx> use_rvec;
2878 auto_vec<rtx> clobber_rvec;
2879 HARD_REG_SET clobbered_regs;
2880 CLEAR_HARD_REG_SET (clobbered_regs);
2882 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2883 clobber_rvec.safe_push (clob);
2885 if (targetm.md_asm_adjust)
2886 targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
2887 constraints, use_rvec, clobber_rvec,
2888 clobbered_regs, locus);
2890 asm_op = body;
2891 nclobbers = clobber_rvec.length ();
2892 auto nuses = use_rvec.length ();
2893 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nuses + nclobbers));
2895 i = 0;
2896 XVECEXP (body, 0, i++) = asm_op;
2897 for (rtx use : use_rvec)
2898 XVECEXP (body, 0, i++) = gen_rtx_USE (VOIDmode, use);
2899 for (rtx clobber : clobber_rvec)
2900 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobber);
2903 emit_insn (body);
/* Return the number of times character C occurs in the NUL-terminated
   string S.  The terminating NUL itself is never counted.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;

  for (const char *p = s; *p != '\0'; ++p)
    if (*p == c)
      ++count;

  return count;
}
2916 /* A subroutine of expand_asm_operands. Check that all operands have
2917 the same number of alternatives. Return true if so. */
2919 static bool
2920 check_operand_nalternatives (const vec<const char *> &constraints)
2922 unsigned len = constraints.length();
2923 if (len > 0)
2925 int nalternatives = n_occurrences (',', constraints[0]);
2927 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2929 error ("too many alternatives in %<asm%>");
2930 return false;
2933 for (unsigned i = 1; i < len; ++i)
2934 if (n_occurrences (',', constraints[i]) != nalternatives)
2936 error ("operand constraints for %<asm%> differ "
2937 "in number of alternatives");
2938 return false;
2941 return true;
2944 /* Check for overlap between registers marked in CLOBBERED_REGS and
2945 anything inappropriate in T. Emit error and return the register
2946 variable definition for error, NULL_TREE for ok. */
2948 static bool
2949 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs,
2950 location_t loc)
2952 /* Conflicts between asm-declared register variables and the clobber
2953 list are not allowed. */
2954 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2956 if (overlap)
2958 error_at (loc, "%<asm%> specifier for variable %qE conflicts with "
2959 "%<asm%> clobber list", DECL_NAME (overlap));
2961 /* Reset registerness to stop multiple errors emitted for a single
2962 variable. */
2963 DECL_REGISTER (overlap) = 0;
2964 return true;
2967 return false;
2970 /* Check that the given REGNO spanning NREGS is a valid
2971 asm clobber operand. Some HW registers cannot be
2972 saved/restored, hence they should not be clobbered by
2973 asm statements. */
2974 static bool
2975 asm_clobber_reg_is_valid (int regno, int nregs, const char *regname)
2977 bool is_valid = true;
2978 HARD_REG_SET regset;
2980 CLEAR_HARD_REG_SET (regset);
2982 add_range_to_hard_reg_set (&regset, regno, nregs);
2984 /* Clobbering the PIC register is an error. */
2985 if (PIC_OFFSET_TABLE_REGNUM != INVALID_REGNUM
2986 && overlaps_hard_reg_set_p (regset, Pmode, PIC_OFFSET_TABLE_REGNUM))
2988 /* ??? Diagnose during gimplification? */
2989 error ("PIC register clobbered by %qs in %<asm%>", regname);
2990 is_valid = false;
2992 else if (!in_hard_reg_set_p
2993 (accessible_reg_set, reg_raw_mode[regno], regno))
2995 /* ??? Diagnose during gimplification? */
2996 error ("the register %qs cannot be clobbered in %<asm%>"
2997 " for the current target", regname);
2998 is_valid = false;
3001 /* Clobbering the stack pointer register is deprecated. GCC expects
3002 the value of the stack pointer after an asm statement to be the same
3003 as it was before, so no asm can validly clobber the stack pointer in
3004 the usual sense. Adding the stack pointer to the clobber list has
3005 traditionally had some undocumented and somewhat obscure side-effects. */
3006 if (overlaps_hard_reg_set_p (regset, Pmode, STACK_POINTER_REGNUM))
3008 crtl->sp_is_clobbered_by_asm = true;
3009 if (warning (OPT_Wdeprecated, "listing the stack pointer register"
3010 " %qs in a clobber list is deprecated", regname))
3011 inform (input_location, "the value of the stack pointer after"
3012 " an %<asm%> statement must be the same as it was before"
3013 " the statement");
3016 return is_valid;
3019 /* Generate RTL for an asm statement with arguments.
3020 STRING is the instruction template.
3021 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
3022 Each output or input has an expression in the TREE_VALUE and
3023 a tree list in TREE_PURPOSE which in turn contains a constraint
3024 name in TREE_VALUE (or NULL_TREE) and a constraint string
3025 in TREE_PURPOSE.
3026 CLOBBERS is a list of STRING_CST nodes each naming a hard register
3027 that is clobbered by this insn.
3029 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
3030 should be the fallthru basic block of the asm goto.
3032 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
3033 Some elements of OUTPUTS may be replaced with trees representing temporary
3034 values. The caller should copy those temporary values to the originally
3035 specified lvalues.
3037 VOL nonzero means the insn is volatile; don't optimize it. */
3039 static void
3040 expand_asm_stmt (gasm *stmt)
3042 class save_input_location
3044 location_t old;
3046 public:
3047 explicit save_input_location(location_t where)
3049 old = input_location;
3050 input_location = where;
3053 ~save_input_location()
3055 input_location = old;
3059 location_t locus = gimple_location (stmt);
3061 if (gimple_asm_input_p (stmt))
3063 const char *s = gimple_asm_string (stmt);
3064 tree string = build_string (strlen (s), s);
3065 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
3066 return;
3069 /* There are some legacy diagnostics in here. */
3070 save_input_location s_i_l(locus);
3072 unsigned noutputs = gimple_asm_noutputs (stmt);
3073 unsigned ninputs = gimple_asm_ninputs (stmt);
3074 unsigned nlabels = gimple_asm_nlabels (stmt);
3075 unsigned i;
3076 bool error_seen = false;
3078 /* ??? Diagnose during gimplification? */
3079 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
3081 error_at (locus, "more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
3082 return;
3085 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
3086 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
3087 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
3089 /* Copy the gimple vectors into new vectors that we can manipulate. */
3091 output_tvec.safe_grow (noutputs, true);
3092 input_tvec.safe_grow (ninputs, true);
3093 constraints.safe_grow (noutputs + ninputs, true);
3095 for (i = 0; i < noutputs; ++i)
3097 tree t = gimple_asm_output_op (stmt, i);
3098 output_tvec[i] = TREE_VALUE (t);
3099 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3101 for (i = 0; i < ninputs; i++)
3103 tree t = gimple_asm_input_op (stmt, i);
3104 input_tvec[i] = TREE_VALUE (t);
3105 constraints[i + noutputs]
3106 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3109 /* ??? Diagnose during gimplification? */
3110 if (! check_operand_nalternatives (constraints))
3111 return;
3113 /* Count the number of meaningful clobbered registers, ignoring what
3114 we would ignore later. */
3115 auto_vec<rtx> clobber_rvec;
3116 HARD_REG_SET clobbered_regs;
3117 CLEAR_HARD_REG_SET (clobbered_regs);
3119 if (unsigned n = gimple_asm_nclobbers (stmt))
3121 clobber_rvec.reserve (n);
3122 for (i = 0; i < n; i++)
3124 tree t = gimple_asm_clobber_op (stmt, i);
3125 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
3126 int nregs, j;
3128 j = decode_reg_name_and_count (regname, &nregs);
3129 if (j < 0)
3131 if (j == -2)
3133 /* ??? Diagnose during gimplification? */
3134 error_at (locus, "unknown register name %qs in %<asm%>",
3135 regname);
3136 error_seen = true;
3138 else if (j == -4)
3140 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
3141 clobber_rvec.safe_push (x);
3143 else
3145 /* Otherwise we should have -1 == empty string
3146 or -3 == cc, which is not a register. */
3147 gcc_assert (j == -1 || j == -3);
3150 else
3151 for (int reg = j; reg < j + nregs; reg++)
3153 if (!asm_clobber_reg_is_valid (reg, nregs, regname))
3154 return;
3156 SET_HARD_REG_BIT (clobbered_regs, reg);
3157 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
3158 clobber_rvec.safe_push (x);
3163 /* First pass over inputs and outputs checks validity and sets
3164 mark_addressable if needed. */
3165 /* ??? Diagnose during gimplification? */
3167 for (i = 0; i < noutputs; ++i)
3169 tree val = output_tvec[i];
3170 tree type = TREE_TYPE (val);
3171 const char *constraint;
3172 bool is_inout;
3173 bool allows_reg;
3174 bool allows_mem;
3176 /* Try to parse the output constraint. If that fails, there's
3177 no point in going further. */
3178 constraint = constraints[i];
3179 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3180 &allows_mem, &allows_reg, &is_inout))
3181 return;
3183 /* If the output is a hard register, verify it doesn't conflict with
3184 any other operand's possible hard register use. */
3185 if (DECL_P (val)
3186 && REG_P (DECL_RTL (val))
3187 && HARD_REGISTER_P (DECL_RTL (val)))
3189 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3190 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3191 unsigned long match;
3193 /* Verify the other outputs do not use the same hard register. */
3194 for (j = i + 1; j < noutputs; ++j)
3195 if (DECL_P (output_tvec[j])
3196 && REG_P (DECL_RTL (output_tvec[j]))
3197 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3198 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3200 error_at (locus, "invalid hard register usage between output "
3201 "operands");
3202 error_seen = true;
3205 /* Verify matching constraint operands use the same hard register
3206 and that the non-matching constraint operands do not use the same
3207 hard register if the output is an early clobber operand. */
3208 for (j = 0; j < ninputs; ++j)
3209 if (DECL_P (input_tvec[j])
3210 && REG_P (DECL_RTL (input_tvec[j]))
3211 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3213 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
3214 switch (*constraints[j + noutputs])
3216 case '0': case '1': case '2': case '3': case '4':
3217 case '5': case '6': case '7': case '8': case '9':
3218 match = strtoul (constraints[j + noutputs], NULL, 10);
3219 break;
3220 default:
3221 match = ULONG_MAX;
3222 break;
3224 if (i == match
3225 && output_hregno != input_hregno)
3227 error_at (locus, "invalid hard register usage between "
3228 "output operand and matching constraint operand");
3229 error_seen = true;
3231 else if (early_clobber_p
3232 && i != match
3233 && output_hregno == input_hregno)
3235 error_at (locus, "invalid hard register usage between "
3236 "earlyclobber operand and input operand");
3237 error_seen = true;
3242 if (! allows_reg
3243 && (allows_mem
3244 || is_inout
3245 || (DECL_P (val)
3246 && REG_P (DECL_RTL (val))
3247 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3248 mark_addressable (val);
3251 for (i = 0; i < ninputs; ++i)
3253 bool allows_reg, allows_mem;
3254 const char *constraint;
3256 constraint = constraints[i + noutputs];
3257 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3258 constraints.address (),
3259 &allows_mem, &allows_reg))
3260 return;
3262 if (! allows_reg && allows_mem)
3263 mark_addressable (input_tvec[i]);
3266 /* Second pass evaluates arguments. */
3268 /* Make sure stack is consistent for asm goto. */
3269 if (nlabels > 0)
3270 do_pending_stack_adjust ();
3271 int old_generating_concat_p = generating_concat_p;
3273 /* Vector of RTX's of evaluated output operands. */
3274 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3275 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3276 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3278 output_rvec.safe_grow (noutputs, true);
3280 for (i = 0; i < noutputs; ++i)
3282 tree val = output_tvec[i];
3283 tree type = TREE_TYPE (val);
3284 bool is_inout, allows_reg, allows_mem, ok;
3285 rtx op;
3287 ok = parse_output_constraint (&constraints[i], i, ninputs,
3288 noutputs, &allows_mem, &allows_reg,
3289 &is_inout);
3290 gcc_assert (ok);
3292 /* If an output operand is not a decl or indirect ref and our constraint
3293 allows a register, make a temporary to act as an intermediate.
3294 Make the asm insn write into that, then we will copy it to
3295 the real output operand. Likewise for promoted variables. */
3297 generating_concat_p = 0;
3299 gcc_assert (TREE_CODE (val) != INDIRECT_REF);
3300 if (((TREE_CODE (val) == MEM_REF
3301 && TREE_CODE (TREE_OPERAND (val, 0)) != ADDR_EXPR)
3302 && allows_mem)
3303 || (DECL_P (val)
3304 && (allows_mem || REG_P (DECL_RTL (val)))
3305 && ! (REG_P (DECL_RTL (val))
3306 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3307 || ! allows_reg
3308 || is_inout
3309 || TREE_ADDRESSABLE (type)
3310 || (!tree_fits_poly_int64_p (TYPE_SIZE (type))
3311 && !known_size_p (max_int_size_in_bytes (type))))
3313 op = expand_expr (val, NULL_RTX, VOIDmode,
3314 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3315 if (MEM_P (op))
3316 op = validize_mem (op);
3318 if (! allows_reg && !MEM_P (op))
3320 error_at (locus, "output number %d not directly addressable", i);
3321 error_seen = true;
3323 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3324 || GET_CODE (op) == CONCAT)
3326 rtx old_op = op;
3327 op = gen_reg_rtx (GET_MODE (op));
3329 generating_concat_p = old_generating_concat_p;
3331 if (is_inout)
3332 emit_move_insn (op, old_op);
3334 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3335 emit_move_insn (old_op, op);
3336 after_rtl_seq = get_insns ();
3337 after_rtl_end = get_last_insn ();
3338 end_sequence ();
3341 else
3343 op = assign_temp (type, 0, 1);
3344 op = validize_mem (op);
3345 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3346 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3348 generating_concat_p = old_generating_concat_p;
3350 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3351 expand_assignment (val, make_tree (type, op), false);
3352 after_rtl_seq = get_insns ();
3353 after_rtl_end = get_last_insn ();
3354 end_sequence ();
3356 output_rvec[i] = op;
3358 if (is_inout)
3359 inout_opnum.safe_push (i);
3362 const char *str = gimple_asm_string (stmt);
3363 if (error_seen)
3365 ninputs = 0;
3366 noutputs = 0;
3367 inout_opnum.truncate (0);
3368 output_rvec.truncate (0);
3369 clobber_rvec.truncate (0);
3370 constraints.truncate (0);
3371 CLEAR_HARD_REG_SET (clobbered_regs);
3372 str = "";
3375 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3376 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3378 input_rvec.safe_grow (ninputs, true);
3379 input_mode.safe_grow (ninputs, true);
3381 generating_concat_p = 0;
3383 for (i = 0; i < ninputs; ++i)
3385 tree val = input_tvec[i];
3386 tree type = TREE_TYPE (val);
3387 bool allows_reg, allows_mem, ok;
3388 const char *constraint;
3389 rtx op;
3391 constraint = constraints[i + noutputs];
3392 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3393 constraints.address (),
3394 &allows_mem, &allows_reg);
3395 gcc_assert (ok);
3397 /* EXPAND_INITIALIZER will not generate code for valid initializer
3398 constants, but will still generate code for other types of operand.
3399 This is the behavior we want for constant constraints. */
3400 op = expand_expr (val, NULL_RTX, VOIDmode,
3401 allows_reg ? EXPAND_NORMAL
3402 : allows_mem ? EXPAND_MEMORY
3403 : EXPAND_INITIALIZER);
3405 /* Never pass a CONCAT to an ASM. */
3406 if (GET_CODE (op) == CONCAT)
3407 op = force_reg (GET_MODE (op), op);
3408 else if (MEM_P (op))
3409 op = validize_mem (op);
3411 if (asm_operand_ok (op, constraint, NULL) <= 0)
3413 if (allows_reg && TYPE_MODE (type) != BLKmode)
3414 op = force_reg (TYPE_MODE (type), op);
3415 else if (!allows_mem)
3416 warning_at (locus, 0, "%<asm%> operand %d probably does not match "
3417 "constraints", i + noutputs);
3418 else if (MEM_P (op))
3420 /* We won't recognize either volatile memory or memory
3421 with a queued address as available a memory_operand
3422 at this point. Ignore it: clearly this *is* a memory. */
3424 else
3425 gcc_unreachable ();
3427 input_rvec[i] = op;
3428 input_mode[i] = TYPE_MODE (type);
3431 /* For in-out operands, copy output rtx to input rtx. */
3432 unsigned ninout = inout_opnum.length ();
3433 for (i = 0; i < ninout; i++)
3435 int j = inout_opnum[i];
3436 rtx o = output_rvec[j];
3438 input_rvec.safe_push (o);
3439 input_mode.safe_push (GET_MODE (o));
3441 char buffer[16];
3442 sprintf (buffer, "%d", j);
3443 constraints.safe_push (ggc_strdup (buffer));
3445 ninputs += ninout;
3447 /* Sometimes we wish to automatically clobber registers across an asm.
3448 Case in point is when the i386 backend moved from cc0 to a hard reg --
3449 maintaining source-level compatibility means automatically clobbering
3450 the flags register. */
3451 rtx_insn *after_md_seq = NULL;
3452 auto_vec<rtx> use_rvec;
3453 if (targetm.md_asm_adjust)
3454 after_md_seq
3455 = targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
3456 constraints, use_rvec, clobber_rvec,
3457 clobbered_regs, locus);
3459 /* Do not allow the hook to change the output and input count,
3460 lest it mess up the operand numbering. */
3461 gcc_assert (output_rvec.length() == noutputs);
3462 gcc_assert (input_rvec.length() == ninputs);
3463 gcc_assert (constraints.length() == noutputs + ninputs);
3465 /* But it certainly can adjust the uses and clobbers. */
3466 unsigned nuses = use_rvec.length ();
3467 unsigned nclobbers = clobber_rvec.length ();
3469 /* Third pass checks for easy conflicts. */
3470 /* ??? Why are we doing this on trees instead of rtx. */
3472 bool clobber_conflict_found = 0;
3473 for (i = 0; i < noutputs; ++i)
3474 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs, locus))
3475 clobber_conflict_found = 1;
3476 for (i = 0; i < ninputs - ninout; ++i)
3477 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs, locus))
3478 clobber_conflict_found = 1;
3480 /* Make vectors for the expression-rtx, constraint strings,
3481 and named operands. */
3483 rtvec argvec = rtvec_alloc (ninputs);
3484 rtvec constraintvec = rtvec_alloc (ninputs);
3485 rtvec labelvec = rtvec_alloc (nlabels);
3487 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3488 : GET_MODE (output_rvec[0])),
3489 ggc_strdup (str),
3490 "", 0, argvec, constraintvec,
3491 labelvec, locus);
3492 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3494 for (i = 0; i < ninputs; ++i)
3496 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3497 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3498 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3499 constraints[i + noutputs],
3500 locus);
3503 /* Copy labels to the vector. */
3504 rtx_code_label *fallthru_label = NULL;
3505 if (nlabels > 0)
3507 basic_block fallthru_bb = NULL;
3508 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3509 if (fallthru)
3510 fallthru_bb = fallthru->dest;
3512 for (i = 0; i < nlabels; ++i)
3514 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3515 rtx_insn *r;
3516 /* If asm goto has any labels in the fallthru basic block, use
3517 a label that we emit immediately after the asm goto. Expansion
3518 may insert further instructions into the same basic block after
3519 asm goto and if we don't do this, insertion of instructions on
3520 the fallthru edge might misbehave. See PR58670. */
3521 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3523 if (fallthru_label == NULL_RTX)
3524 fallthru_label = gen_label_rtx ();
3525 r = fallthru_label;
3527 else
3528 r = label_rtx (label);
3529 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3533 /* Now, for each output, construct an rtx
3534 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3535 ARGVEC CONSTRAINTS OPNAMES))
3536 If there is more than one, put them inside a PARALLEL. */
3538 if (noutputs == 0 && nuses == 0 && nclobbers == 0)
3540 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3541 if (nlabels > 0)
3542 emit_jump_insn (body);
3543 else
3544 emit_insn (body);
3546 else if (noutputs == 1 && nuses == 0 && nclobbers == 0)
3548 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3549 if (nlabels > 0)
3550 emit_jump_insn (gen_rtx_SET (output_rvec[0], body));
3551 else
3552 emit_insn (gen_rtx_SET (output_rvec[0], body));
3554 else
3556 rtx obody = body;
3557 int num = noutputs;
3559 if (num == 0)
3560 num = 1;
3562 body = gen_rtx_PARALLEL (VOIDmode,
3563 rtvec_alloc (num + nuses + nclobbers));
3565 /* For each output operand, store a SET. */
3566 for (i = 0; i < noutputs; ++i)
3568 rtx src, o = output_rvec[i];
3569 if (i == 0)
3571 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3572 src = obody;
3574 else
3576 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3577 ASM_OPERANDS_TEMPLATE (obody),
3578 constraints[i], i, argvec,
3579 constraintvec, labelvec, locus);
3580 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3582 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3585 /* If there are no outputs (but there are some clobbers)
3586 store the bare ASM_OPERANDS into the PARALLEL. */
3587 if (i == 0)
3588 XVECEXP (body, 0, i++) = obody;
3590 /* Add the uses specified by the target hook. No checking should
3591 be needed since this doesn't come directly from user code. */
3592 for (rtx use : use_rvec)
3593 XVECEXP (body, 0, i++) = gen_rtx_USE (VOIDmode, use);
3595 /* Store (clobber REG) for each clobbered register specified. */
3596 for (unsigned j = 0; j < nclobbers; ++j)
3598 rtx clobbered_reg = clobber_rvec[j];
3600 /* Do sanity check for overlap between clobbers and respectively
3601 input and outputs that hasn't been handled. Such overlap
3602 should have been detected and reported above. */
3603 if (!clobber_conflict_found && REG_P (clobbered_reg))
3605 /* We test the old body (obody) contents to avoid
3606 tripping over the under-construction body. */
3607 for (unsigned k = 0; k < noutputs; ++k)
3608 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3609 internal_error ("%<asm%> clobber conflict with "
3610 "output operand");
3612 for (unsigned k = 0; k < ninputs - ninout; ++k)
3613 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3614 internal_error ("%<asm%> clobber conflict with "
3615 "input operand");
3618 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3621 if (nlabels > 0)
3622 emit_jump_insn (body);
3623 else
3624 emit_insn (body);
3627 generating_concat_p = old_generating_concat_p;
3629 if (fallthru_label)
3630 emit_label (fallthru_label);
3632 if (after_md_seq)
3633 emit_insn (after_md_seq);
3634 if (after_rtl_seq)
3636 if (nlabels == 0)
3637 emit_insn (after_rtl_seq);
3638 else
3640 edge e;
3641 edge_iterator ei;
3643 FOR_EACH_EDGE (e, ei, gimple_bb (stmt)->succs)
3645 start_sequence ();
3646 for (rtx_insn *curr = after_rtl_seq;
3647 curr != NULL_RTX;
3648 curr = NEXT_INSN (curr))
3649 emit_insn (copy_insn (PATTERN (curr)));
3650 rtx_insn *copy = get_insns ();
3651 end_sequence ();
3652 insert_insn_on_edge (copy, e);
3657 free_temp_slots ();
3658 crtl->has_asm_statement = 1;
3661 /* Emit code to jump to the address
3662 specified by the pointer expression EXP. */
3664 static void
3665 expand_computed_goto (tree exp)
3667 rtx x = expand_normal (exp);
3669 do_pending_stack_adjust ();
3670 emit_indirect_jump (x);
3673 /* Generate RTL code for a `goto' statement with target label LABEL.
3674 LABEL should be a LABEL_DECL tree node that was or will later be
3675 defined with `expand_label'. */
3677 static void
3678 expand_goto (tree label)
3680 if (flag_checking)
3682 /* Check for a nonlocal goto to a containing function. Should have
3683 gotten translated to __builtin_nonlocal_goto. */
3684 tree context = decl_function_context (label);
3685 gcc_assert (!context || context == current_function_decl);
3688 emit_jump (jump_target_rtx (label));
3691 /* Output a return with no value. */
3693 static void
3694 expand_null_return_1 (void)
3696 clear_pending_stack_adjust ();
3697 do_pending_stack_adjust ();
3698 emit_jump (return_label);
3701 /* Generate RTL to return from the current function, with no value.
3702 (That is, we do not do anything about returning any value.) */
3704 void
3705 expand_null_return (void)
3707 /* If this function was declared to return a value, but we
3708 didn't, clobber the return registers so that they are not
3709 propagated live to the rest of the function. */
3710 clobber_return_register ();
3712 expand_null_return_1 ();
3715 /* Generate RTL to return from the current function, with value VAL. */
3717 static void
3718 expand_value_return (rtx val)
3720 /* Copy the value to the return location unless it's already there. */
3722 tree decl = DECL_RESULT (current_function_decl);
3723 rtx return_reg = DECL_RTL (decl);
3724 if (return_reg != val)
3726 tree funtype = TREE_TYPE (current_function_decl);
3727 tree type = TREE_TYPE (decl);
3728 int unsignedp = TYPE_UNSIGNED (type);
3729 machine_mode old_mode = DECL_MODE (decl);
3730 machine_mode mode;
3731 if (DECL_BY_REFERENCE (decl))
3732 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3733 else
3734 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3736 if (mode != old_mode)
3738 /* Some ABIs require scalar floating point modes to be returned
3739 in a wider scalar integer mode. We need to explicitly
3740 reinterpret to an integer mode of the correct precision
3741 before extending to the desired result. */
3742 if (SCALAR_INT_MODE_P (mode)
3743 && SCALAR_FLOAT_MODE_P (old_mode)
3744 && known_gt (GET_MODE_SIZE (mode), GET_MODE_SIZE (old_mode)))
3745 val = convert_float_to_wider_int (mode, old_mode, val);
3746 else
3747 val = convert_modes (mode, old_mode, val, unsignedp);
3750 if (GET_CODE (return_reg) == PARALLEL)
3751 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3752 else
3753 emit_move_insn (return_reg, val);
3756 expand_null_return_1 ();
3759 /* Generate RTL to evaluate the expression RETVAL and return it
3760 from the current function. */
3762 static void
3763 expand_return (tree retval)
3765 rtx result_rtl;
3766 rtx val = 0;
3767 tree retval_rhs;
3769 /* If function wants no value, give it none. */
3770 if (VOID_TYPE_P (TREE_TYPE (TREE_TYPE (current_function_decl))))
3772 expand_normal (retval);
3773 expand_null_return ();
3774 return;
3777 if (retval == error_mark_node)
3779 /* Treat this like a return of no value from a function that
3780 returns a value. */
3781 expand_null_return ();
3782 return;
3784 else if ((TREE_CODE (retval) == MODIFY_EXPR
3785 || TREE_CODE (retval) == INIT_EXPR)
3786 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3787 retval_rhs = TREE_OPERAND (retval, 1);
3788 else
3789 retval_rhs = retval;
3791 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3793 /* If we are returning the RESULT_DECL, then the value has already
3794 been stored into it, so we don't have to do anything special. */
3795 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3796 expand_value_return (result_rtl);
3798 /* If the result is an aggregate that is being returned in one (or more)
3799 registers, load the registers here. */
3801 else if (retval_rhs != 0
3802 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3803 && REG_P (result_rtl))
3805 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3806 if (val)
3808 /* Use the mode of the result value on the return register. */
3809 PUT_MODE (result_rtl, GET_MODE (val));
3810 expand_value_return (val);
3812 else
3813 expand_null_return ();
3815 else if (retval_rhs != 0
3816 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3817 && (REG_P (result_rtl)
3818 || (GET_CODE (result_rtl) == PARALLEL)))
3820 /* Compute the return value into a temporary (usually a pseudo reg). */
3822 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3823 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3824 val = force_not_mem (val);
3825 expand_value_return (val);
3827 else
3829 /* No hard reg used; calculate value into hard return reg. */
3830 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3831 expand_value_return (result_rtl);
3835 /* Expand a clobber of LHS. If LHS is stored it in a multi-part
3836 register, tell the rtl optimizers that its value is no longer
3837 needed. */
3839 static void
3840 expand_clobber (tree lhs)
3842 if (DECL_P (lhs))
3844 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3845 if (decl_rtl && REG_P (decl_rtl))
3847 machine_mode decl_mode = GET_MODE (decl_rtl);
3848 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3849 REGMODE_NATURAL_SIZE (decl_mode)))
3850 emit_clobber (decl_rtl);
3855 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3856 STMT that doesn't require special handling for outgoing edges. That
3857 is no tailcalls and no GIMPLE_COND. */
3859 static void
3860 expand_gimple_stmt_1 (gimple *stmt)
3862 tree op0;
3864 set_curr_insn_location (gimple_location (stmt));
3866 switch (gimple_code (stmt))
3868 case GIMPLE_GOTO:
3869 op0 = gimple_goto_dest (stmt);
3870 if (TREE_CODE (op0) == LABEL_DECL)
3871 expand_goto (op0);
3872 else
3873 expand_computed_goto (op0);
3874 break;
3875 case GIMPLE_LABEL:
3876 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3877 break;
3878 case GIMPLE_NOP:
3879 case GIMPLE_PREDICT:
3880 break;
3881 case GIMPLE_SWITCH:
3883 gswitch *swtch = as_a <gswitch *> (stmt);
3884 if (gimple_switch_num_labels (swtch) == 1)
3885 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3886 else
3887 expand_case (swtch);
3889 break;
3890 case GIMPLE_ASM:
3891 expand_asm_stmt (as_a <gasm *> (stmt));
3892 break;
3893 case GIMPLE_CALL:
3894 expand_call_stmt (as_a <gcall *> (stmt));
3895 break;
3897 case GIMPLE_RETURN:
3899 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3901 /* If a return doesn't have a location, it very likely represents
3902 multiple user returns so we cannot let it inherit the location
3903 of the last statement of the previous basic block in RTL. */
3904 if (!gimple_has_location (stmt))
3905 set_curr_insn_location (cfun->function_end_locus);
3907 if (op0 && op0 != error_mark_node)
3909 tree result = DECL_RESULT (current_function_decl);
3911 /* If we are not returning the current function's RESULT_DECL,
3912 build an assignment to it. */
3913 if (op0 != result)
3915 /* I believe that a function's RESULT_DECL is unique. */
3916 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3918 /* ??? We'd like to use simply expand_assignment here,
3919 but this fails if the value is of BLKmode but the return
3920 decl is a register. expand_return has special handling
3921 for this combination, which eventually should move
3922 to common code. See comments there. Until then, let's
3923 build a modify expression :-/ */
3924 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3925 result, op0);
3929 if (!op0)
3930 expand_null_return ();
3931 else
3932 expand_return (op0);
3934 break;
3936 case GIMPLE_ASSIGN:
3938 gassign *assign_stmt = as_a <gassign *> (stmt);
3939 tree lhs = gimple_assign_lhs (assign_stmt);
3941 /* Tree expand used to fiddle with |= and &= of two bitfield
3942 COMPONENT_REFs here. This can't happen with gimple, the LHS
3943 of binary assigns must be a gimple reg. */
3945 if (TREE_CODE (lhs) != SSA_NAME
3946 || gimple_assign_rhs_class (assign_stmt) == GIMPLE_SINGLE_RHS)
3948 tree rhs = gimple_assign_rhs1 (assign_stmt);
3949 gcc_assert (gimple_assign_rhs_class (assign_stmt)
3950 == GIMPLE_SINGLE_RHS);
3951 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3952 /* Do not put locations on possibly shared trees. */
3953 && !is_gimple_min_invariant (rhs))
3954 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3955 if (TREE_CLOBBER_P (rhs))
3956 /* This is a clobber to mark the going out of scope for
3957 this LHS. */
3958 expand_clobber (lhs);
3959 else
3960 expand_assignment (lhs, rhs,
3961 gimple_assign_nontemporal_move_p (
3962 assign_stmt));
3964 else
3966 rtx target, temp;
3967 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3968 struct separate_ops ops;
3969 bool promoted = false;
3971 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3972 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3973 promoted = true;
3975 ops.code = gimple_assign_rhs_code (assign_stmt);
3976 ops.type = TREE_TYPE (lhs);
3977 switch (get_gimple_rhs_class (ops.code))
3979 case GIMPLE_TERNARY_RHS:
3980 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3981 /* Fallthru */
3982 case GIMPLE_BINARY_RHS:
3983 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3984 /* Fallthru */
3985 case GIMPLE_UNARY_RHS:
3986 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3987 break;
3988 default:
3989 gcc_unreachable ();
3991 ops.location = gimple_location (stmt);
3993 /* If we want to use a nontemporal store, force the value to
3994 register first. If we store into a promoted register,
3995 don't directly expand to target. */
3996 temp = nontemporal || promoted ? NULL_RTX : target;
3997 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3998 EXPAND_NORMAL);
4000 if (temp == target)
4002 else if (promoted)
4004 int unsignedp = SUBREG_PROMOTED_SIGN (target);
4005 /* If TEMP is a VOIDmode constant, use convert_modes to make
4006 sure that we properly convert it. */
4007 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
4009 temp = convert_modes (GET_MODE (target),
4010 TYPE_MODE (ops.type),
4011 temp, unsignedp);
4012 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
4013 GET_MODE (target), temp, unsignedp);
4016 convert_move (SUBREG_REG (target), temp, unsignedp);
4018 else if (nontemporal && emit_storent_insn (target, temp))
4020 else
4022 temp = force_operand (temp, target);
4023 if (temp != target)
4024 emit_move_insn (target, temp);
4028 break;
4030 default:
4031 gcc_unreachable ();
4035 /* Expand one gimple statement STMT and return the last RTL instruction
4036 before any of the newly generated ones.
4038 In addition to generating the necessary RTL instructions this also
4039 sets REG_EH_REGION notes if necessary and sets the current source
4040 location for diagnostics. */
4042 static rtx_insn *
4043 expand_gimple_stmt (gimple *stmt)
4045 location_t saved_location = input_location;
4046 rtx_insn *last = get_last_insn ();
4047 int lp_nr;
4049 gcc_assert (cfun);
4051 /* We need to save and restore the current source location so that errors
4052 discovered during expansion are emitted with the right location. But
4053 it would be better if the diagnostic routines used the source location
4054 embedded in the tree nodes rather than globals. */
4055 if (gimple_has_location (stmt))
4056 input_location = gimple_location (stmt);
4058 expand_gimple_stmt_1 (stmt);
4060 /* Free any temporaries used to evaluate this statement. */
4061 free_temp_slots ();
4063 input_location = saved_location;
4065 /* Mark all insns that may trap. */
4066 lp_nr = lookup_stmt_eh_lp (stmt);
4067 if (lp_nr)
4069 rtx_insn *insn;
4070 for (insn = next_real_insn (last); insn;
4071 insn = next_real_insn (insn))
4073 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
4074 /* If we want exceptions for non-call insns, any
4075 may_trap_p instruction may throw. */
4076 && GET_CODE (PATTERN (insn)) != CLOBBER
4077 && GET_CODE (PATTERN (insn)) != USE
4078 && insn_could_throw_p (insn))
4079 make_reg_eh_region_note (insn, 0, lp_nr);
4083 return last;
4086 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
4087 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
4088 generated a tail call (something that might be denied by the ABI
4089 rules governing the call; see calls.cc).
4091 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
4092 can still reach the rest of BB. The case here is __builtin_sqrt,
4093 where the NaN result goes through the external function (with a
4094 tailcall) and the normal result happens via a sqrt instruction. */
4096 static basic_block
4097 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
4099 rtx_insn *last2, *last;
4100 edge e;
4101 edge_iterator ei;
4102 profile_probability probability;
4104 last2 = last = expand_gimple_stmt (stmt);
4106 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
4107 if (CALL_P (last) && SIBLING_CALL_P (last))
4108 goto found;
4110 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4112 *can_fallthru = true;
4113 return NULL;
4115 found:
4116 /* ??? Wouldn't it be better to just reset any pending stack adjust?
4117 Any instructions emitted here are about to be deleted. */
4118 do_pending_stack_adjust ();
4120 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
4121 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
4122 EH or abnormal edges, we shouldn't have created a tail call in
4123 the first place. So it seems to me we should just be removing
4124 all edges here, or redirecting the existing fallthru edge to
4125 the exit block. */
4127 probability = profile_probability::never ();
4129 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
4131 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
4133 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
4134 e->dest->count -= e->count ();
4135 probability += e->probability;
4136 remove_edge (e);
4138 else
4139 ei_next (&ei);
4142 /* This is somewhat ugly: the call_expr expander often emits instructions
4143 after the sibcall (to perform the function return). These confuse the
4144 find_many_sub_basic_blocks code, so we need to get rid of these. */
4145 last = NEXT_INSN (last);
4146 gcc_assert (BARRIER_P (last));
4148 *can_fallthru = false;
4149 while (NEXT_INSN (last))
4151 /* For instance an sqrt builtin expander expands if with
4152 sibcall in the then and label for `else`. */
4153 if (LABEL_P (NEXT_INSN (last)))
4155 *can_fallthru = true;
4156 break;
4158 delete_insn (NEXT_INSN (last));
4161 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
4162 | EDGE_SIBCALL);
4163 e->probability = probability;
4164 BB_END (bb) = last;
4165 update_bb_for_insn (bb);
4167 if (NEXT_INSN (last))
4169 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
4171 last = BB_END (bb);
4172 if (BARRIER_P (last))
4173 BB_END (bb) = PREV_INSN (last);
4176 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4178 return bb;
4181 /* Return the difference between the floor and the truncated result of
4182 a signed division by OP1 with remainder MOD. */
4183 static rtx
4184 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4186 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
4187 return gen_rtx_IF_THEN_ELSE
4188 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4189 gen_rtx_IF_THEN_ELSE
4190 (mode, gen_rtx_LT (BImode,
4191 gen_rtx_DIV (mode, op1, mod),
4192 const0_rtx),
4193 constm1_rtx, const0_rtx),
4194 const0_rtx);
4197 /* Return the difference between the ceil and the truncated result of
4198 a signed division by OP1 with remainder MOD. */
4199 static rtx
4200 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4202 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
4203 return gen_rtx_IF_THEN_ELSE
4204 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4205 gen_rtx_IF_THEN_ELSE
4206 (mode, gen_rtx_GT (BImode,
4207 gen_rtx_DIV (mode, op1, mod),
4208 const0_rtx),
4209 const1_rtx, const0_rtx),
4210 const0_rtx);
4213 /* Return the difference between the ceil and the truncated result of
4214 an unsigned division by OP1 with remainder MOD. */
4215 static rtx
4216 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
4218 /* (mod != 0 ? 1 : 0) */
4219 return gen_rtx_IF_THEN_ELSE
4220 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4221 const1_rtx, const0_rtx);
4224 /* Return the difference between the rounded and the truncated result
4225 of a signed division by OP1 with remainder MOD. Halfway cases are
4226 rounded away from zero, rather than to the nearest even number. */
4227 static rtx
4228 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4230 /* (abs (mod) >= abs (op1) - abs (mod)
4231 ? (op1 / mod > 0 ? 1 : -1)
4232 : 0) */
4233 return gen_rtx_IF_THEN_ELSE
4234 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
4235 gen_rtx_MINUS (mode,
4236 gen_rtx_ABS (mode, op1),
4237 gen_rtx_ABS (mode, mod))),
4238 gen_rtx_IF_THEN_ELSE
4239 (mode, gen_rtx_GT (BImode,
4240 gen_rtx_DIV (mode, op1, mod),
4241 const0_rtx),
4242 const1_rtx, constm1_rtx),
4243 const0_rtx);
4246 /* Return the difference between the rounded and the truncated result
4247 of a unsigned division by OP1 with remainder MOD. Halfway cases
4248 are rounded away from zero, rather than to the nearest even
4249 number. */
4250 static rtx
4251 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4253 /* (mod >= op1 - mod ? 1 : 0) */
4254 return gen_rtx_IF_THEN_ELSE
4255 (mode, gen_rtx_GE (BImode, mod,
4256 gen_rtx_MINUS (mode, op1, mod)),
4257 const1_rtx, const0_rtx);
4260 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4261 any rtl. */
4263 static rtx
4264 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4265 addr_space_t as)
4267 #ifndef POINTERS_EXTEND_UNSIGNED
4268 gcc_assert (mode == Pmode
4269 || mode == targetm.addr_space.address_mode (as));
4270 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4271 #else
4272 rtx temp;
4274 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
4276 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4277 return x;
4279 /* X must have some form of address mode already. */
4280 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
4281 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4282 x = lowpart_subreg (mode, x, xmode);
4283 else if (POINTERS_EXTEND_UNSIGNED > 0)
4284 x = gen_rtx_ZERO_EXTEND (mode, x);
4285 else if (!POINTERS_EXTEND_UNSIGNED)
4286 x = gen_rtx_SIGN_EXTEND (mode, x);
4287 else
4289 switch (GET_CODE (x))
4291 case SUBREG:
4292 if ((SUBREG_PROMOTED_VAR_P (x)
4293 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4294 || (GET_CODE (SUBREG_REG (x)) == PLUS
4295 && REG_P (XEXP (SUBREG_REG (x), 0))
4296 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4297 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4298 && GET_MODE (SUBREG_REG (x)) == mode)
4299 return SUBREG_REG (x);
4300 break;
4301 case LABEL_REF:
4302 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4303 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4304 return temp;
4305 case SYMBOL_REF:
4306 temp = shallow_copy_rtx (x);
4307 PUT_MODE (temp, mode);
4308 return temp;
4309 case CONST:
4310 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4311 if (temp)
4312 temp = gen_rtx_CONST (mode, temp);
4313 return temp;
4314 case PLUS:
4315 case MINUS:
4316 if (CONST_INT_P (XEXP (x, 1)))
4318 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4319 if (temp)
4320 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4322 break;
4323 default:
4324 break;
4326 /* Don't know how to express ptr_extend as operation in debug info. */
4327 return NULL;
4329 #endif /* POINTERS_EXTEND_UNSIGNED */
4331 return x;
4334 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4335 by avoid_deep_ter_for_debug. */
4337 static hash_map<tree, tree> *deep_ter_debug_map;
4339 /* Split too deep TER chains for debug stmts using debug temporaries. */
4341 static void
4342 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4344 use_operand_p use_p;
4345 ssa_op_iter iter;
4346 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4348 tree use = USE_FROM_PTR (use_p);
4349 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4350 continue;
4351 gimple *g = get_gimple_for_ssa_name (use);
4352 if (g == NULL)
4353 continue;
4354 if (depth > 6 && !stmt_ends_bb_p (g))
4356 if (deep_ter_debug_map == NULL)
4357 deep_ter_debug_map = new hash_map<tree, tree>;
4359 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4360 if (vexpr != NULL)
4361 continue;
4362 vexpr = build_debug_expr_decl (TREE_TYPE (use));
4363 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4364 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4365 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4366 avoid_deep_ter_for_debug (def_temp, 0);
4368 else
4369 avoid_deep_ter_for_debug (g, depth + 1);
4373 /* Return an RTX equivalent to the value of the parameter DECL. */
4375 static rtx
4376 expand_debug_parm_decl (tree decl)
4378 rtx incoming = DECL_INCOMING_RTL (decl);
4380 if (incoming
4381 && GET_MODE (incoming) != BLKmode
4382 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4383 || (MEM_P (incoming)
4384 && REG_P (XEXP (incoming, 0))
4385 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4387 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4389 #ifdef HAVE_window_save
4390 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4391 If the target machine has an explicit window save instruction, the
4392 actual entry value is the corresponding OUTGOING_REGNO instead. */
4393 if (REG_P (incoming)
4394 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4395 incoming
4396 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4397 OUTGOING_REGNO (REGNO (incoming)), 0);
4398 else if (MEM_P (incoming))
4400 rtx reg = XEXP (incoming, 0);
4401 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4403 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4404 incoming = replace_equiv_address_nv (incoming, reg);
4406 else
4407 incoming = copy_rtx (incoming);
4409 #endif
4411 ENTRY_VALUE_EXP (rtl) = incoming;
4412 return rtl;
4415 if (incoming
4416 && GET_MODE (incoming) != BLKmode
4417 && !TREE_ADDRESSABLE (decl)
4418 && MEM_P (incoming)
4419 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4420 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4421 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4422 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4423 return copy_rtx (incoming);
4425 return NULL_RTX;
4428 /* Return an RTX equivalent to the value of the tree expression EXP. */
4430 static rtx
4431 expand_debug_expr (tree exp)
4433 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4434 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4435 machine_mode inner_mode = VOIDmode;
4436 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4437 addr_space_t as;
4438 scalar_int_mode op0_mode, op1_mode, addr_mode;
4440 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4442 case tcc_expression:
4443 switch (TREE_CODE (exp))
4445 case COND_EXPR:
4446 case DOT_PROD_EXPR:
4447 case SAD_EXPR:
4448 case WIDEN_MULT_PLUS_EXPR:
4449 case WIDEN_MULT_MINUS_EXPR:
4450 goto ternary;
4452 case TRUTH_ANDIF_EXPR:
4453 case TRUTH_ORIF_EXPR:
4454 case TRUTH_AND_EXPR:
4455 case TRUTH_OR_EXPR:
4456 case TRUTH_XOR_EXPR:
4457 goto binary;
4459 case TRUTH_NOT_EXPR:
4460 goto unary;
4462 default:
4463 break;
4465 break;
4467 ternary:
4468 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4469 if (!op2)
4470 return NULL_RTX;
4471 /* Fall through. */
4473 binary:
4474 case tcc_binary:
4475 if (mode == BLKmode)
4476 return NULL_RTX;
4477 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4478 if (!op1)
4479 return NULL_RTX;
4480 switch (TREE_CODE (exp))
4482 case LSHIFT_EXPR:
4483 case RSHIFT_EXPR:
4484 case LROTATE_EXPR:
4485 case RROTATE_EXPR:
4486 case WIDEN_LSHIFT_EXPR:
4487 /* Ensure second operand isn't wider than the first one. */
4488 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4489 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4490 && (GET_MODE_UNIT_PRECISION (mode)
4491 < GET_MODE_PRECISION (op1_mode)))
4492 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4493 break;
4494 default:
4495 break;
4497 /* Fall through. */
4499 unary:
4500 case tcc_unary:
4501 if (mode == BLKmode)
4502 return NULL_RTX;
4503 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4504 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4505 if (!op0)
4506 return NULL_RTX;
4507 break;
4509 case tcc_comparison:
4510 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4511 goto binary;
4513 case tcc_type:
4514 case tcc_statement:
4515 gcc_unreachable ();
4517 case tcc_constant:
4518 case tcc_exceptional:
4519 case tcc_declaration:
4520 case tcc_reference:
4521 case tcc_vl_exp:
4522 break;
4525 switch (TREE_CODE (exp))
4527 case STRING_CST:
4528 if (!lookup_constant_def (exp))
4530 if (strlen (TREE_STRING_POINTER (exp)) + 1
4531 != (size_t) TREE_STRING_LENGTH (exp))
4532 return NULL_RTX;
4533 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4534 op0 = gen_rtx_MEM (BLKmode, op0);
4535 set_mem_attributes (op0, exp, 0);
4536 return op0;
4538 /* Fall through. */
4540 case INTEGER_CST:
4541 if (TREE_CODE (TREE_TYPE (exp)) == BITINT_TYPE
4542 && TYPE_MODE (TREE_TYPE (exp)) == BLKmode)
4543 return NULL;
4544 /* FALLTHRU */
4545 case REAL_CST:
4546 case FIXED_CST:
4547 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4548 return op0;
4550 case POLY_INT_CST:
4551 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4553 case COMPLEX_CST:
4554 gcc_assert (COMPLEX_MODE_P (mode));
4555 op0 = expand_debug_expr (TREE_REALPART (exp));
4556 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4557 return gen_rtx_CONCAT (mode, op0, op1);
4559 case DEBUG_EXPR_DECL:
4560 op0 = DECL_RTL_IF_SET (exp);
4562 if (op0)
4564 if (GET_MODE (op0) != mode)
4565 gcc_assert (VECTOR_TYPE_P (TREE_TYPE (exp)));
4566 else
4567 return op0;
4570 op0 = gen_rtx_DEBUG_EXPR (mode);
4571 DEBUG_EXPR_TREE_DECL (op0) = exp;
4572 SET_DECL_RTL (exp, op0);
4574 return op0;
4576 case VAR_DECL:
4577 case PARM_DECL:
4578 case FUNCTION_DECL:
4579 case LABEL_DECL:
4580 case CONST_DECL:
4581 case RESULT_DECL:
4582 op0 = DECL_RTL_IF_SET (exp);
4584 /* This decl was probably optimized away. */
4585 if (!op0
4586 /* At least label RTXen are sometimes replaced by
4587 NOTE_INSN_DELETED_LABEL. Any notes here are not
4588 handled by copy_rtx. */
4589 || NOTE_P (op0))
4591 if (!VAR_P (exp)
4592 || DECL_EXTERNAL (exp)
4593 || !TREE_STATIC (exp)
4594 || !DECL_NAME (exp)
4595 || DECL_HARD_REGISTER (exp)
4596 || DECL_IN_CONSTANT_POOL (exp)
4597 || mode == VOIDmode
4598 || symtab_node::get (exp) == NULL)
4599 return NULL;
4601 op0 = make_decl_rtl_for_debug (exp);
4602 if (!MEM_P (op0)
4603 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4604 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4605 return NULL;
4607 else if (VAR_P (exp)
4608 && is_global_var (exp)
4609 && symtab_node::get (exp) == NULL)
4610 return NULL;
4611 else
4612 op0 = copy_rtx (op0);
4614 if (GET_MODE (op0) == BLKmode
4615 /* If op0 is not BLKmode, but mode is, adjust_mode
4616 below would ICE. While it is likely a FE bug,
4617 try to be robust here. See PR43166. */
4618 || mode == BLKmode
4619 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4621 gcc_assert (MEM_P (op0));
4622 op0 = adjust_address_nv (op0, mode, 0);
4623 return op0;
4626 /* Fall through. */
4628 adjust_mode:
4629 case PAREN_EXPR:
4630 CASE_CONVERT:
4632 inner_mode = GET_MODE (op0);
4634 if (mode == inner_mode)
4635 return op0;
4637 if (inner_mode == VOIDmode)
4639 if (TREE_CODE (exp) == SSA_NAME)
4640 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4641 else
4642 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4643 if (mode == inner_mode)
4644 return op0;
4647 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4649 if (GET_MODE_UNIT_BITSIZE (mode)
4650 == GET_MODE_UNIT_BITSIZE (inner_mode))
4651 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4652 else if (GET_MODE_UNIT_BITSIZE (mode)
4653 < GET_MODE_UNIT_BITSIZE (inner_mode))
4654 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4655 else
4656 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4658 else if (FLOAT_MODE_P (mode))
4660 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4661 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4662 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4663 else
4664 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4666 else if (FLOAT_MODE_P (inner_mode))
4668 if (unsignedp)
4669 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4670 else
4671 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4673 else if (GET_MODE_UNIT_PRECISION (mode)
4674 == GET_MODE_UNIT_PRECISION (inner_mode))
4675 op0 = lowpart_subreg (mode, op0, inner_mode);
4676 else if (GET_MODE_UNIT_PRECISION (mode)
4677 < GET_MODE_UNIT_PRECISION (inner_mode))
4678 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4679 else if (UNARY_CLASS_P (exp)
4680 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4681 : unsignedp)
4682 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4683 else
4684 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4686 return op0;
4689 case MEM_REF:
4690 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4692 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4693 TREE_OPERAND (exp, 0),
4694 TREE_OPERAND (exp, 1));
4695 if (newexp)
4696 return expand_debug_expr (newexp);
4698 /* FALLTHROUGH */
4699 case INDIRECT_REF:
4700 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4701 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4702 if (!op0)
4703 return NULL;
4705 if (TREE_CODE (exp) == MEM_REF)
4707 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4708 || (GET_CODE (op0) == PLUS
4709 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4710 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4711 Instead just use get_inner_reference. */
4712 goto component_ref;
4714 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4715 poly_int64 offset;
4716 if (!op1 || !poly_int_rtx_p (op1, &offset))
4717 return NULL;
4719 op0 = plus_constant (inner_mode, op0, offset);
4722 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4724 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4725 op0, as);
4726 if (op0 == NULL_RTX)
4727 return NULL;
4729 op0 = gen_rtx_MEM (mode, op0);
4730 set_mem_attributes (op0, exp, 0);
4731 if (TREE_CODE (exp) == MEM_REF
4732 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4733 set_mem_expr (op0, NULL_TREE);
4734 set_mem_addr_space (op0, as);
4736 return op0;
4738 case TARGET_MEM_REF:
4739 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4740 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4741 return NULL;
4743 op0 = expand_debug_expr
4744 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4745 if (!op0)
4746 return NULL;
4748 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4749 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4750 op0, as);
4751 if (op0 == NULL_RTX)
4752 return NULL;
4754 op0 = gen_rtx_MEM (mode, op0);
4756 set_mem_attributes (op0, exp, 0);
4757 set_mem_addr_space (op0, as);
4759 return op0;
4761 component_ref:
4762 case ARRAY_REF:
4763 case ARRAY_RANGE_REF:
4764 case COMPONENT_REF:
4765 case BIT_FIELD_REF:
4766 case REALPART_EXPR:
4767 case IMAGPART_EXPR:
4768 case VIEW_CONVERT_EXPR:
4770 machine_mode mode1;
4771 poly_int64 bitsize, bitpos;
4772 tree offset;
4773 int reversep, volatilep = 0;
4774 tree tem
4775 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4776 &unsignedp, &reversep, &volatilep);
4777 rtx orig_op0;
4779 if (known_eq (bitsize, 0))
4780 return NULL;
4782 orig_op0 = op0 = expand_debug_expr (tem);
4784 if (!op0)
4785 return NULL;
4787 if (offset)
4789 machine_mode addrmode, offmode;
4791 if (!MEM_P (op0))
4792 return NULL;
4794 op0 = XEXP (op0, 0);
4795 addrmode = GET_MODE (op0);
4796 if (addrmode == VOIDmode)
4797 addrmode = Pmode;
4799 op1 = expand_debug_expr (offset);
4800 if (!op1)
4801 return NULL;
4803 offmode = GET_MODE (op1);
4804 if (offmode == VOIDmode)
4805 offmode = TYPE_MODE (TREE_TYPE (offset));
4807 if (addrmode != offmode)
4808 op1 = lowpart_subreg (addrmode, op1, offmode);
4810 /* Don't use offset_address here, we don't need a
4811 recognizable address, and we don't want to generate
4812 code. */
4813 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4814 op0, op1));
4817 if (MEM_P (op0))
4819 if (mode1 == VOIDmode)
4821 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4822 return NULL;
4823 /* Bitfield. */
4824 mode1 = smallest_int_mode_for_size (bitsize);
4826 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4827 if (maybe_ne (bytepos, 0))
4829 op0 = adjust_address_nv (op0, mode1, bytepos);
4830 bitpos = num_trailing_bits (bitpos);
4832 else if (known_eq (bitpos, 0)
4833 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4834 op0 = adjust_address_nv (op0, mode, 0);
4835 else if (GET_MODE (op0) != mode1)
4836 op0 = adjust_address_nv (op0, mode1, 0);
4837 else
4838 op0 = copy_rtx (op0);
4839 if (op0 == orig_op0)
4840 op0 = shallow_copy_rtx (op0);
4841 if (TREE_CODE (tem) != SSA_NAME)
4842 set_mem_attributes (op0, exp, 0);
4845 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4846 return op0;
4848 if (maybe_lt (bitpos, 0))
4849 return NULL;
4851 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4852 return NULL;
4854 poly_int64 bytepos;
4855 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4856 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4858 machine_mode opmode = GET_MODE (op0);
4860 if (opmode == VOIDmode)
4861 opmode = TYPE_MODE (TREE_TYPE (tem));
4863 /* This condition may hold if we're expanding the address
4864 right past the end of an array that turned out not to
4865 be addressable (i.e., the address was only computed in
4866 debug stmts). The gen_subreg below would rightfully
4867 crash, and the address doesn't really exist, so just
4868 drop it. */
4869 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4870 return NULL;
4872 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4873 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4876 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4877 && TYPE_UNSIGNED (TREE_TYPE (exp))
4878 ? SIGN_EXTRACT
4879 : ZERO_EXTRACT, mode,
4880 GET_MODE (op0) != VOIDmode
4881 ? GET_MODE (op0)
4882 : TYPE_MODE (TREE_TYPE (tem)),
4883 op0, gen_int_mode (bitsize, word_mode),
4884 gen_int_mode (bitpos, word_mode));
4887 case ABS_EXPR:
4888 case ABSU_EXPR:
4889 return simplify_gen_unary (ABS, mode, op0, mode);
4891 case NEGATE_EXPR:
4892 return simplify_gen_unary (NEG, mode, op0, mode);
4894 case BIT_NOT_EXPR:
4895 return simplify_gen_unary (NOT, mode, op0, mode);
4897 case FLOAT_EXPR:
4898 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4899 0)))
4900 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4901 inner_mode);
4903 case FIX_TRUNC_EXPR:
4904 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4905 inner_mode);
4907 case POINTER_PLUS_EXPR:
4908 /* For the rare target where pointers are not the same size as
4909 size_t, we need to check for mis-matched modes and correct
4910 the addend. */
4911 if (op0 && op1
4912 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4913 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4914 && op0_mode != op1_mode)
4916 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4917 /* If OP0 is a partial mode, then we must truncate, even
4918 if it has the same bitsize as OP1 as GCC's
4919 representation of partial modes is opaque. */
4920 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4921 && (GET_MODE_BITSIZE (op0_mode)
4922 == GET_MODE_BITSIZE (op1_mode))))
4923 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4924 else
4925 /* We always sign-extend, regardless of the signedness of
4926 the operand, because the operand is always unsigned
4927 here even if the original C expression is signed. */
4928 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4930 /* Fall through. */
4931 case PLUS_EXPR:
4932 return simplify_gen_binary (PLUS, mode, op0, op1);
4934 case MINUS_EXPR:
4935 case POINTER_DIFF_EXPR:
4936 return simplify_gen_binary (MINUS, mode, op0, op1);
4938 case MULT_EXPR:
4939 return simplify_gen_binary (MULT, mode, op0, op1);
4941 case RDIV_EXPR:
4942 case TRUNC_DIV_EXPR:
4943 case EXACT_DIV_EXPR:
4944 if (unsignedp)
4945 return simplify_gen_binary (UDIV, mode, op0, op1);
4946 else
4947 return simplify_gen_binary (DIV, mode, op0, op1);
4949 case TRUNC_MOD_EXPR:
4950 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4952 case FLOOR_DIV_EXPR:
4953 if (unsignedp)
4954 return simplify_gen_binary (UDIV, mode, op0, op1);
4955 else
4957 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4958 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4959 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4960 return simplify_gen_binary (PLUS, mode, div, adj);
4963 case FLOOR_MOD_EXPR:
4964 if (unsignedp)
4965 return simplify_gen_binary (UMOD, mode, op0, op1);
4966 else
4968 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4969 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4970 adj = simplify_gen_unary (NEG, mode,
4971 simplify_gen_binary (MULT, mode, adj, op1),
4972 mode);
4973 return simplify_gen_binary (PLUS, mode, mod, adj);
4976 case CEIL_DIV_EXPR:
4977 if (unsignedp)
4979 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4980 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4981 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4982 return simplify_gen_binary (PLUS, mode, div, adj);
4984 else
4986 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4987 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4988 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4989 return simplify_gen_binary (PLUS, mode, div, adj);
4992 case CEIL_MOD_EXPR:
4993 if (unsignedp)
4995 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4996 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4997 adj = simplify_gen_unary (NEG, mode,
4998 simplify_gen_binary (MULT, mode, adj, op1),
4999 mode);
5000 return simplify_gen_binary (PLUS, mode, mod, adj);
5002 else
5004 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5005 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
5006 adj = simplify_gen_unary (NEG, mode,
5007 simplify_gen_binary (MULT, mode, adj, op1),
5008 mode);
5009 return simplify_gen_binary (PLUS, mode, mod, adj);
5012 case ROUND_DIV_EXPR:
5013 if (unsignedp)
5015 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
5016 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5017 rtx adj = round_udiv_adjust (mode, mod, op1);
5018 return simplify_gen_binary (PLUS, mode, div, adj);
5020 else
5022 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
5023 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5024 rtx adj = round_sdiv_adjust (mode, mod, op1);
5025 return simplify_gen_binary (PLUS, mode, div, adj);
5028 case ROUND_MOD_EXPR:
5029 if (unsignedp)
5031 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5032 rtx adj = round_udiv_adjust (mode, mod, op1);
5033 adj = simplify_gen_unary (NEG, mode,
5034 simplify_gen_binary (MULT, mode, adj, op1),
5035 mode);
5036 return simplify_gen_binary (PLUS, mode, mod, adj);
5038 else
5040 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5041 rtx adj = round_sdiv_adjust (mode, mod, op1);
5042 adj = simplify_gen_unary (NEG, mode,
5043 simplify_gen_binary (MULT, mode, adj, op1),
5044 mode);
5045 return simplify_gen_binary (PLUS, mode, mod, adj);
5048 case LSHIFT_EXPR:
5049 return simplify_gen_binary (ASHIFT, mode, op0, op1);
5051 case RSHIFT_EXPR:
5052 if (unsignedp)
5053 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
5054 else
5055 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
5057 case LROTATE_EXPR:
5058 return simplify_gen_binary (ROTATE, mode, op0, op1);
5060 case RROTATE_EXPR:
5061 return simplify_gen_binary (ROTATERT, mode, op0, op1);
5063 case MIN_EXPR:
5064 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
5066 case MAX_EXPR:
5067 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
5069 case BIT_AND_EXPR:
5070 case TRUTH_AND_EXPR:
5071 return simplify_gen_binary (AND, mode, op0, op1);
5073 case BIT_IOR_EXPR:
5074 case TRUTH_OR_EXPR:
5075 return simplify_gen_binary (IOR, mode, op0, op1);
5077 case BIT_XOR_EXPR:
5078 case TRUTH_XOR_EXPR:
5079 return simplify_gen_binary (XOR, mode, op0, op1);
5081 case TRUTH_ANDIF_EXPR:
5082 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
5084 case TRUTH_ORIF_EXPR:
5085 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
5087 case TRUTH_NOT_EXPR:
5088 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
5090 case LT_EXPR:
5091 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
5092 op0, op1);
5094 case LE_EXPR:
5095 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
5096 op0, op1);
5098 case GT_EXPR:
5099 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
5100 op0, op1);
5102 case GE_EXPR:
5103 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
5104 op0, op1);
5106 case EQ_EXPR:
5107 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
5109 case NE_EXPR:
5110 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
5112 case UNORDERED_EXPR:
5113 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
5115 case ORDERED_EXPR:
5116 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
5118 case UNLT_EXPR:
5119 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
5121 case UNLE_EXPR:
5122 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
5124 case UNGT_EXPR:
5125 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
5127 case UNGE_EXPR:
5128 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
5130 case UNEQ_EXPR:
5131 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
5133 case LTGT_EXPR:
5134 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
5136 case COND_EXPR:
5137 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
5139 case COMPLEX_EXPR:
5140 gcc_assert (COMPLEX_MODE_P (mode));
5141 if (GET_MODE (op0) == VOIDmode)
5142 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
5143 if (GET_MODE (op1) == VOIDmode)
5144 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
5145 return gen_rtx_CONCAT (mode, op0, op1);
5147 case CONJ_EXPR:
5148 if (GET_CODE (op0) == CONCAT)
5149 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
5150 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
5151 XEXP (op0, 1),
5152 GET_MODE_INNER (mode)));
5153 else
5155 scalar_mode imode = GET_MODE_INNER (mode);
5156 rtx re, im;
5158 if (MEM_P (op0))
5160 re = adjust_address_nv (op0, imode, 0);
5161 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
5163 else
5165 scalar_int_mode ifmode;
5166 scalar_int_mode ihmode;
5167 rtx halfsize;
5168 if (!int_mode_for_mode (mode).exists (&ifmode)
5169 || !int_mode_for_mode (imode).exists (&ihmode))
5170 return NULL;
5171 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
5172 re = op0;
5173 if (mode != ifmode)
5174 re = gen_rtx_SUBREG (ifmode, re, 0);
5175 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
5176 if (imode != ihmode)
5177 re = gen_rtx_SUBREG (imode, re, 0);
5178 im = copy_rtx (op0);
5179 if (mode != ifmode)
5180 im = gen_rtx_SUBREG (ifmode, im, 0);
5181 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
5182 if (imode != ihmode)
5183 im = gen_rtx_SUBREG (imode, im, 0);
5185 im = gen_rtx_NEG (imode, im);
5186 return gen_rtx_CONCAT (mode, re, im);
5189 case ADDR_EXPR:
5190 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
5191 if (!op0 || !MEM_P (op0))
5193 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
5194 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
5195 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
5196 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
5197 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
5198 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
5200 if (handled_component_p (TREE_OPERAND (exp, 0)))
5202 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
5203 bool reverse;
5204 tree decl
5205 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
5206 &bitsize, &maxsize, &reverse);
5207 if ((VAR_P (decl)
5208 || TREE_CODE (decl) == PARM_DECL
5209 || TREE_CODE (decl) == RESULT_DECL)
5210 && (!TREE_ADDRESSABLE (decl)
5211 || target_for_debug_bind (decl))
5212 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
5213 && known_gt (bitsize, 0)
5214 && known_eq (bitsize, maxsize))
5216 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
5217 return plus_constant (mode, base, byteoffset);
5221 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
5222 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
5223 == ADDR_EXPR)
5225 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5226 0));
5227 if (op0 != NULL
5228 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
5229 || (GET_CODE (op0) == PLUS
5230 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
5231 && CONST_INT_P (XEXP (op0, 1)))))
5233 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5234 1));
5235 poly_int64 offset;
5236 if (!op1 || !poly_int_rtx_p (op1, &offset))
5237 return NULL;
5239 return plus_constant (mode, op0, offset);
5243 return NULL;
5246 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
5247 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
5248 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
5250 return op0;
5252 case VECTOR_CST:
5254 unsigned HOST_WIDE_INT i, nelts;
5256 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
5257 return NULL;
5259 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5261 for (i = 0; i < nelts; ++i)
5263 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5264 if (!op1)
5265 return NULL;
5266 XVECEXP (op0, 0, i) = op1;
5269 return op0;
5272 case CONSTRUCTOR:
5273 if (TREE_CLOBBER_P (exp))
5274 return NULL;
5275 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5277 unsigned i;
5278 unsigned HOST_WIDE_INT nelts;
5279 tree val;
5281 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5282 goto flag_unsupported;
5284 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5286 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5288 op1 = expand_debug_expr (val);
5289 if (!op1)
5290 return NULL;
5291 XVECEXP (op0, 0, i) = op1;
5294 if (i < nelts)
5296 op1 = expand_debug_expr
5297 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5299 if (!op1)
5300 return NULL;
5302 for (; i < nelts; i++)
5303 XVECEXP (op0, 0, i) = op1;
5306 return op0;
5308 else
5309 goto flag_unsupported;
5311 case CALL_EXPR:
5312 /* ??? Maybe handle some builtins? */
5313 return NULL;
5315 case SSA_NAME:
5317 gimple *g = get_gimple_for_ssa_name (exp);
5318 if (g)
5320 tree t = NULL_TREE;
5321 if (deep_ter_debug_map)
5323 tree *slot = deep_ter_debug_map->get (exp);
5324 if (slot)
5325 t = *slot;
5327 if (t == NULL_TREE)
5328 t = gimple_assign_rhs_to_tree (g);
5329 op0 = expand_debug_expr (t);
5330 if (!op0)
5331 return NULL;
5333 else
5335 /* If this is a reference to an incoming value of
5336 parameter that is never used in the code or where the
5337 incoming value is never used in the code, use
5338 PARM_DECL's DECL_RTL if set. */
5339 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5340 && SSA_NAME_VAR (exp)
5341 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5342 && has_zero_uses (exp))
5344 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5345 if (op0)
5346 goto adjust_mode;
5347 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5348 if (op0)
5349 goto adjust_mode;
5352 int part = var_to_partition (SA.map, exp);
5354 if (part == NO_PARTITION)
5355 return NULL;
5357 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5359 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5361 goto adjust_mode;
5364 case ERROR_MARK:
5365 return NULL;
5367 /* Vector stuff. For most of the codes we don't have rtl codes. */
5368 case REALIGN_LOAD_EXPR:
5369 case VEC_COND_EXPR:
5370 case VEC_PACK_FIX_TRUNC_EXPR:
5371 case VEC_PACK_FLOAT_EXPR:
5372 case VEC_PACK_SAT_EXPR:
5373 case VEC_PACK_TRUNC_EXPR:
5374 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5375 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5376 case VEC_UNPACK_FLOAT_HI_EXPR:
5377 case VEC_UNPACK_FLOAT_LO_EXPR:
5378 case VEC_UNPACK_HI_EXPR:
5379 case VEC_UNPACK_LO_EXPR:
5380 case VEC_WIDEN_MULT_HI_EXPR:
5381 case VEC_WIDEN_MULT_LO_EXPR:
5382 case VEC_WIDEN_MULT_EVEN_EXPR:
5383 case VEC_WIDEN_MULT_ODD_EXPR:
5384 case VEC_WIDEN_LSHIFT_HI_EXPR:
5385 case VEC_WIDEN_LSHIFT_LO_EXPR:
5386 case VEC_PERM_EXPR:
5387 case VEC_DUPLICATE_EXPR:
5388 case VEC_SERIES_EXPR:
5389 case SAD_EXPR:
5390 return NULL;
5392 /* Misc codes. */
5393 case ADDR_SPACE_CONVERT_EXPR:
5394 case FIXED_CONVERT_EXPR:
5395 case OBJ_TYPE_REF:
5396 case WITH_SIZE_EXPR:
5397 case BIT_INSERT_EXPR:
5398 return NULL;
5400 case DOT_PROD_EXPR:
5401 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5402 && SCALAR_INT_MODE_P (mode))
5405 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5406 0)))
5407 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5408 inner_mode);
5410 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5411 1)))
5412 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5413 inner_mode);
5414 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5415 return simplify_gen_binary (PLUS, mode, op0, op2);
5417 return NULL;
5419 case WIDEN_MULT_EXPR:
5420 case WIDEN_MULT_PLUS_EXPR:
5421 case WIDEN_MULT_MINUS_EXPR:
5422 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5423 && SCALAR_INT_MODE_P (mode))
5425 inner_mode = GET_MODE (op0);
5426 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5427 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5428 else
5429 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5430 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5431 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5432 else
5433 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5434 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5435 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5436 return op0;
5437 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5438 return simplify_gen_binary (PLUS, mode, op0, op2);
5439 else
5440 return simplify_gen_binary (MINUS, mode, op2, op0);
5442 return NULL;
5444 case MULT_HIGHPART_EXPR:
5445 /* ??? Similar to the above. */
5446 return NULL;
5448 case WIDEN_SUM_EXPR:
5449 case WIDEN_LSHIFT_EXPR:
5450 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5451 && SCALAR_INT_MODE_P (mode))
5454 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5455 0)))
5456 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5457 inner_mode);
5458 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5459 ? ASHIFT : PLUS, mode, op0, op1);
5461 return NULL;
5463 default:
5464 flag_unsupported:
5465 if (flag_checking)
5467 debug_tree (exp);
5468 gcc_unreachable ();
5470 return NULL;
5474 /* Return an RTX equivalent to the source bind value of the tree expression
5475 EXP. */
5477 static rtx
5478 expand_debug_source_expr (tree exp)
5480 rtx op0 = NULL_RTX;
5481 machine_mode mode = VOIDmode, inner_mode;
5483 switch (TREE_CODE (exp))
5485 case VAR_DECL:
5486 if (DECL_ABSTRACT_ORIGIN (exp))
5487 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5488 break;
5489 case PARM_DECL:
5491 mode = DECL_MODE (exp);
5492 op0 = expand_debug_parm_decl (exp);
5493 if (op0)
5494 break;
5495 /* See if this isn't an argument that has been completely
5496 optimized out. */
5497 if (!DECL_RTL_SET_P (exp)
5498 && !DECL_INCOMING_RTL (exp)
5499 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5501 tree aexp = DECL_ORIGIN (exp);
5502 if (DECL_CONTEXT (aexp)
5503 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5505 vec<tree, va_gc> **debug_args;
5506 unsigned int ix;
5507 tree ddecl;
5508 debug_args = decl_debug_args_lookup (current_function_decl);
5509 if (debug_args != NULL)
5511 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5512 ix += 2)
5513 if (ddecl == aexp)
5514 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5518 break;
5520 default:
5521 break;
5524 if (op0 == NULL_RTX)
5525 return NULL_RTX;
5527 inner_mode = GET_MODE (op0);
5528 if (mode == inner_mode)
5529 return op0;
5531 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5533 if (GET_MODE_UNIT_BITSIZE (mode)
5534 == GET_MODE_UNIT_BITSIZE (inner_mode))
5535 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5536 else if (GET_MODE_UNIT_BITSIZE (mode)
5537 < GET_MODE_UNIT_BITSIZE (inner_mode))
5538 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5539 else
5540 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5542 else if (FLOAT_MODE_P (mode))
5543 gcc_unreachable ();
5544 else if (FLOAT_MODE_P (inner_mode))
5546 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5547 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5548 else
5549 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5551 else if (GET_MODE_UNIT_PRECISION (mode)
5552 == GET_MODE_UNIT_PRECISION (inner_mode))
5553 op0 = lowpart_subreg (mode, op0, inner_mode);
5554 else if (GET_MODE_UNIT_PRECISION (mode)
5555 < GET_MODE_UNIT_PRECISION (inner_mode))
5556 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5557 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5558 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5559 else
5560 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5562 return op0;
5565 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5566 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5567 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5569 static void
5570 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5572 rtx exp = *exp_p;
5574 if (exp == NULL_RTX)
5575 return;
5577 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5578 return;
5580 if (depth == 4)
5582 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5583 rtx dval = make_debug_expr_from_rtl (exp);
5585 /* Emit a debug bind insn before INSN. */
5586 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5587 DEBUG_EXPR_TREE_DECL (dval), exp,
5588 VAR_INIT_STATUS_INITIALIZED);
5590 emit_debug_insn_before (bind, insn);
5591 *exp_p = dval;
5592 return;
5595 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5596 int i, j;
5597 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5598 switch (*format_ptr++)
5600 case 'e':
5601 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5602 break;
5604 case 'E':
5605 case 'V':
5606 for (j = 0; j < XVECLEN (exp, i); j++)
5607 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5608 break;
5610 default:
5611 break;
5615 /* Expand the _LOCs in debug insns. We run this after expanding all
5616 regular insns, so that any variables referenced in the function
5617 will have their DECL_RTLs set. */
5619 static void
5620 expand_debug_locations (void)
5622 rtx_insn *insn;
5623 rtx_insn *last = get_last_insn ();
5624 int save_strict_alias = flag_strict_aliasing;
5626 /* New alias sets while setting up memory attributes cause
5627 -fcompare-debug failures, even though it doesn't bring about any
5628 codegen changes. */
5629 flag_strict_aliasing = 0;
5631 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5632 if (DEBUG_BIND_INSN_P (insn))
5634 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5635 rtx val;
5636 rtx_insn *prev_insn, *insn2;
5637 machine_mode mode;
5639 if (value == NULL_TREE)
5640 val = NULL_RTX;
5641 else
5643 if (INSN_VAR_LOCATION_STATUS (insn)
5644 == VAR_INIT_STATUS_UNINITIALIZED)
5645 val = expand_debug_source_expr (value);
5646 /* The avoid_deep_ter_for_debug function inserts
5647 debug bind stmts after SSA_NAME definition, with the
5648 SSA_NAME as the whole bind location. Disable temporarily
5649 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5650 being defined in this DEBUG_INSN. */
5651 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5653 tree *slot = deep_ter_debug_map->get (value);
5654 if (slot)
5656 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5657 *slot = NULL_TREE;
5658 else
5659 slot = NULL;
5661 val = expand_debug_expr (value);
5662 if (slot)
5663 *slot = INSN_VAR_LOCATION_DECL (insn);
5665 else
5666 val = expand_debug_expr (value);
5667 gcc_assert (last == get_last_insn ());
5670 if (!val)
5671 val = gen_rtx_UNKNOWN_VAR_LOC ();
5672 else
5674 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5676 gcc_assert (mode == GET_MODE (val)
5677 || (GET_MODE (val) == VOIDmode
5678 && (CONST_SCALAR_INT_P (val)
5679 || GET_CODE (val) == CONST_FIXED
5680 || GET_CODE (val) == LABEL_REF)));
5683 INSN_VAR_LOCATION_LOC (insn) = val;
5684 prev_insn = PREV_INSN (insn);
5685 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5686 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5689 flag_strict_aliasing = save_strict_alias;
5692 /* Performs swapping operands of commutative operations to expand
5693 the expensive one first. */
5695 static void
5696 reorder_operands (basic_block bb)
5698 unsigned int *lattice; /* Hold cost of each statement. */
5699 unsigned int i = 0, n = 0;
5700 gimple_stmt_iterator gsi;
5701 gimple_seq stmts;
5702 gimple *stmt;
5703 bool swap;
5704 tree op0, op1;
5705 ssa_op_iter iter;
5706 use_operand_p use_p;
5707 gimple *def0, *def1;
5709 /* Compute cost of each statement using estimate_num_insns. */
5710 stmts = bb_seq (bb);
5711 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5713 stmt = gsi_stmt (gsi);
5714 if (!is_gimple_debug (stmt))
5715 gimple_set_uid (stmt, n++);
5717 lattice = XNEWVEC (unsigned int, n);
5718 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5720 unsigned cost;
5721 stmt = gsi_stmt (gsi);
5722 if (is_gimple_debug (stmt))
5723 continue;
5724 cost = estimate_num_insns (stmt, &eni_size_weights);
5725 lattice[i] = cost;
5726 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5728 tree use = USE_FROM_PTR (use_p);
5729 gimple *def_stmt;
5730 if (TREE_CODE (use) != SSA_NAME)
5731 continue;
5732 def_stmt = get_gimple_for_ssa_name (use);
5733 if (!def_stmt)
5734 continue;
5735 lattice[i] += lattice[gimple_uid (def_stmt)];
5737 i++;
5738 if (!is_gimple_assign (stmt)
5739 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5740 continue;
5741 op0 = gimple_op (stmt, 1);
5742 op1 = gimple_op (stmt, 2);
5743 if (TREE_CODE (op0) != SSA_NAME
5744 || TREE_CODE (op1) != SSA_NAME)
5745 continue;
5746 /* Swap operands if the second one is more expensive. */
5747 def0 = get_gimple_for_ssa_name (op0);
5748 def1 = get_gimple_for_ssa_name (op1);
5749 if (!def1)
5750 continue;
5751 swap = false;
5752 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5753 swap = true;
5754 if (swap)
5756 if (dump_file && (dump_flags & TDF_DETAILS))
5758 fprintf (dump_file, "Swap operands in stmt:\n");
5759 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5760 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5761 def0 ? lattice[gimple_uid (def0)] : 0,
5762 lattice[gimple_uid (def1)]);
5764 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5765 gimple_assign_rhs2_ptr (stmt));
5768 XDELETE (lattice);
5771 /* Expand basic block BB from GIMPLE trees to RTL.

   When optimizing, reorder_operands is run on BB first.  The GIMPLE
   statement sequence and the PHI nodes are then detached from BB and
   BB is flagged BB_RTL before any statement is expanded.

   If DISABLE_TAIL_CALLS is true, the tail-call flag is cleared on
   call statements before they are expanded.

   Returns BB, or the block handed back by expand_gimple_cond or
   expand_gimple_tailcall when one of them returns a new block.  */
5773 static basic_block
5774 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5776 gimple_stmt_iterator gsi;
5777 gimple_seq stmts;
5778 gimple *stmt = NULL;
5779 rtx_note *note = NULL;
5780 rtx_insn *last;
5781 edge e;
5782 edge_iterator ei;
5783 bool nondebug_stmt_seen = false;
5785 if (dump_file)
5786 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5787 bb->index);
5789 /* Note that since we are now transitioning from GIMPLE to RTL, we
5790 cannot use the gsi_*_bb() routines because they expect the basic
5791 block to be in GIMPLE, instead of RTL. Therefore, we need to
5792 access the BB sequence directly. */
5793 if (optimize)
5794 reorder_operands (bb);
5795 stmts = bb_seq (bb);
5796 bb->il.gimple.seq = NULL;
5797 bb->il.gimple.phi_nodes = NULL;
5798 rtl_profile_for_bb (bb);
5799 init_rtl_bb_info (bb);
5800 bb->flags |= BB_RTL;
5802 /* Remove the RETURN_EXPR if we may fall through to the exit
5803 instead. */
5804 gsi = gsi_last (stmts);
5805 if (!gsi_end_p (gsi)
5806 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5808 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5810 gcc_assert (single_succ_p (bb));
5811 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5813 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5814 && !gimple_return_retval (ret_stmt))
5816 gsi_remove (&gsi, false);
5817 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
/* If the first statement is a GIMPLE_LABEL, or a label rtx has already
   been recorded for BB in lab_rtx_for_bb, expand/emit the label first:
   the block must then start with a label, and the basic block note is
   placed right after it.  Otherwise the block starts with the note.  */
5821 gsi = gsi_start (stmts);
5822 if (!gsi_end_p (gsi))
5824 stmt = gsi_stmt (gsi);
5825 if (gimple_code (stmt) != GIMPLE_LABEL)
5826 stmt = NULL;
5829 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5831 if (stmt || elt)
5833 gcc_checking_assert (!note);
5834 last = get_last_insn ();
5836 if (stmt)
5838 expand_gimple_stmt (stmt);
5839 gsi_next (&gsi);
5842 if (elt)
5843 emit_label (*elt);
5845 BB_HEAD (bb) = NEXT_INSN (last);
5846 if (NOTE_P (BB_HEAD (bb)))
5847 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5848 gcc_assert (LABEL_P (BB_HEAD (bb)));
5849 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5851 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5853 else
5854 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5856 if (note)
5857 NOTE_BASIC_BLOCK (note) = bb;
5859 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5861 basic_block new_bb;
5863 stmt = gsi_stmt (gsi);
5864 if (!is_gimple_debug (stmt))
5865 nondebug_stmt_seen = true;
5867 /* If this statement is a non-debug one, and we generate debug
5868 insns, then this one might be the last real use of a TERed
5869 SSA_NAME, but where there are still some debug uses further
5870 down. Expanding the current SSA name in such further debug
5871 uses by their RHS might lead to wrong debug info, as coalescing
5872 might make the operands of such RHS be placed into the same
5873 pseudo as something else. Like so:
5874 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5875 use(a_1);
5876 a_2 = ...
5877 #DEBUG ... => a_1
5878 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5879 If we now would expand a_1 by its RHS (a_0 + 1) in the debug use,
5880 the write to a_2 would actually have clobbered the place which
5881 formerly held a_0.
5883 So, instead of that, we recognize the situation, and generate
5884 debug temporaries at the last real use of TERed SSA names:
5885 a_1 = a_0 + 1;
5886 #DEBUG #D1 => a_1
5887 use(a_1);
5888 a_2 = ...
5889 #DEBUG ... => #D1
5891 if (MAY_HAVE_DEBUG_BIND_INSNS
5892 && SA.values
5893 && !is_gimple_debug (stmt))
5895 ssa_op_iter iter;
5896 tree op;
5897 gimple *def;
5899 location_t sloc = curr_insn_location ();
5901 /* Look for SSA names that have their last use here (TERed
5902 names always have only one real use). */
5903 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5904 if ((def = get_gimple_for_ssa_name (op)))
5906 imm_use_iterator imm_iter;
5907 use_operand_p use_p;
5908 bool have_debug_uses = false;
5910 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5912 if (gimple_debug_bind_p (USE_STMT (use_p)))
5914 have_debug_uses = true;
5915 break;
5919 if (have_debug_uses)
5921 /* OP is a TERed SSA name, with DEF its defining
5922 statement, and where OP is used in further debug
5923 instructions. Generate a debug temporary, and
5924 replace all uses of OP in debug insns with that
5925 temporary. */
5926 gimple *debugstmt;
5927 tree value = gimple_assign_rhs_to_tree (def);
5928 tree vexpr = build_debug_expr_decl (TREE_TYPE (value));
5929 rtx val;
5930 machine_mode mode;
5932 set_curr_insn_location (gimple_location (def));
5934 if (DECL_P (value))
5935 mode = DECL_MODE (value);
5936 else
5937 mode = TYPE_MODE (TREE_TYPE (value));
5938 /* FIXME: Is setting the mode really necessary? */
5939 SET_DECL_MODE (vexpr, mode);
5941 val = gen_rtx_VAR_LOCATION
5942 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5944 emit_debug_insn (val);
5946 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5948 if (!gimple_debug_bind_p (debugstmt))
5949 continue;
5951 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5952 SET_USE (use_p, vexpr);
5954 update_stmt (debugstmt);
5958 set_curr_insn_location (sloc);
5961 currently_expanding_gimple_stmt = stmt;
5963 /* Expand this statement, then evaluate the resulting RTL and
5964 fixup the CFG accordingly. */
5965 if (gimple_code (stmt) == GIMPLE_COND)
5967 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5968 if (new_bb)
5970 currently_expanding_gimple_stmt = NULL;
5971 return new_bb;
5974 else if (is_gimple_debug (stmt))
5976 location_t sloc = curr_insn_location ();
5977 gimple_stmt_iterator nsi = gsi;
/* Handle STMT and every debug stmt that immediately follows it.  NSI
   runs one step ahead of GSI; the loop stops at the first non-debug
   stmt or at the end of the sequence, leaving GSI on the last debug
   stmt that was handled.  */
5979 for (;;)
5981 tree var;
5982 tree value = NULL_TREE;
5983 rtx val = NULL_RTX;
5984 machine_mode mode;
5986 if (!gimple_debug_nonbind_marker_p (stmt))
5988 if (gimple_debug_bind_p (stmt))
5990 var = gimple_debug_bind_get_var (stmt);
5992 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5993 && TREE_CODE (var) != LABEL_DECL
5994 && !target_for_debug_bind (var))
5995 goto delink_debug_stmt;
5997 if (DECL_P (var) && !VECTOR_TYPE_P (TREE_TYPE (var)))
5998 mode = DECL_MODE (var);
5999 else
6000 mode = TYPE_MODE (TREE_TYPE (var));
6002 if (gimple_debug_bind_has_value_p (stmt))
6003 value = gimple_debug_bind_get_value (stmt);
6005 val = gen_rtx_VAR_LOCATION
6006 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
6008 else if (gimple_debug_source_bind_p (stmt))
6010 var = gimple_debug_source_bind_get_var (stmt);
6012 value = gimple_debug_source_bind_get_value (stmt);
6014 if (!VECTOR_TYPE_P (TREE_TYPE (var)))
6015 mode = DECL_MODE (var);
6016 else
6017 mode = TYPE_MODE (TREE_TYPE (var));
6019 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
6020 VAR_INIT_STATUS_UNINITIALIZED);
6022 else
6023 gcc_unreachable ();
6025 /* If this function was first compiled with markers
6026 enabled, but they're now disabled (e.g. LTO), drop
6027 them on the floor. */
6028 else if (gimple_debug_nonbind_marker_p (stmt)
6029 && !MAY_HAVE_DEBUG_MARKER_INSNS)
6030 goto delink_debug_stmt;
6031 else if (gimple_debug_begin_stmt_p (stmt))
6032 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
6033 else if (gimple_debug_inline_entry_p (stmt))
6034 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
6035 else
6036 gcc_unreachable ();
6038 last = get_last_insn ();
6040 set_curr_insn_location (gimple_location (stmt));
6042 emit_debug_insn (val);
6044 if (dump_file && (dump_flags & TDF_DETAILS))
6046 /* We can't dump the insn with a TREE where an RTX
6047 is expected. */
6048 if (GET_CODE (val) == VAR_LOCATION)
6050 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
6051 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
6053 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6054 if (GET_CODE (val) == VAR_LOCATION)
6055 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
6058 delink_debug_stmt:
6059 /* In order not to generate too many debug temporaries,
6060 we delink all uses of debug statements we already expanded.
6061 Therefore debug statements between definition and real
6062 use of TERed SSA names will continue to use the SSA name,
6063 and not be replaced with debug temps. */
6064 delink_stmt_imm_use (stmt);
6066 gsi = nsi;
6067 gsi_next (&nsi);
6068 if (gsi_end_p (nsi))
6069 break;
6070 stmt = gsi_stmt (nsi);
6071 if (!is_gimple_debug (stmt))
6072 break;
6075 set_curr_insn_location (sloc);
6077 else
/* Honor DISABLE_TAIL_CALLS by clearing the tail-call flag, so that the
   call is expanded through expand_gimple_stmt below rather than
   through expand_gimple_tailcall.  */
6079 gcall *call_stmt = dyn_cast <gcall *> (stmt);
6080 if (call_stmt
6081 && gimple_call_tail_p (call_stmt)
6082 && disable_tail_calls)
6083 gimple_call_set_tail (call_stmt, false);
6085 if (call_stmt && gimple_call_tail_p (call_stmt))
6087 bool can_fallthru;
6088 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
6089 if (new_bb)
6091 if (can_fallthru)
6092 bb = new_bb;
6093 else
6095 currently_expanding_gimple_stmt = NULL;
6096 return new_bb;
6100 else
6102 def_operand_p def_p;
6103 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
6105 if (def_p != NULL)
6107 /* Ignore this stmt if it is in the list of
6108 replaceable expressions. */
6109 if (SA.values
6110 && bitmap_bit_p (SA.values,
6111 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
6112 continue;
6114 last = expand_gimple_stmt (stmt);
6115 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6120 currently_expanding_gimple_stmt = NULL;
6122 /* Expand implicit goto and convert goto_locus. */
6123 FOR_EACH_EDGE (e, ei, bb->succs)
6125 if (e->goto_locus != UNKNOWN_LOCATION || !nondebug_stmt_seen)
6126 set_curr_insn_location (e->goto_locus);
6127 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
6129 emit_jump (label_rtx_for_bb (e->dest));
6130 e->flags &= ~EDGE_FALLTHRU;
6134 /* Expanded RTL can create a jump in the last instruction of block.
6135 This later might be assumed to be a jump to successor and break edge insertion.
6136 We need to insert dummy move to prevent this. PR41440. */
6137 if (single_succ_p (bb)
6138 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
6139 && (last = get_last_insn ())
6140 && (JUMP_P (last)
6141 || (DEBUG_INSN_P (last)
6142 && JUMP_P (prev_nondebug_insn (last)))))
6144 rtx dummy = gen_reg_rtx (SImode);
6145 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
6148 do_pending_stack_adjust ();
6150 /* Find the block tail. The last insn in the block is the insn
6151 before a barrier and/or table jump insn. */
6152 last = get_last_insn ();
6153 if (BARRIER_P (last))
6154 last = PREV_INSN (last);
6155 if (JUMP_TABLE_DATA_P (last))
6156 last = PREV_INSN (PREV_INSN (last));
6157 if (BARRIER_P (last))
6158 last = PREV_INSN (last);
6159 BB_END (bb) = last;
6161 update_bb_for_insn (bb);
6163 return bb;
6167 /* Create a basic block for initialization code. */
6169 static basic_block
6170 construct_init_block (void)
6172 basic_block init_block, first_block;
6173 edge e = NULL;
6174 int flags;
6176 /* Multiple entry points not supported yet. */
6177 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
6178 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
6179 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
6180 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6181 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6183 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
6185 /* When entry edge points to first basic block, we don't need jump,
6186 otherwise we have to jump into proper target. */
6187 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
6189 tree label = gimple_block_label (e->dest);
6191 emit_jump (jump_target_rtx (label));
6192 flags = 0;
6194 else
6195 flags = EDGE_FALLTHRU;
6197 init_block = create_basic_block (NEXT_INSN (get_insns ()),
6198 get_last_insn (),
6199 ENTRY_BLOCK_PTR_FOR_FN (cfun));
6200 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
6201 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6202 if (e)
6204 first_block = e->dest;
6205 redirect_edge_succ (e, init_block);
6206 make_single_succ_edge (init_block, first_block, flags);
6208 else
6209 make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6210 EDGE_FALLTHRU);
6212 update_bb_for_insn (init_block);
6213 return init_block;
6216 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
6217 found in the block tree. */
6219 static void
6220 set_block_levels (tree block, int level)
6222 while (block)
6224 BLOCK_NUMBER (block) = level;
6225 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
6226 block = BLOCK_CHAIN (block);
6230 /* Create a block containing landing pads and similar stuff. */
6232 static void
6233 construct_exit_block (void)
6235 rtx_insn *head = get_last_insn ();
6236 rtx_insn *end;
6237 basic_block exit_block;
6238 edge e, e2;
6239 unsigned ix;
6240 edge_iterator ei;
6241 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
6242 rtx_insn *orig_end = BB_END (prev_bb);
6244 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
6246 /* Make sure the locus is set to the end of the function, so that
6247 epilogue line numbers and warnings are set properly. */
6248 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
6249 input_location = cfun->function_end_locus;
6251 /* Generate rtl for function exit. */
6252 expand_function_end ();
6254 end = get_last_insn ();
6255 if (head == end)
6256 return;
6257 /* While emitting the function end we could move end of the last basic
6258 block. */
6259 BB_END (prev_bb) = orig_end;
6260 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
6261 head = NEXT_INSN (head);
6262 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
6263 bb count counting will be confused. Any instructions before that
6264 label are emitted for the case where PREV_BB falls through into the
6265 exit block, so append those instructions to prev_bb in that case. */
6266 if (NEXT_INSN (head) != return_label)
6268 while (NEXT_INSN (head) != return_label)
6270 if (!NOTE_P (NEXT_INSN (head)))
6271 BB_END (prev_bb) = NEXT_INSN (head);
6272 head = NEXT_INSN (head);
6275 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6276 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6277 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6279 ix = 0;
6280 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6282 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6283 if (!(e->flags & EDGE_ABNORMAL))
6284 redirect_edge_succ (e, exit_block);
6285 else
6286 ix++;
6289 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6290 EDGE_FALLTHRU);
6291 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6292 if (e2 != e)
6294 exit_block->count -= e2->count ();
6296 update_bb_for_insn (exit_block);
6299 /* Helper function for discover_nonconstant_array_refs.
6300 Look for ARRAY_REF nodes with non-constant indexes and mark them
6301 addressable. */
6303 static tree
6304 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6305 void *data)
6307 tree t = *tp;
6308 bitmap forced_stack_vars = (bitmap)((walk_stmt_info *)data)->info;
6310 if (IS_TYPE_OR_DECL_P (t))
6311 *walk_subtrees = 0;
6312 else if (REFERENCE_CLASS_P (t) && TREE_THIS_VOLATILE (t))
6314 t = get_base_address (t);
6315 if (t && DECL_P (t)
6316 && DECL_MODE (t) != BLKmode
6317 && !TREE_ADDRESSABLE (t))
6318 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6319 *walk_subtrees = 0;
6321 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6323 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6324 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6325 && (!TREE_OPERAND (t, 2)
6326 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6327 || (TREE_CODE (t) == COMPONENT_REF
6328 && (!TREE_OPERAND (t,2)
6329 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6330 || TREE_CODE (t) == BIT_FIELD_REF
6331 || TREE_CODE (t) == REALPART_EXPR
6332 || TREE_CODE (t) == IMAGPART_EXPR
6333 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6334 || CONVERT_EXPR_P (t))
6335 t = TREE_OPERAND (t, 0);
6337 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6339 t = get_base_address (t);
6340 if (t && DECL_P (t)
6341 && DECL_MODE (t) != BLKmode
6342 && !TREE_ADDRESSABLE (t))
6343 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6346 *walk_subtrees = 0;
6348 /* References of size POLY_INT_CST to a fixed-size object must go
6349 through memory. It's more efficient to force that here than
6350 to create temporary slots on the fly.
6351 RTL expansion expectes TARGET_MEM_REF to always address actual memory. */
6352 else if (TREE_CODE (t) == TARGET_MEM_REF
6353 || (TREE_CODE (t) == MEM_REF
6354 && TYPE_SIZE (TREE_TYPE (t))
6355 && POLY_INT_CST_P (TYPE_SIZE (TREE_TYPE (t)))))
6357 tree base = get_base_address (t);
6358 if (base
6359 && DECL_P (base)
6360 && !TREE_ADDRESSABLE (base)
6361 && DECL_MODE (base) != BLKmode
6362 && GET_MODE_SIZE (DECL_MODE (base)).is_constant ())
6363 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6364 *walk_subtrees = 0;
6367 return NULL_TREE;
6370 /* If there's a chance to get a pseudo for t then if it would be of float mode
6371 and the actual access is via an integer mode (lowered memcpy or similar
6372 access) then avoid the register expansion if the mode likely is not storage
6373 suitable for raw bits processing (like XFmode on i?86). */
6375 static void
6376 avoid_type_punning_on_regs (tree t, bitmap forced_stack_vars)
6378 machine_mode access_mode = TYPE_MODE (TREE_TYPE (t));
6379 if (access_mode != BLKmode
6380 && !SCALAR_INT_MODE_P (access_mode))
6381 return;
6382 tree base = get_base_address (t);
6383 if (DECL_P (base)
6384 && !TREE_ADDRESSABLE (base)
6385 && FLOAT_MODE_P (DECL_MODE (base))
6386 && maybe_lt (GET_MODE_PRECISION (DECL_MODE (base)),
6387 GET_MODE_BITSIZE (GET_MODE_INNER (DECL_MODE (base))))
6388 /* Double check in the expensive way we really would get a pseudo. */
6389 && use_register_for_decl (base))
6390 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6393 /* RTL expansion is not able to compile array references with variable
6394 offsets for arrays stored in single register. Discover such
6395 expressions and mark variables as addressable to avoid this
6396 scenario. */
6398 static void
6399 discover_nonconstant_array_refs (bitmap forced_stack_vars)
6401 basic_block bb;
6402 gimple_stmt_iterator gsi;
6404 walk_stmt_info wi = {};
6405 wi.info = forced_stack_vars;
6406 FOR_EACH_BB_FN (bb, cfun)
6407 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6409 gimple *stmt = gsi_stmt (gsi);
6410 if (!is_gimple_debug (stmt))
6412 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, &wi);
6413 gcall *call = dyn_cast <gcall *> (stmt);
6414 if (call && gimple_call_internal_p (call))
6416 tree cand = NULL_TREE;
6417 switch (gimple_call_internal_fn (call))
6419 case IFN_LOAD_LANES:
6420 /* The source must be a MEM. */
6421 cand = gimple_call_arg (call, 0);
6422 break;
6423 case IFN_STORE_LANES:
6424 /* The destination must be a MEM. */
6425 cand = gimple_call_lhs (call);
6426 break;
6427 default:
6428 break;
6430 if (cand)
6431 cand = get_base_address (cand);
6432 if (cand
6433 && DECL_P (cand)
6434 && use_register_for_decl (cand))
6435 bitmap_set_bit (forced_stack_vars, DECL_UID (cand));
6437 if (gimple_vdef (stmt))
6439 tree t = gimple_get_lhs (stmt);
6440 if (t && REFERENCE_CLASS_P (t))
6441 avoid_type_punning_on_regs (t, forced_stack_vars);
6447 /* This function sets crtl->args.internal_arg_pointer to a virtual
6448 register if DRAP is needed. Local register allocator will replace
6449 virtual_incoming_args_rtx with the virtual register.

Before doing so it finalizes the stack alignment fields of crtl
(stack_alignment_estimated, stack_alignment_needed,
stack_realign_needed, stack_realign_tried, stack_realign_processed).
Nothing is done when SUPPORTS_STACK_ALIGNMENT is false. */
6451 static void
6452 expand_stack_alignment (void)
6454 rtx drap_rtx;
6455 unsigned int preferred_stack_boundary;
6457 if (! SUPPORTS_STACK_ALIGNMENT)
6458 return;
/* alloca, nonlocal labels and nonlocal gotos each force the use of a
DRAP. */
6460 if (cfun->calls_alloca
6461 || cfun->has_nonlocal_label
6462 || crtl->has_nonlocal_goto)
6463 crtl->need_drap = true;
6465 /* Call update_stack_boundary here again to update incoming stack
6466 boundary. It may set incoming stack alignment to a different
6467 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6468 use the minimum incoming stack alignment to check if it is OK
6469 to perform sibcall optimization since sibcall optimization will
6470 only align the outgoing stack to incoming stack boundary. */
6471 if (targetm.calls.update_stack_boundary)
6472 targetm.calls.update_stack_boundary ();
6474 /* The incoming stack frame has to be aligned at least at
6475 parm_stack_boundary. */
6476 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6478 /* Update crtl->stack_alignment_estimated and use it later to align
6479 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6480 exceptions since callgraph doesn't collect incoming stack alignment
6481 in this case. */
6482 if (cfun->can_throw_non_call_exceptions
6483 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6484 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6485 else
6486 preferred_stack_boundary = crtl->preferred_stack_boundary;
/* Raise both the estimated and the needed alignment to at least the
boundary chosen above; neither is ever lowered here. */
6487 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6488 crtl->stack_alignment_estimated = preferred_stack_boundary;
6489 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6490 crtl->stack_alignment_needed = preferred_stack_boundary;
6492 gcc_assert (crtl->stack_alignment_needed
6493 <= crtl->stack_alignment_estimated);
/* Realignment is needed exactly when the incoming boundary is smaller
than the estimated alignment. */
6495 crtl->stack_realign_needed
6496 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6497 crtl->stack_realign_tried = crtl->stack_realign_needed;
6499 crtl->stack_realign_processed = true;
6501 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6502 alignment. */
6503 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6504 drap_rtx = targetm.calls.get_drap_rtx ();
6506 /* stack_realign_drap and drap_rtx must match. */
6507 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6509 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6510 if (drap_rtx != NULL)
6512 crtl->args.internal_arg_pointer = drap_rtx;
6514 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6515 needed. */
6516 fixup_tail_calls ();
/* Emit a normal library call (LCT_NORMAL, VOIDmode result) to the
function named by NAME__MAIN. The call is compiled in only when
INVOKE__main is defined, or when none of HAS_INIT_SECTION,
INIT_SECTION_ASM_OP and INIT_ARRAY_SECTION_ASM_OP is defined;
otherwise this function emits nothing. */
6521 static void
6522 expand_main_function (void)
6524 #if (defined(INVOKE__main) \
6525 || (!defined(HAS_INIT_SECTION) \
6526 && !defined(INIT_SECTION_ASM_OP) \
6527 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6528 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6529 #endif
6533 /* Expand code to initialize the stack_protect_guard. This is invoked at
6534 the beginning of a function to be protected.

X is the expansion of crtl->stack_protect_guard and is the destination
of the copy; Y is the source, derived from the decl returned by
targetm.stack_protect_guard (or const0_rtx when there is no such
decl). Three ways of emitting the copy are tried in order: the
target's combined address+copy pattern, the target's stack_protect_set
pattern, and finally a plain move. The guard decl is also stored in
crtl->stack_protect_guard_decl. */
6536 static void
6537 stack_protect_prologue (void)
6539 tree guard_decl = targetm.stack_protect_guard ();
6540 rtx x, y;
6542 crtl->stack_protect_guard_decl = guard_decl;
6543 x = expand_normal (crtl->stack_protect_guard);
6545 if (targetm.have_stack_protect_combined_set () && guard_decl)
6547 gcc_assert (DECL_P (guard_decl));
6548 y = DECL_RTL (guard_decl);
6550 /* Allow the target to compute address of Y and copy it to X without
6551 leaking Y into a register. This combined address + copy pattern
6552 allows the target to prevent spilling of any intermediate results by
6553 splitting it after register allocator. */
6554 if (rtx_insn *insn = targetm.gen_stack_protect_combined_set (x, y))
6556 emit_insn (insn);
6557 return;
/* No combined pattern was emitted: compute Y as an ordinary expansion
of the guard decl, or as zero when the target supplies no decl. */
6561 if (guard_decl)
6562 y = expand_normal (guard_decl);
6563 else
6564 y = const0_rtx;
6566 /* Allow the target to copy from Y to X without leaking Y into a
6567 register. */
6568 if (targetm.have_stack_protect_set ())
6569 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6571 emit_insn (insn);
6572 return;
6575 /* Otherwise do a straight move. */
6576 emit_move_insn (x, y);
6579 /* Translate the intermediate representation contained in the CFG
6580 from GIMPLE trees to RTL.
6582 We do conversion per basic block and preserve/update the tree CFG.
6583 This implies we have to do some magic as the CFG can simultaneously
6584 consist of basic blocks containing RTL and GIMPLE trees. This can
6585 confuse the CFG hooks, so be careful to not manipulate CFG during
6586 the expansion. */
6588 namespace {
/* Static descriptor of the "expand" pass; it is handed to the
rtl_opt_pass constructor by pass_expand. The trailing comment on each
initializer names the pass_data field it fills. */
6590 const pass_data pass_data_expand =
6592 RTL_PASS, /* type */
6593 "expand", /* name */
6594 OPTGROUP_NONE, /* optinfo_flags */
6595 TV_EXPAND, /* tv_id */
6596 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6597 | PROP_gimple_lcx
6598 | PROP_gimple_lvec
6599 | PROP_gimple_lva), /* properties_required */
6600 PROP_rtl, /* properties_provided */
6601 ( PROP_ssa | PROP_gimple ), /* properties_destroyed */
6602 0, /* todo_flags_start */
6603 0, /* todo_flags_finish */
/* The expand pass object: an rtl_opt_pass constructed from
pass_data_expand and the given context. Its only overridden method is
execute, which is declared here and defined out of line. */
6606 class pass_expand : public rtl_opt_pass
6608 public:
6609 pass_expand (gcc::context *ctxt)
6610 : rtl_opt_pass (pass_data_expand, ctxt)
6613 /* opt_pass methods: */
6614 unsigned int execute (function *) final override;
6616 }; // class pass_expand
/* Expand function FUN from GIMPLE to RTL. In the order visible below:
go out of SSA (rewrite_out_of_ssa), collect the variables flagged by
discover_nonconstant_array_refs, expand the used variables, set up the
parameters (expand_function_start), propagate partition RTL to the
SSA names' variables, expand each basic block with
expand_gimple_basic_block, build the exit block, clean up edges,
rediscover sub-basic-blocks, finish EH generation, compute stack
alignment, record the patchable-function-entry area in crtl, clean up
the CFG and unshare the RTL. Always returns 0.
NOTE(review): the body uses both FUN and cfun/current_function_decl;
presumably they denote the same function -- confirm. */
6618 unsigned int
6619 pass_expand::execute (function *fun)
6621 basic_block bb, init_block;
6622 edge_iterator ei;
6623 edge e;
6624 rtx_insn *var_seq, *var_ret_seq;
6625 unsigned i;
6627 timevar_push (TV_OUT_OF_SSA);
6628 rewrite_out_of_ssa (&SA);
6629 timevar_pop (TV_OUT_OF_SSA);
6630 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6632 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6634 gimple_stmt_iterator gsi;
6635 FOR_EACH_BB_FN (bb, cfun)
6636 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6637 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6638 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6641 /* Collect in FORCED_STACK_VARS the variables flagged by discover_nonconstant_array_refs (e.g. arrays indexed with non-constant indices). */
6642 auto_bitmap forced_stack_vars;
6643 discover_nonconstant_array_refs (forced_stack_vars);
6645 /* Make sure all values used by the optimization passes have sane
6646 defaults. */
6647 reg_renumber = 0;
6649 /* Some backends want to know that we are expanding to RTL. */
6650 currently_expanding_to_rtl = 1;
6651 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6652 free_dominance_info (CDI_DOMINATORS);
6654 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6656 insn_locations_init ();
6657 if (!DECL_IS_UNDECLARED_BUILTIN (current_function_decl))
6659 /* Eventually, all FEs should explicitly set function_start_locus. */
6660 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6661 set_curr_insn_location
6662 (DECL_SOURCE_LOCATION (current_function_decl));
6663 else
6664 set_curr_insn_location (fun->function_start_locus);
6666 else
6667 set_curr_insn_location (UNKNOWN_LOCATION);
6668 prologue_location = curr_insn_location ();
6670 #ifdef INSN_SCHEDULING
6671 init_sched_attrs ();
6672 #endif
6674 /* Make sure first insn is a note even if we don't want linenums.
6675 This makes sure the first insn will never be deleted.
6676 Also, final expects a note to appear there. */
6677 emit_note (NOTE_INSN_DELETED);
6679 targetm.expand_to_rtl_hook ();
6680 crtl->init_stack_alignment ();
6681 fun->cfg->max_jumptable_ents = 0;
6683 /* Resolve the function section. Some targets, like ARM EABI rely on knowledge
6684 of the function section at expansion time to predict distance of calls. */
6685 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6687 /* Expand the variables recorded during gimple lowering. */
6688 timevar_push (TV_VAR_EXPAND);
6689 start_sequence ();
6691 var_ret_seq = expand_used_vars (forced_stack_vars);
6693 var_seq = get_insns ();
6694 end_sequence ();
6695 timevar_pop (TV_VAR_EXPAND);
6697 /* Honor stack protection warnings. */
6698 if (warn_stack_protect)
6700 if (fun->calls_alloca)
6701 warning (OPT_Wstack_protector,
6702 "stack protector not protecting local variables: "
6703 "variable length buffer");
6704 if (has_short_buffer && !crtl->stack_protect_guard)
6705 warning (OPT_Wstack_protector,
6706 "stack protector not protecting function: "
6707 "all local arrays are less than %d bytes long",
6708 (int) param_ssp_buffer_size);
6711 /* Temporarily mark PARM_DECLs and RESULT_DECLs we need to expand to
6712 memory addressable so expand_function_start can emit the required
6713 copies. */
6714 auto_vec<tree, 16> marked_parms;
6715 for (tree parm = DECL_ARGUMENTS (current_function_decl); parm;
6716 parm = DECL_CHAIN (parm))
6717 if (!TREE_ADDRESSABLE (parm)
6718 && bitmap_bit_p (forced_stack_vars, DECL_UID (parm)))
6720 TREE_ADDRESSABLE (parm) = 1;
6721 marked_parms.safe_push (parm);
6723 if (DECL_RESULT (current_function_decl)
6724 && !TREE_ADDRESSABLE (DECL_RESULT (current_function_decl))
6725 && bitmap_bit_p (forced_stack_vars,
6726 DECL_UID (DECL_RESULT (current_function_decl))))
6728 TREE_ADDRESSABLE (DECL_RESULT (current_function_decl)) = 1;
6729 marked_parms.safe_push (DECL_RESULT (current_function_decl));
6732 /* Set up parameters and prepare for return, for the function. */
6733 expand_function_start (current_function_decl);
6735 /* Clear TREE_ADDRESSABLE again. */
6736 while (!marked_parms.is_empty ())
6737 TREE_ADDRESSABLE (marked_parms.pop ()) = 0;
6739 /* If we emitted any instructions for setting up the variables,
6740 emit them before the FUNCTION_START note. */
6741 if (var_seq)
6743 emit_insn_before (var_seq, parm_birth_insn);
6745 /* In expand_function_end we'll insert the alloca save/restore
6746 before parm_birth_insn. We've just inserted an alloca call.
6747 Adjust the pointer to match. */
6748 parm_birth_insn = var_seq;
6751 /* Now propagate the RTL assignment of each partition to the
6752 underlying var of each SSA_NAME. */
6753 tree name;
6755 FOR_EACH_SSA_NAME (i, name, cfun)
6757 /* We might have generated new SSA names in
6758 update_alias_info_with_stack_vars. They will have a NULL
6759 defining statements, and won't be part of the partitioning,
6760 so ignore those. */
6761 if (!SSA_NAME_DEF_STMT (name))
6762 continue;
6764 adjust_one_expanded_partition_var (name);
6767 /* Clean up RTL of variables that straddle across multiple
6768 partitions, and check that the rtl of any PARM_DECLs that are not
6769 cleaned up is that of their default defs. */
6770 FOR_EACH_SSA_NAME (i, name, cfun)
6772 int part;
6774 /* We might have generated new SSA names in
6775 update_alias_info_with_stack_vars. They will have a NULL
6776 defining statements, and won't be part of the partitioning,
6777 so ignore those. */
6778 if (!SSA_NAME_DEF_STMT (name))
6779 continue;
6780 part = var_to_partition (SA.map, name);
6781 if (part == NO_PARTITION)
6782 continue;
6784 /* If this decl was marked as living in multiple places, reset
6785 this now to NULL. */
6786 tree var = SSA_NAME_VAR (name);
6787 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6788 SET_DECL_RTL (var, NULL);
6789 /* Check that the pseudos chosen by assign_parms are those of
6790 the corresponding default defs. */
6791 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6792 && (TREE_CODE (var) == PARM_DECL
6793 || TREE_CODE (var) == RESULT_DECL))
6795 rtx in = DECL_RTL_IF_SET (var);
6796 gcc_assert (in);
6797 rtx out = SA.partition_to_pseudo[part];
6798 gcc_assert (in == out);
6800 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6801 those expected by debug backends for each parm and for
6802 the result. This is particularly important for stabs,
6803 whose register elimination from parm's DECL_RTL may cause
6804 -fcompare-debug differences as SET_DECL_RTL changes reg's
6805 attrs. So, make sure the RTL already has the parm as the
6806 EXPR, so that it won't change. */
6807 SET_DECL_RTL (var, NULL_RTX);
6808 if (MEM_P (in))
6809 set_mem_attributes (in, var, true);
6810 SET_DECL_RTL (var, in);
6814 /* If this function is `main', emit a call to `__main'
6815 to run global initializers, etc. */
6816 if (DECL_NAME (current_function_decl)
6817 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6818 && DECL_FILE_SCOPE_P (current_function_decl))
6819 expand_main_function ();
6821 /* Initialize the stack_protect_guard field. This must happen after the
6822 call to __main (if any) so that the external decl is initialized. */
6823 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6824 stack_protect_prologue ();
6826 expand_phi_nodes (&SA);
6828 /* Release any stale SSA redirection data. */
6829 redirect_edge_var_map_empty ();
6831 /* Register rtl specific functions for cfg. */
6832 rtl_register_cfg_hooks ();
6834 init_block = construct_init_block ();
6836 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6837 remaining edges later. */
6838 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6839 e->flags &= ~EDGE_EXECUTABLE;
6841 /* If the function has too many markers, drop them while expanding. */
6842 if (cfun->debug_marker_count
6843 >= param_max_debug_marker_count)
6844 cfun->debug_nonbind_markers = false;
/* Expand every block after INIT_BLOCK up to the exit block. The loop
variable is reassigned from the return value of
expand_gimple_basic_block, so iteration continues from the block it
returns. */
6846 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6847 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6848 next_bb)
6849 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6851 if (MAY_HAVE_DEBUG_BIND_INSNS)
6852 expand_debug_locations ();
6854 if (deep_ter_debug_map)
6856 delete deep_ter_debug_map;
6857 deep_ter_debug_map = NULL;
6860 /* Free stuff we no longer need after GIMPLE optimizations. */
6861 free_dominance_info (CDI_DOMINATORS);
6862 free_dominance_info (CDI_POST_DOMINATORS);
6863 delete_tree_cfg_annotations (fun);
6865 timevar_push (TV_OUT_OF_SSA);
6866 finish_out_of_ssa (&SA);
6867 timevar_pop (TV_OUT_OF_SSA);
6869 timevar_push (TV_POST_EXPAND);
6870 /* We are no longer in SSA form. */
6871 fun->gimple_df->in_ssa_p = false;
6872 loops_state_clear (LOOP_CLOSED_SSA);
6874 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6875 conservatively to true until they are all profile aware.
NOTE(review): nothing in the statements that follow touches
maybe_hot_insn_p; this comment looks stale -- confirm. */
6876 delete lab_rtx_for_bb;
6877 free_histograms (fun);
6879 construct_exit_block ();
6880 insn_locations_finalize ();
/* Place the sequence returned by expand_used_vars after the return
label, or after the basic-block note that directly follows it. */
6882 if (var_ret_seq)
6884 rtx_insn *after = return_label;
6885 rtx_insn *next = NEXT_INSN (after);
6886 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6887 after = next;
6888 emit_insn_after (var_ret_seq, after);
6891 if (hwasan_sanitize_stack_p ())
6892 hwasan_maybe_emit_frame_base_init ();
6894 /* Zap the tree EH table. */
6895 set_eh_throw_stmt_table (fun, NULL);
6897 /* We need JUMP_LABEL to be set in order to redirect jumps, and hence
6898 split edges which edge insertions might do. */
6899 rebuild_jump_labels (get_insns ());
6901 /* If we have a single successor to the entry block, put the pending insns
6902 after parm birth, but before NOTE_INSN_FUNCTION_BEG. */
6903 if (single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6905 edge e = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (fun));
6906 if (e->insns.r)
6908 rtx_insn *insns = e->insns.r;
6909 e->insns.r = NULL;
6910 rebuild_jump_labels_chain (insns);
6911 if (NOTE_P (parm_birth_insn)
6912 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6913 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6914 else
6915 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6919 /* Otherwise, as well as for other edges, take the usual way. */
6920 commit_edge_insertions ();
6922 /* We're done expanding trees to RTL. */
6923 currently_expanding_to_rtl = 0;
6925 flush_mark_addressable_queue ();
6927 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6928 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6930 edge e;
6931 edge_iterator ei;
/* The iterator is advanced only when the edge is kept; after
remove_edge the same iterator position is examined again. */
6932 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6934 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6935 e->flags &= ~EDGE_EXECUTABLE;
6937 /* At the moment not all abnormal edges match the RTL
6938 representation. It is safe to remove them here as
6939 find_many_sub_basic_blocks will rediscover them.
6940 In the future we should get this fixed properly. */
6941 if ((e->flags & EDGE_ABNORMAL)
6942 && !(e->flags & EDGE_SIBCALL))
6943 remove_edge (e);
6944 else
6945 ei_next (&ei);
6949 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6950 bitmap_ones (blocks);
6951 find_many_sub_basic_blocks (blocks);
6952 purge_all_dead_edges ();
6954 /* After initial rtl generation, call back to finish generating
6955 exception support code. We need to do this before cleaning up
6956 the CFG as the code does not expect dead landing pads. */
6957 if (fun->eh->region_tree != NULL)
6958 finish_eh_generation ();
6960 /* Call expand_stack_alignment after finishing all
6961 updates to crtl->preferred_stack_boundary. */
6962 expand_stack_alignment ();
6964 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6965 function. */
6966 if (crtl->tail_call_emit)
6967 fixup_tail_calls ();
/* Compute the patchable-function-entry area. The size and entry
offset are first parsed from flag_patchable_function_entry; a
"patchable_function_entry" attribute on the function then replaces
both (the entry offset defaults to 0 when the attribute has only one
value). An entry offset larger than the size is reset to 0, with a
warning when the size is nonzero. The result is stored in crtl. */
6969 HOST_WIDE_INT patch_area_size, patch_area_entry;
6970 parse_and_check_patch_area (flag_patchable_function_entry, false,
6971 &patch_area_size, &patch_area_entry);
6973 tree patchable_function_entry_attr
6974 = lookup_attribute ("patchable_function_entry",
6975 DECL_ATTRIBUTES (cfun->decl));
6976 if (patchable_function_entry_attr)
6978 tree pp_val = TREE_VALUE (patchable_function_entry_attr);
6979 tree patchable_function_entry_value1 = TREE_VALUE (pp_val);
6981 patch_area_size = tree_to_uhwi (patchable_function_entry_value1);
6982 patch_area_entry = 0;
6983 if (TREE_CHAIN (pp_val) != NULL_TREE)
6985 tree patchable_function_entry_value2
6986 = TREE_VALUE (TREE_CHAIN (pp_val));
6987 patch_area_entry = tree_to_uhwi (patchable_function_entry_value2);
6991 if (patch_area_entry > patch_area_size)
6993 if (patch_area_size > 0)
6994 warning (OPT_Wattributes,
6995 "patchable function entry %wu exceeds size %wu",
6996 patch_area_entry, patch_area_size);
6997 patch_area_entry = 0;
7000 crtl->patch_area_size = patch_area_size;
7001 crtl->patch_area_entry = patch_area_entry;
7003 /* BB subdivision may have created basic blocks that are only reachable
7004 from unlikely bbs but not marked as such in the profile. */
7005 if (optimize)
7006 propagate_unlikely_bbs_forward ();
7008 /* Remove unreachable blocks, otherwise we cannot compute dominators
7009 which are needed for loop state verification. As a side-effect
7010 this also compacts blocks.
7011 ??? We cannot remove trivially dead insns here as for example
7012 the DRAP reg on i?86 is not magically live at this point.
7013 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
7014 cleanup_cfg (CLEANUP_NO_INSN_DEL);
7016 checking_verify_flow_info ();
7018 /* Initialize pseudos allocated for hard registers. */
7019 emit_initial_value_sets ();
7021 /* And finally unshare all RTL. */
7022 unshare_all_rtl ();
7024 /* There's no need to defer outputting this function any more; we
7025 know we want to output it. */
7026 DECL_DEFER_OUTPUT (current_function_decl) = 0;
7028 /* Now that we're done expanding trees to RTL, we shouldn't have any
7029 more CONCATs anywhere. */
7030 generating_concat_p = 0;
7032 if (dump_file)
7034 fprintf (dump_file,
7035 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
7036 /* And the pass manager will dump RTL for us. */
7039 /* If we're emitting a nested function, make sure its parent gets
7040 emitted as well. Doing otherwise confuses debug info. */
7042 tree parent;
7043 for (parent = DECL_CONTEXT (current_function_decl);
7044 parent != NULL_TREE;
7045 parent = get_containing_scope (parent))
7046 if (TREE_CODE (parent) == FUNCTION_DECL)
7047 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
7050 TREE_ASM_WRITTEN (current_function_decl) = 1;
7052 /* After expanding, the return labels are no longer needed. */
7053 return_label = NULL;
7054 naked_return_label = NULL;
7056 /* After expanding, the tm_restart map is no longer needed. */
7057 if (fun->gimple_df->tm_restart)
7058 fun->gimple_df->tm_restart = NULL;
7060 /* Tag the blocks with a depth number so that change_scope can find
7061 the common parent easily. */
7062 set_block_levels (DECL_INITIAL (fun->decl), 0);
7063 default_rtl_profile ();
7065 /* For -dx discard loops now, otherwise IL verify in clean_state will
7066 ICE. */
7067 if (rtl_dump_and_exit)
7069 cfun->curr_properties &= ~PROP_loops;
7070 loop_optimizer_finalize ();
7073 timevar_pop (TV_POST_EXPAND);
7075 return 0;
7078 } // anon namespace
/* Allocate a new pass_expand for context CTXT with operator new and
return it as an rtl_opt_pass pointer. Who releases the object is not
visible from here. */
7080 rtl_opt_pass *
7081 make_pass_expand (gcc::context *ctxt)
7083 return new pass_expand (ctxt);