mklog: add subject line skeleton
[official-gcc.git] / gcc / cfgexpand.c
blob39e5b04042704fbe89b4e60250302d0a78fb4045
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2021 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "tree-inline.h"
65 #include "value-prof.h"
66 #include "tree-ssa-live.h"
67 #include "tree-outof-ssa.h"
68 #include "cfgloop.h"
69 #include "insn-attr.h" /* For INSN_SCHEDULING. */
70 #include "stringpool.h"
71 #include "attribs.h"
72 #include "asan.h"
73 #include "tree-ssa-address.h"
74 #include "output.h"
75 #include "builtins.h"
76 #include "opts.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
/* This variable holds the currently expanded gimple statement for purposes
   of communicating the profile info to the builtin expanders.  */
92 gimple *currently_expanding_gimple_stmt;
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 switch (gimple_assign_rhs_class (stmt))
109 case GIMPLE_TERNARY_RHS:
110 t = build3 (gimple_assign_rhs_code (stmt),
111 TREE_TYPE (gimple_assign_lhs (stmt)),
112 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt),
113 gimple_assign_rhs3 (stmt));
114 break;
115 case GIMPLE_BINARY_RHS:
116 t = build2 (gimple_assign_rhs_code (stmt),
117 TREE_TYPE (gimple_assign_lhs (stmt)),
118 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt));
119 break;
120 case GIMPLE_UNARY_RHS:
121 t = build1 (gimple_assign_rhs_code (stmt),
122 TREE_TYPE (gimple_assign_lhs (stmt)),
123 gimple_assign_rhs1 (stmt));
124 break;
125 case GIMPLE_SINGLE_RHS:
127 t = gimple_assign_rhs1 (stmt);
128 /* Avoid modifying this tree in place below. */
129 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
130 && gimple_location (stmt) != EXPR_LOCATION (t))
131 || (gimple_block (stmt) && currently_expanding_to_rtl
132 && EXPR_P (t)))
133 t = copy_node (t);
134 break;
136 default:
137 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 class stack_var
310 public:
311 /* The Variable. */
312 tree decl;
314 /* Initially, the size of the variable. Later, the size of the partition,
315 if this variable becomes it's partition's representative. */
316 poly_uint64 size;
318 /* The *byte* alignment required for this variable. Or as, with the
319 size, the alignment for this partition. */
320 unsigned int alignb;
322 /* The partition representative. */
323 size_t representative;
325 /* The next stack variable in the partition, or EOC. */
326 size_t next;
328 /* The numbers of conflicting stack variables. */
329 bitmap conflicts;
332 #define EOC ((size_t)-1)
334 /* We have an array of such objects while deciding allocation. */
335 static class stack_var *stack_vars;
336 static size_t stack_vars_alloc;
337 static size_t stack_vars_num;
338 static hash_map<tree, size_t> *decl_to_stack_part;
340 /* Conflict bitmaps go on this obstack. This allows us to destroy
341 all of them in one big sweep. */
342 static bitmap_obstack stack_var_bitmap_obstack;
344 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
345 is non-decreasing. */
346 static size_t *stack_vars_sorted;
348 /* The phase of the stack frame. This is the known misalignment of
349 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
350 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
351 static int frame_phase;
353 /* Used during expand_used_vars to remember if we saw any decls for
354 which we'd like to enable stack smashing protection. */
355 static bool has_protected_decls;
/* Used during expand_used_vars.  Remember if we saw a character buffer
   smaller than our cutoff threshold.  Used for -Wstack-protector.  */
359 static bool has_short_buffer;
361 /* Compute the byte alignment to use for DECL. Ignore alignment
362 we can't do with expected alignment of the stack boundary. */
364 static unsigned int
365 align_local_variable (tree decl, bool really_expand)
367 unsigned int align;
369 if (TREE_CODE (decl) == SSA_NAME)
371 tree type = TREE_TYPE (decl);
372 machine_mode mode = TYPE_MODE (type);
374 align = TYPE_ALIGN (type);
375 if (mode != BLKmode
376 && align < GET_MODE_ALIGNMENT (mode))
377 align = GET_MODE_ALIGNMENT (mode);
379 else
380 align = LOCAL_DECL_ALIGNMENT (decl);
382 if (hwasan_sanitize_stack_p ())
383 align = MAX (align, (unsigned) HWASAN_TAG_GRANULE_SIZE * BITS_PER_UNIT);
385 if (TREE_CODE (decl) != SSA_NAME && really_expand)
386 /* Don't change DECL_ALIGN when called from estimated_stack_frame_size.
387 That is done before IPA and could bump alignment based on host
388 backend even for offloaded code which wants different
389 LOCAL_DECL_ALIGNMENT. */
390 SET_DECL_ALIGN (decl, align);
392 return align / BITS_PER_UNIT;
395 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
396 down otherwise. Return truncated BASE value. */
398 static inline unsigned HOST_WIDE_INT
399 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
401 return align_up ? (base + align - 1) & -align : base & -align;
404 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
405 Return the frame offset. */
407 static poly_int64
408 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
410 poly_int64 offset, new_frame_offset;
412 if (FRAME_GROWS_DOWNWARD)
414 new_frame_offset
415 = aligned_lower_bound (frame_offset - frame_phase - size,
416 align) + frame_phase;
417 offset = new_frame_offset;
419 else
421 new_frame_offset
422 = aligned_upper_bound (frame_offset - frame_phase,
423 align) + frame_phase;
424 offset = new_frame_offset;
425 new_frame_offset += size;
427 frame_offset = new_frame_offset;
429 if (frame_offset_overflow (frame_offset, cfun->decl))
430 frame_offset = offset = 0;
432 return offset;
435 /* Ensure that the stack is aligned to ALIGN bytes.
436 Return the new frame offset. */
437 static poly_int64
438 align_frame_offset (unsigned HOST_WIDE_INT align)
440 return alloc_stack_frame_space (0, align);
443 /* Accumulate DECL into STACK_VARS. */
445 static void
446 add_stack_var (tree decl, bool really_expand)
448 class stack_var *v;
450 if (stack_vars_num >= stack_vars_alloc)
452 if (stack_vars_alloc)
453 stack_vars_alloc = stack_vars_alloc * 3 / 2;
454 else
455 stack_vars_alloc = 32;
456 stack_vars
457 = XRESIZEVEC (class stack_var, stack_vars, stack_vars_alloc);
459 if (!decl_to_stack_part)
460 decl_to_stack_part = new hash_map<tree, size_t>;
462 v = &stack_vars[stack_vars_num];
463 decl_to_stack_part->put (decl, stack_vars_num);
465 v->decl = decl;
466 tree size = TREE_CODE (decl) == SSA_NAME
467 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
468 : DECL_SIZE_UNIT (decl);
469 v->size = tree_to_poly_uint64 (size);
470 /* Ensure that all variables have size, so that &a != &b for any two
471 variables that are simultaneously live. */
472 if (known_eq (v->size, 0U))
473 v->size = 1;
474 v->alignb = align_local_variable (decl, really_expand);
475 /* An alignment of zero can mightily confuse us later. */
476 gcc_assert (v->alignb != 0);
478 /* All variables are initially in their own partition. */
479 v->representative = stack_vars_num;
480 v->next = EOC;
482 /* All variables initially conflict with no other. */
483 v->conflicts = NULL;
485 /* Ensure that this decl doesn't get put onto the list twice. */
486 set_rtl (decl, pc_rtx);
488 stack_vars_num++;
491 /* Make the decls associated with luid's X and Y conflict. */
493 static void
494 add_stack_var_conflict (size_t x, size_t y)
496 class stack_var *a = &stack_vars[x];
497 class stack_var *b = &stack_vars[y];
498 if (x == y)
499 return;
500 if (!a->conflicts)
501 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
502 if (!b->conflicts)
503 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
504 bitmap_set_bit (a->conflicts, y);
505 bitmap_set_bit (b->conflicts, x);
508 /* Check whether the decls associated with luid's X and Y conflict. */
510 static bool
511 stack_var_conflict_p (size_t x, size_t y)
513 class stack_var *a = &stack_vars[x];
514 class stack_var *b = &stack_vars[y];
515 if (x == y)
516 return false;
517 /* Partitions containing an SSA name result from gimple registers
518 with things like unsupported modes. They are top-level and
519 hence conflict with everything else. */
520 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
521 return true;
523 if (!a->conflicts || !b->conflicts)
524 return false;
525 return bitmap_bit_p (a->conflicts, y);
528 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
529 enter its partition number into bitmap DATA. */
531 static bool
532 visit_op (gimple *, tree op, tree, void *data)
534 bitmap active = (bitmap)data;
535 op = get_base_address (op);
536 if (op
537 && DECL_P (op)
538 && DECL_RTL_IF_SET (op) == pc_rtx)
540 size_t *v = decl_to_stack_part->get (op);
541 if (v)
542 bitmap_set_bit (active, *v);
544 return false;
547 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
548 record conflicts between it and all currently active other partitions
549 from bitmap DATA. */
551 static bool
552 visit_conflict (gimple *, tree op, tree, void *data)
554 bitmap active = (bitmap)data;
555 op = get_base_address (op);
556 if (op
557 && DECL_P (op)
558 && DECL_RTL_IF_SET (op) == pc_rtx)
560 size_t *v = decl_to_stack_part->get (op);
561 if (v && bitmap_set_bit (active, *v))
563 size_t num = *v;
564 bitmap_iterator bi;
565 unsigned i;
566 gcc_assert (num < stack_vars_num);
567 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
568 add_stack_var_conflict (num, i);
571 return false;
574 /* Helper routine for add_scope_conflicts, calculating the active partitions
575 at the end of BB, leaving the result in WORK. We're called to generate
576 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
577 liveness. */
579 static void
580 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
582 edge e;
583 edge_iterator ei;
584 gimple_stmt_iterator gsi;
585 walk_stmt_load_store_addr_fn visit;
587 bitmap_clear (work);
588 FOR_EACH_EDGE (e, ei, bb->preds)
589 bitmap_ior_into (work, (bitmap)e->src->aux);
591 visit = visit_op;
593 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
595 gimple *stmt = gsi_stmt (gsi);
596 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
598 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
600 gimple *stmt = gsi_stmt (gsi);
602 if (gimple_clobber_p (stmt))
604 tree lhs = gimple_assign_lhs (stmt);
605 size_t *v;
606 /* Nested function lowering might introduce LHSs
607 that are COMPONENT_REFs. */
608 if (!VAR_P (lhs))
609 continue;
610 if (DECL_RTL_IF_SET (lhs) == pc_rtx
611 && (v = decl_to_stack_part->get (lhs)))
612 bitmap_clear_bit (work, *v);
614 else if (!is_gimple_debug (stmt))
616 if (for_conflict
617 && visit == visit_op)
619 /* If this is the first real instruction in this BB we need
620 to add conflicts for everything live at this point now.
621 Unlike classical liveness for named objects we can't
622 rely on seeing a def/use of the names we're interested in.
623 There might merely be indirect loads/stores. We'd not add any
624 conflicts for such partitions. */
625 bitmap_iterator bi;
626 unsigned i;
627 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
629 class stack_var *a = &stack_vars[i];
630 if (!a->conflicts)
631 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
632 bitmap_ior_into (a->conflicts, work);
634 visit = visit_conflict;
636 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
641 /* Generate stack partition conflicts between all partitions that are
642 simultaneously live. */
644 static void
645 add_scope_conflicts (void)
647 basic_block bb;
648 bool changed;
649 bitmap work = BITMAP_ALLOC (NULL);
650 int *rpo;
651 int n_bbs;
653 /* We approximate the live range of a stack variable by taking the first
654 mention of its name as starting point(s), and by the end-of-scope
655 death clobber added by gimplify as ending point(s) of the range.
656 This overapproximates in the case we for instance moved an address-taken
657 operation upward, without also moving a dereference to it upwards.
658 But it's conservatively correct as a variable never can hold values
659 before its name is mentioned at least once.
661 We then do a mostly classical bitmap liveness algorithm. */
663 FOR_ALL_BB_FN (bb, cfun)
664 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
666 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
667 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
669 changed = true;
670 while (changed)
672 int i;
673 changed = false;
674 for (i = 0; i < n_bbs; i++)
676 bitmap active;
677 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
678 active = (bitmap)bb->aux;
679 add_scope_conflicts_1 (bb, work, false);
680 if (bitmap_ior_into (active, work))
681 changed = true;
685 FOR_EACH_BB_FN (bb, cfun)
686 add_scope_conflicts_1 (bb, work, true);
688 free (rpo);
689 BITMAP_FREE (work);
690 FOR_ALL_BB_FN (bb, cfun)
691 BITMAP_FREE (bb->aux);
694 /* A subroutine of partition_stack_vars. A comparison function for qsort,
695 sorting an array of indices by the properties of the object. */
697 static int
698 stack_var_cmp (const void *a, const void *b)
700 size_t ia = *(const size_t *)a;
701 size_t ib = *(const size_t *)b;
702 unsigned int aligna = stack_vars[ia].alignb;
703 unsigned int alignb = stack_vars[ib].alignb;
704 poly_int64 sizea = stack_vars[ia].size;
705 poly_int64 sizeb = stack_vars[ib].size;
706 tree decla = stack_vars[ia].decl;
707 tree declb = stack_vars[ib].decl;
708 bool largea, largeb;
709 unsigned int uida, uidb;
711 /* Primary compare on "large" alignment. Large comes first. */
712 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
713 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
714 if (largea != largeb)
715 return (int)largeb - (int)largea;
717 /* Secondary compare on size, decreasing */
718 int diff = compare_sizes_for_sort (sizeb, sizea);
719 if (diff != 0)
720 return diff;
722 /* Tertiary compare on true alignment, decreasing. */
723 if (aligna < alignb)
724 return -1;
725 if (aligna > alignb)
726 return 1;
728 /* Final compare on ID for sort stability, increasing.
729 Two SSA names are compared by their version, SSA names come before
730 non-SSA names, and two normal decls are compared by their DECL_UID. */
731 if (TREE_CODE (decla) == SSA_NAME)
733 if (TREE_CODE (declb) == SSA_NAME)
734 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
735 else
736 return -1;
738 else if (TREE_CODE (declb) == SSA_NAME)
739 return 1;
740 else
741 uida = DECL_UID (decla), uidb = DECL_UID (declb);
742 if (uida < uidb)
743 return 1;
744 if (uida > uidb)
745 return -1;
746 return 0;
749 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
750 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
752 /* If the points-to solution *PI points to variables that are in a partition
753 together with other variables add all partition members to the pointed-to
754 variables bitmap. */
756 static void
757 add_partitioned_vars_to_ptset (struct pt_solution *pt,
758 part_hashmap *decls_to_partitions,
759 hash_set<bitmap> *visited, bitmap temp)
761 bitmap_iterator bi;
762 unsigned i;
763 bitmap *part;
765 if (pt->anything
766 || pt->vars == NULL
767 /* The pointed-to vars bitmap is shared, it is enough to
768 visit it once. */
769 || visited->add (pt->vars))
770 return;
772 bitmap_clear (temp);
774 /* By using a temporary bitmap to store all members of the partitions
775 we have to add we make sure to visit each of the partitions only
776 once. */
777 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
778 if ((!temp
779 || !bitmap_bit_p (temp, i))
780 && (part = decls_to_partitions->get (i)))
781 bitmap_ior_into (temp, *part);
782 if (!bitmap_empty_p (temp))
783 bitmap_ior_into (pt->vars, temp);
786 /* Update points-to sets based on partition info, so we can use them on RTL.
787 The bitmaps representing stack partitions will be saved until expand,
788 where partitioned decls used as bases in memory expressions will be
789 rewritten. */
791 static void
792 update_alias_info_with_stack_vars (void)
794 part_hashmap *decls_to_partitions = NULL;
795 size_t i, j;
796 tree var = NULL_TREE;
798 for (i = 0; i < stack_vars_num; i++)
800 bitmap part = NULL;
801 tree name;
802 struct ptr_info_def *pi;
804 /* Not interested in partitions with single variable. */
805 if (stack_vars[i].representative != i
806 || stack_vars[i].next == EOC)
807 continue;
809 if (!decls_to_partitions)
811 decls_to_partitions = new part_hashmap;
812 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
815 /* Create an SSA_NAME that points to the partition for use
816 as base during alias-oracle queries on RTL for bases that
817 have been partitioned. */
818 if (var == NULL_TREE)
819 var = create_tmp_var (ptr_type_node);
820 name = make_ssa_name (var);
822 /* Create bitmaps representing partitions. They will be used for
823 points-to sets later, so use GGC alloc. */
824 part = BITMAP_GGC_ALLOC ();
825 for (j = i; j != EOC; j = stack_vars[j].next)
827 tree decl = stack_vars[j].decl;
828 unsigned int uid = DECL_PT_UID (decl);
829 bitmap_set_bit (part, uid);
830 decls_to_partitions->put (uid, part);
831 cfun->gimple_df->decls_to_pointers->put (decl, name);
832 if (TREE_ADDRESSABLE (decl))
833 TREE_ADDRESSABLE (name) = 1;
836 /* Make the SSA name point to all partition members. */
837 pi = get_ptr_info (name);
838 pt_solution_set (&pi->pt, part, false);
841 /* Make all points-to sets that contain one member of a partition
842 contain all members of the partition. */
843 if (decls_to_partitions)
845 unsigned i;
846 tree name;
847 hash_set<bitmap> visited;
848 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
850 FOR_EACH_SSA_NAME (i, name, cfun)
852 struct ptr_info_def *pi;
854 if (POINTER_TYPE_P (TREE_TYPE (name))
855 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
856 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
857 &visited, temp);
860 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
861 decls_to_partitions, &visited, temp);
863 delete decls_to_partitions;
864 BITMAP_FREE (temp);
868 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
869 partitioning algorithm. Partitions A and B are known to be non-conflicting.
870 Merge them into a single partition A. */
872 static void
873 union_stack_vars (size_t a, size_t b)
875 class stack_var *vb = &stack_vars[b];
876 bitmap_iterator bi;
877 unsigned u;
879 gcc_assert (stack_vars[b].next == EOC);
880 /* Add B to A's partition. */
881 stack_vars[b].next = stack_vars[a].next;
882 stack_vars[b].representative = a;
883 stack_vars[a].next = b;
885 /* Make sure A is big enough to hold B. */
886 stack_vars[a].size = upper_bound (stack_vars[a].size, stack_vars[b].size);
888 /* Update the required alignment of partition A to account for B. */
889 if (stack_vars[a].alignb < stack_vars[b].alignb)
890 stack_vars[a].alignb = stack_vars[b].alignb;
892 /* Update the interference graph and merge the conflicts. */
893 if (vb->conflicts)
895 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
896 add_stack_var_conflict (a, stack_vars[u].representative);
897 BITMAP_FREE (vb->conflicts);
901 /* A subroutine of expand_used_vars. Binpack the variables into
902 partitions constrained by the interference graph. The overall
903 algorithm used is as follows:
905 Sort the objects by size in descending order.
906 For each object A {
907 S = size(A)
908 O = 0
909 loop {
910 Look for the largest non-conflicting object B with size <= S.
911 UNION (A, B)
916 static void
917 partition_stack_vars (void)
919 size_t si, sj, n = stack_vars_num;
921 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
922 for (si = 0; si < n; ++si)
923 stack_vars_sorted[si] = si;
925 if (n == 1)
926 return;
928 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
930 for (si = 0; si < n; ++si)
932 size_t i = stack_vars_sorted[si];
933 unsigned int ialign = stack_vars[i].alignb;
934 poly_int64 isize = stack_vars[i].size;
936 /* Ignore objects that aren't partition representatives. If we
937 see a var that is not a partition representative, it must
938 have been merged earlier. */
939 if (stack_vars[i].representative != i)
940 continue;
942 for (sj = si + 1; sj < n; ++sj)
944 size_t j = stack_vars_sorted[sj];
945 unsigned int jalign = stack_vars[j].alignb;
946 poly_int64 jsize = stack_vars[j].size;
948 /* Ignore objects that aren't partition representatives. */
949 if (stack_vars[j].representative != j)
950 continue;
952 /* Do not mix objects of "small" (supported) alignment
953 and "large" (unsupported) alignment. */
954 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
955 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
956 break;
958 /* For Address Sanitizer do not mix objects with different
959 sizes, as the shorter vars wouldn't be adequately protected.
960 Don't do that for "large" (unsupported) alignment objects,
961 those aren't protected anyway. */
962 if (asan_sanitize_stack_p ()
963 && maybe_ne (isize, jsize)
964 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
965 break;
967 /* Ignore conflicting objects. */
968 if (stack_var_conflict_p (i, j))
969 continue;
971 /* UNION the objects, placing J at OFFSET. */
972 union_stack_vars (i, j);
976 update_alias_info_with_stack_vars ();
979 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
981 static void
982 dump_stack_var_partition (void)
984 size_t si, i, j, n = stack_vars_num;
986 for (si = 0; si < n; ++si)
988 i = stack_vars_sorted[si];
990 /* Skip variables that aren't partition representatives, for now. */
991 if (stack_vars[i].representative != i)
992 continue;
994 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
995 print_dec (stack_vars[i].size, dump_file);
996 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
998 for (j = i; j != EOC; j = stack_vars[j].next)
1000 fputc ('\t', dump_file);
1001 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
1003 fputc ('\n', dump_file);
1007 /* Assign rtl to DECL at BASE + OFFSET. */
1009 static void
1010 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
1011 poly_int64 offset)
1013 unsigned align;
1014 rtx x;
1016 /* If this fails, we've overflowed the stack frame. Error nicely? */
1017 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
1019 if (hwasan_sanitize_stack_p ())
1020 x = targetm.memtag.add_tag (base, offset,
1021 hwasan_current_frame_tag ());
1022 else
1023 x = plus_constant (Pmode, base, offset);
1025 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
1026 ? TYPE_MODE (TREE_TYPE (decl))
1027 : DECL_MODE (decl), x);
1029 /* Set alignment we actually gave this decl if it isn't an SSA name.
1030 If it is we generate stack slots only accidentally so it isn't as
1031 important, we'll simply set the alignment directly on the MEM. */
1033 if (stack_vars_base_reg_p (base))
1034 offset -= frame_phase;
1035 align = known_alignment (offset);
1036 align *= BITS_PER_UNIT;
1037 if (align == 0 || align > base_align)
1038 align = base_align;
1040 if (TREE_CODE (decl) != SSA_NAME)
1042 /* One would think that we could assert that we're not decreasing
1043 alignment here, but (at least) the i386 port does exactly this
1044 via the MINIMUM_ALIGNMENT hook. */
1046 SET_DECL_ALIGN (decl, align);
1047 DECL_USER_ALIGN (decl) = 0;
1050 set_rtl (decl, x);
1052 set_mem_align (x, align);
1055 class stack_vars_data
1057 public:
1058 /* Vector of offset pairs, always end of some padding followed
1059 by start of the padding that needs Address Sanitizer protection.
1060 The vector is in reversed, highest offset pairs come first. */
1061 auto_vec<HOST_WIDE_INT> asan_vec;
1063 /* Vector of partition representative decls in between the paddings. */
1064 auto_vec<tree> asan_decl_vec;
1066 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1067 rtx asan_base;
1069 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1070 unsigned int asan_alignb;
1073 /* A subroutine of expand_used_vars. Give each partition representative
1074 a unique location within the stack frame. Update each partition member
1075 with that location. */
1076 static void
1077 expand_stack_vars (bool (*pred) (size_t), class stack_vars_data *data)
1079 size_t si, i, j, n = stack_vars_num;
1080 poly_uint64 large_size = 0, large_alloc = 0;
1081 rtx large_base = NULL;
1082 rtx large_untagged_base = NULL;
1083 unsigned large_align = 0;
1084 bool large_allocation_done = false;
1085 tree decl;
1087 /* Determine if there are any variables requiring "large" alignment.
1088 Since these are dynamically allocated, we only process these if
1089 no predicate involved. */
1090 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1091 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1093 /* Find the total size of these variables. */
1094 for (si = 0; si < n; ++si)
1096 unsigned alignb;
1098 i = stack_vars_sorted[si];
1099 alignb = stack_vars[i].alignb;
1101 /* All "large" alignment decls come before all "small" alignment
1102 decls, but "large" alignment decls are not sorted based on
1103 their alignment. Increase large_align to track the largest
1104 required alignment. */
1105 if ((alignb * BITS_PER_UNIT) > large_align)
1106 large_align = alignb * BITS_PER_UNIT;
1108 /* Stop when we get to the first decl with "small" alignment. */
1109 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1110 break;
1112 /* Skip variables that aren't partition representatives. */
1113 if (stack_vars[i].representative != i)
1114 continue;
1116 /* Skip variables that have already had rtl assigned. See also
1117 add_stack_var where we perpetrate this pc_rtx hack. */
1118 decl = stack_vars[i].decl;
1119 if (TREE_CODE (decl) == SSA_NAME
1120 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1121 : DECL_RTL (decl) != pc_rtx)
1122 continue;
1124 large_size = aligned_upper_bound (large_size, alignb);
1125 large_size += stack_vars[i].size;
1129 for (si = 0; si < n; ++si)
1131 rtx base;
1132 unsigned base_align, alignb;
1133 poly_int64 offset = 0;
1135 i = stack_vars_sorted[si];
1137 /* Skip variables that aren't partition representatives, for now. */
1138 if (stack_vars[i].representative != i)
1139 continue;
1141 /* Skip variables that have already had rtl assigned. See also
1142 add_stack_var where we perpetrate this pc_rtx hack. */
1143 decl = stack_vars[i].decl;
1144 if (TREE_CODE (decl) == SSA_NAME
1145 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1146 : DECL_RTL (decl) != pc_rtx)
1147 continue;
1149 /* Check the predicate to see whether this variable should be
1150 allocated in this pass. */
1151 if (pred && !pred (i))
1152 continue;
1154 base = (hwasan_sanitize_stack_p ()
1155 ? hwasan_frame_base ()
1156 : virtual_stack_vars_rtx);
1157 alignb = stack_vars[i].alignb;
1158 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1160 poly_int64 hwasan_orig_offset;
1161 if (hwasan_sanitize_stack_p ())
1163 /* There must be no tag granule "shared" between different
1164 objects. This means that no HWASAN_TAG_GRANULE_SIZE byte
1165 chunk can have more than one object in it.
1167 We ensure this by forcing the end of the last bit of data to
1168 be aligned to HWASAN_TAG_GRANULE_SIZE bytes here, and setting
1169 the start of each variable to be aligned to
1170 HWASAN_TAG_GRANULE_SIZE bytes in `align_local_variable`.
1172 We can't align just one of the start or end, since there are
1173 untagged things stored on the stack which we do not align to
1174 HWASAN_TAG_GRANULE_SIZE bytes. If we only aligned the start
1175 or the end of tagged objects then untagged objects could end
1176 up sharing the first granule of a tagged object or sharing the
1177 last granule of a tagged object respectively. */
1178 hwasan_orig_offset = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1179 gcc_assert (stack_vars[i].alignb >= HWASAN_TAG_GRANULE_SIZE);
1181 /* ASAN description strings don't yet have a syntax for expressing
1182 polynomial offsets. */
1183 HOST_WIDE_INT prev_offset;
1184 if (asan_sanitize_stack_p ()
1185 && pred
1186 && frame_offset.is_constant (&prev_offset)
1187 && stack_vars[i].size.is_constant ())
1189 if (data->asan_vec.is_empty ())
1191 align_frame_offset (ASAN_RED_ZONE_SIZE);
1192 prev_offset = frame_offset.to_constant ();
1194 prev_offset = align_base (prev_offset,
1195 ASAN_MIN_RED_ZONE_SIZE,
1196 !FRAME_GROWS_DOWNWARD);
1197 tree repr_decl = NULL_TREE;
1198 unsigned HOST_WIDE_INT size
1199 = asan_var_and_redzone_size (stack_vars[i].size.to_constant ());
1200 if (data->asan_vec.is_empty ())
1201 size = MAX (size, ASAN_RED_ZONE_SIZE);
1203 unsigned HOST_WIDE_INT alignment = MAX (alignb,
1204 ASAN_MIN_RED_ZONE_SIZE);
1205 offset = alloc_stack_frame_space (size, alignment);
1207 data->asan_vec.safe_push (prev_offset);
1208 /* Allocating a constant amount of space from a constant
1209 starting offset must give a constant result. */
1210 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1211 .to_constant ());
1212 /* Find best representative of the partition.
1213 Prefer those with DECL_NAME, even better
1214 satisfying asan_protect_stack_decl predicate. */
1215 for (j = i; j != EOC; j = stack_vars[j].next)
1216 if (asan_protect_stack_decl (stack_vars[j].decl)
1217 && DECL_NAME (stack_vars[j].decl))
1219 repr_decl = stack_vars[j].decl;
1220 break;
1222 else if (repr_decl == NULL_TREE
1223 && DECL_P (stack_vars[j].decl)
1224 && DECL_NAME (stack_vars[j].decl))
1225 repr_decl = stack_vars[j].decl;
1226 if (repr_decl == NULL_TREE)
1227 repr_decl = stack_vars[i].decl;
1228 data->asan_decl_vec.safe_push (repr_decl);
1230 /* Make sure a representative is unpoison if another
1231 variable in the partition is handled by
1232 use-after-scope sanitization. */
1233 if (asan_handled_variables != NULL
1234 && !asan_handled_variables->contains (repr_decl))
1236 for (j = i; j != EOC; j = stack_vars[j].next)
1237 if (asan_handled_variables->contains (stack_vars[j].decl))
1238 break;
1239 if (j != EOC)
1240 asan_handled_variables->add (repr_decl);
1243 data->asan_alignb = MAX (data->asan_alignb, alignb);
1244 if (data->asan_base == NULL)
1245 data->asan_base = gen_reg_rtx (Pmode);
1246 base = data->asan_base;
1248 if (!STRICT_ALIGNMENT)
1249 base_align = crtl->max_used_stack_slot_alignment;
1250 else
1251 base_align = MAX (crtl->max_used_stack_slot_alignment,
1252 GET_MODE_ALIGNMENT (SImode)
1253 << ASAN_SHADOW_SHIFT);
1255 else
1257 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1258 base_align = crtl->max_used_stack_slot_alignment;
1260 if (hwasan_sanitize_stack_p ())
1262 /* Align again since the point of this alignment is to handle
1263 the "end" of the object (i.e. smallest address after the
1264 stack object). For FRAME_GROWS_DOWNWARD that requires
1265 aligning the stack before allocating, but for a frame that
1266 grows upwards that requires aligning the stack after
1267 allocation.
1269 Use `frame_offset` to record the offset value rather than
1270 `offset` since the `frame_offset` describes the extent
1271 allocated for this particular variable while `offset`
1272 describes the address that this variable starts at. */
1273 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1274 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1275 hwasan_orig_offset, frame_offset);
1279 else
1281 /* Large alignment is only processed in the last pass. */
1282 if (pred)
1283 continue;
1285 /* If there were any variables requiring "large" alignment, allocate
1286 space. */
1287 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1289 poly_int64 loffset;
1290 rtx large_allocsize;
1292 large_allocsize = gen_int_mode (large_size, Pmode);
1293 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1294 loffset = alloc_stack_frame_space
1295 (rtx_to_poly_int64 (large_allocsize),
1296 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1297 large_base = get_dynamic_stack_base (loffset, large_align, base);
1298 large_allocation_done = true;
1301 gcc_assert (large_base != NULL);
1302 large_alloc = aligned_upper_bound (large_alloc, alignb);
1303 offset = large_alloc;
1304 large_alloc += stack_vars[i].size;
1305 if (hwasan_sanitize_stack_p ())
1307 /* An object with a large alignment requirement means that the
1308 alignment requirement is greater than the required alignment
1309 for tags. */
1310 if (!large_untagged_base)
1311 large_untagged_base
1312 = targetm.memtag.untagged_pointer (large_base, NULL_RTX);
1313 /* Ensure the end of the variable is also aligned correctly. */
1314 poly_int64 align_again
1315 = aligned_upper_bound (large_alloc, HWASAN_TAG_GRANULE_SIZE);
1316 /* For large allocations we always allocate a chunk of space
1317 (which is addressed by large_untagged_base/large_base) and
1318 then use positive offsets from that. Hence the farthest
1319 offset is `align_again` and the nearest offset from the base
1320 is `offset`. */
1321 hwasan_record_stack_var (large_untagged_base, large_base,
1322 offset, align_again);
1325 base = large_base;
1326 base_align = large_align;
1329 /* Create rtl for each variable based on their location within the
1330 partition. */
1331 for (j = i; j != EOC; j = stack_vars[j].next)
1333 expand_one_stack_var_at (stack_vars[j].decl,
1334 base, base_align, offset);
1336 if (hwasan_sanitize_stack_p ())
1337 hwasan_increment_frame_tag ();
1340 gcc_assert (known_eq (large_alloc, large_size));
1343 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1344 static poly_uint64
1345 account_stack_vars (void)
1347 size_t si, j, i, n = stack_vars_num;
1348 poly_uint64 size = 0;
1350 for (si = 0; si < n; ++si)
1352 i = stack_vars_sorted[si];
1354 /* Skip variables that aren't partition representatives, for now. */
1355 if (stack_vars[i].representative != i)
1356 continue;
1358 size += stack_vars[i].size;
1359 for (j = i; j != EOC; j = stack_vars[j].next)
1360 set_rtl (stack_vars[j].decl, NULL);
1362 return size;
1365 /* Record the RTL assignment X for the default def of PARM. */
1367 extern void
1368 set_parm_rtl (tree parm, rtx x)
1370 gcc_assert (TREE_CODE (parm) == PARM_DECL
1371 || TREE_CODE (parm) == RESULT_DECL);
1373 if (x && !MEM_P (x))
1375 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1376 TYPE_MODE (TREE_TYPE (parm)),
1377 TYPE_ALIGN (TREE_TYPE (parm)));
1379 /* If the variable alignment is very large we'll dynamicaly
1380 allocate it, which means that in-frame portion is just a
1381 pointer. ??? We've got a pseudo for sure here, do we
1382 actually dynamically allocate its spilling area if needed?
1383 ??? Isn't it a problem when Pmode alignment also exceeds
1384 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1385 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1386 align = GET_MODE_ALIGNMENT (Pmode);
1388 record_alignment_for_reg_var (align);
1391 tree ssa = ssa_default_def (cfun, parm);
1392 if (!ssa)
1393 return set_rtl (parm, x);
1395 int part = var_to_partition (SA.map, ssa);
1396 gcc_assert (part != NO_PARTITION);
1398 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1399 gcc_assert (changed);
1401 set_rtl (ssa, x);
1402 gcc_assert (DECL_RTL (parm) == x);
1405 /* A subroutine of expand_one_var. Called to immediately assign rtl
1406 to a variable to be allocated in the stack frame. */
1408 static void
1409 expand_one_stack_var_1 (tree var)
1411 poly_uint64 size;
1412 poly_int64 offset;
1413 unsigned byte_align;
1415 if (TREE_CODE (var) == SSA_NAME)
1417 tree type = TREE_TYPE (var);
1418 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1420 else
1421 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1423 byte_align = align_local_variable (var, true);
1425 /* We handle highly aligned variables in expand_stack_vars. */
1426 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1428 rtx base;
1429 if (hwasan_sanitize_stack_p ())
1431 /* Allocate zero bytes to align the stack. */
1432 poly_int64 hwasan_orig_offset
1433 = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1434 offset = alloc_stack_frame_space (size, byte_align);
1435 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1436 base = hwasan_frame_base ();
1437 /* Use `frame_offset` to automatically account for machines where the
1438 frame grows upwards.
1440 `offset` will always point to the "start" of the stack object, which
1441 will be the smallest address, for ! FRAME_GROWS_DOWNWARD this is *not*
1442 the "furthest" offset from the base delimiting the current stack
1443 object. `frame_offset` will always delimit the extent that the frame.
1445 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1446 hwasan_orig_offset, frame_offset);
1448 else
1450 offset = alloc_stack_frame_space (size, byte_align);
1451 base = virtual_stack_vars_rtx;
1454 expand_one_stack_var_at (var, base,
1455 crtl->max_used_stack_slot_alignment, offset);
1457 if (hwasan_sanitize_stack_p ())
1458 hwasan_increment_frame_tag ();
1461 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1462 already assigned some MEM. */
1464 static void
1465 expand_one_stack_var (tree var)
1467 if (TREE_CODE (var) == SSA_NAME)
1469 int part = var_to_partition (SA.map, var);
1470 if (part != NO_PARTITION)
1472 rtx x = SA.partition_to_pseudo[part];
1473 gcc_assert (x);
1474 gcc_assert (MEM_P (x));
1475 return;
1479 return expand_one_stack_var_1 (var);
1482 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1483 that will reside in a hard register. */
1485 static void
1486 expand_one_hard_reg_var (tree var)
1488 rest_of_decl_compilation (var, 0, 0);
1491 /* Record the alignment requirements of some variable assigned to a
1492 pseudo. */
1494 static void
1495 record_alignment_for_reg_var (unsigned int align)
1497 if (SUPPORTS_STACK_ALIGNMENT
1498 && crtl->stack_alignment_estimated < align)
1500 /* stack_alignment_estimated shouldn't change after stack
1501 realign decision made */
1502 gcc_assert (!crtl->stack_realign_processed);
1503 crtl->stack_alignment_estimated = align;
1506 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1507 So here we only make sure stack_alignment_needed >= align. */
1508 if (crtl->stack_alignment_needed < align)
1509 crtl->stack_alignment_needed = align;
1510 if (crtl->max_used_stack_slot_alignment < align)
1511 crtl->max_used_stack_slot_alignment = align;
1514 /* Create RTL for an SSA partition. */
1516 static void
1517 expand_one_ssa_partition (tree var)
1519 int part = var_to_partition (SA.map, var);
1520 gcc_assert (part != NO_PARTITION);
1522 if (SA.partition_to_pseudo[part])
1523 return;
1525 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1526 TYPE_MODE (TREE_TYPE (var)),
1527 TYPE_ALIGN (TREE_TYPE (var)));
1529 /* If the variable alignment is very large we'll dynamicaly allocate
1530 it, which means that in-frame portion is just a pointer. */
1531 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1532 align = GET_MODE_ALIGNMENT (Pmode);
1534 record_alignment_for_reg_var (align);
1536 if (!use_register_for_decl (var))
1538 if (defer_stack_allocation (var, true))
1539 add_stack_var (var, true);
1540 else
1541 expand_one_stack_var_1 (var);
1542 return;
1545 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1546 rtx x = gen_reg_rtx (reg_mode);
1548 set_rtl (var, x);
1550 /* For a promoted variable, X will not be used directly but wrapped in a
1551 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1552 will assume that its upper bits can be inferred from its lower bits.
1553 Therefore, if X isn't initialized on every path from the entry, then
1554 we must do it manually in order to fulfill the above assumption. */
1555 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1556 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1557 emit_move_insn (x, CONST0_RTX (reg_mode));
1560 /* Record the association between the RTL generated for partition PART
1561 and the underlying variable of the SSA_NAME VAR. */
1563 static void
1564 adjust_one_expanded_partition_var (tree var)
1566 if (!var)
1567 return;
1569 tree decl = SSA_NAME_VAR (var);
1571 int part = var_to_partition (SA.map, var);
1572 if (part == NO_PARTITION)
1573 return;
1575 rtx x = SA.partition_to_pseudo[part];
1577 gcc_assert (x);
1579 set_rtl (var, x);
1581 if (!REG_P (x))
1582 return;
1584 /* Note if the object is a user variable. */
1585 if (decl && !DECL_ARTIFICIAL (decl))
1586 mark_user_reg (x);
1588 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1589 mark_reg_pointer (x, get_pointer_alignment (var));
1592 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1593 that will reside in a pseudo register. */
1595 static void
1596 expand_one_register_var (tree var)
1598 if (TREE_CODE (var) == SSA_NAME)
1600 int part = var_to_partition (SA.map, var);
1601 if (part != NO_PARTITION)
1603 rtx x = SA.partition_to_pseudo[part];
1604 gcc_assert (x);
1605 gcc_assert (REG_P (x));
1606 return;
1608 gcc_unreachable ();
1611 tree decl = var;
1612 tree type = TREE_TYPE (decl);
1613 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1614 rtx x = gen_reg_rtx (reg_mode);
1616 set_rtl (var, x);
1618 /* Note if the object is a user variable. */
1619 if (!DECL_ARTIFICIAL (decl))
1620 mark_user_reg (x);
1622 if (POINTER_TYPE_P (type))
1623 mark_reg_pointer (x, get_pointer_alignment (var));
1626 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1627 has some associated error, e.g. its type is error-mark. We just need
1628 to pick something that won't crash the rest of the compiler. */
1630 static void
1631 expand_one_error_var (tree var)
1633 machine_mode mode = DECL_MODE (var);
1634 rtx x;
1636 if (mode == BLKmode)
1637 x = gen_rtx_MEM (BLKmode, const0_rtx);
1638 else if (mode == VOIDmode)
1639 x = const0_rtx;
1640 else
1641 x = gen_reg_rtx (mode);
1643 SET_DECL_RTL (var, x);
1646 /* A subroutine of expand_one_var. VAR is a variable that will be
1647 allocated to the local stack frame. Return true if we wish to
1648 add VAR to STACK_VARS so that it will be coalesced with other
1649 variables. Return false to allocate VAR immediately.
1651 This function is used to reduce the number of variables considered
1652 for coalescing, which reduces the size of the quadratic problem. */
1654 static bool
1655 defer_stack_allocation (tree var, bool toplevel)
1657 tree size_unit = TREE_CODE (var) == SSA_NAME
1658 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1659 : DECL_SIZE_UNIT (var);
1660 poly_uint64 size;
1662 /* Whether the variable is small enough for immediate allocation not to be
1663 a problem with regard to the frame size. */
1664 bool smallish
1665 = (poly_int_tree_p (size_unit, &size)
1666 && (estimated_poly_value (size)
1667 < param_min_size_for_stack_sharing));
1669 /* If stack protection is enabled, *all* stack variables must be deferred,
1670 so that we can re-order the strings to the top of the frame.
1671 Similarly for Address Sanitizer. */
1672 if (flag_stack_protect || asan_sanitize_stack_p ())
1673 return true;
1675 unsigned int align = TREE_CODE (var) == SSA_NAME
1676 ? TYPE_ALIGN (TREE_TYPE (var))
1677 : DECL_ALIGN (var);
1679 /* We handle "large" alignment via dynamic allocation. We want to handle
1680 this extra complication in only one place, so defer them. */
1681 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1682 return true;
1684 bool ignored = TREE_CODE (var) == SSA_NAME
1685 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1686 : DECL_IGNORED_P (var);
1688 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1689 might be detached from their block and appear at toplevel when we reach
1690 here. We want to coalesce them with variables from other blocks when
1691 the immediate contribution to the frame size would be noticeable. */
1692 if (toplevel && optimize > 0 && ignored && !smallish)
1693 return true;
1695 /* Variables declared in the outermost scope automatically conflict
1696 with every other variable. The only reason to want to defer them
1697 at all is that, after sorting, we can more efficiently pack
1698 small variables in the stack frame. Continue to defer at -O2. */
1699 if (toplevel && optimize < 2)
1700 return false;
1702 /* Without optimization, *most* variables are allocated from the
1703 stack, which makes the quadratic problem large exactly when we
1704 want compilation to proceed as quickly as possible. On the
1705 other hand, we don't want the function's stack frame size to
1706 get completely out of hand. So we avoid adding scalars and
1707 "small" aggregates to the list at all. */
1708 if (optimize == 0 && smallish)
1709 return false;
1711 return true;
1714 /* A subroutine of expand_used_vars. Expand one variable according to
1715 its flavor. Variables to be placed on the stack are not actually
1716 expanded yet, merely recorded.
1717 When REALLY_EXPAND is false, only add stack values to be allocated.
1718 Return stack usage this variable is supposed to take.
1721 static poly_uint64
1722 expand_one_var (tree var, bool toplevel, bool really_expand,
1723 bitmap forced_stack_var = NULL)
1725 unsigned int align = BITS_PER_UNIT;
1726 tree origvar = var;
1728 var = SSAVAR (var);
1730 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1732 if (is_global_var (var))
1733 return 0;
1735 /* Because we don't know if VAR will be in register or on stack,
1736 we conservatively assume it will be on stack even if VAR is
1737 eventually put into register after RA pass. For non-automatic
1738 variables, which won't be on stack, we collect alignment of
1739 type and ignore user specified alignment. Similarly for
1740 SSA_NAMEs for which use_register_for_decl returns true. */
1741 if (TREE_STATIC (var)
1742 || DECL_EXTERNAL (var)
1743 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1744 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1745 TYPE_MODE (TREE_TYPE (var)),
1746 TYPE_ALIGN (TREE_TYPE (var)));
1747 else if (DECL_HAS_VALUE_EXPR_P (var)
1748 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1749 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1750 or variables which were assigned a stack slot already by
1751 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1752 changed from the offset chosen to it. */
1753 align = crtl->stack_alignment_estimated;
1754 else
1755 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1757 /* If the variable alignment is very large we'll dynamicaly allocate
1758 it, which means that in-frame portion is just a pointer. */
1759 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1760 align = GET_MODE_ALIGNMENT (Pmode);
1763 record_alignment_for_reg_var (align);
1765 poly_uint64 size;
1766 if (TREE_CODE (origvar) == SSA_NAME)
1768 gcc_assert (!VAR_P (var)
1769 || (!DECL_EXTERNAL (var)
1770 && !DECL_HAS_VALUE_EXPR_P (var)
1771 && !TREE_STATIC (var)
1772 && TREE_TYPE (var) != error_mark_node
1773 && !DECL_HARD_REGISTER (var)
1774 && really_expand));
1776 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1778 else if (DECL_EXTERNAL (var))
1780 else if (DECL_HAS_VALUE_EXPR_P (var))
1782 else if (TREE_STATIC (var))
1784 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1786 else if (TREE_TYPE (var) == error_mark_node)
1788 if (really_expand)
1789 expand_one_error_var (var);
1791 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1793 if (really_expand)
1795 expand_one_hard_reg_var (var);
1796 if (!DECL_HARD_REGISTER (var))
1797 /* Invalid register specification. */
1798 expand_one_error_var (var);
1801 else if (use_register_for_decl (var)
1802 && (!forced_stack_var
1803 || !bitmap_bit_p (forced_stack_var, DECL_UID (var))))
1805 if (really_expand)
1806 expand_one_register_var (origvar);
1808 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1809 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1811 /* Reject variables which cover more than half of the address-space. */
1812 if (really_expand)
1814 if (DECL_NONLOCAL_FRAME (var))
1815 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1816 "total size of local objects is too large");
1817 else
1818 error_at (DECL_SOURCE_LOCATION (var),
1819 "size of variable %q+D is too large", var);
1820 expand_one_error_var (var);
1823 else if (defer_stack_allocation (var, toplevel))
1824 add_stack_var (origvar, really_expand);
1825 else
1827 if (really_expand)
1829 if (lookup_attribute ("naked",
1830 DECL_ATTRIBUTES (current_function_decl)))
1831 error ("cannot allocate stack for variable %q+D, naked function",
1832 var);
1834 expand_one_stack_var (origvar);
1836 return size;
1838 return 0;
1841 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1842 expanding variables. Those variables that can be put into registers
1843 are allocated pseudos; those that can't are put on the stack.
1845 TOPLEVEL is true if this is the outermost BLOCK. */
1847 static void
1848 expand_used_vars_for_block (tree block, bool toplevel, bitmap forced_stack_vars)
1850 tree t;
1852 /* Expand all variables at this level. */
1853 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1854 if (TREE_USED (t)
1855 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1856 || !DECL_NONSHAREABLE (t)))
1857 expand_one_var (t, toplevel, true, forced_stack_vars);
1859 /* Expand all variables at containing levels. */
1860 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1861 expand_used_vars_for_block (t, false, forced_stack_vars);
1864 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1865 and clear TREE_USED on all local variables. */
1867 static void
1868 clear_tree_used (tree block)
1870 tree t;
1872 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1873 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1874 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1875 || !DECL_NONSHAREABLE (t))
1876 TREE_USED (t) = 0;
1878 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1879 clear_tree_used (t);
1882 /* Examine TYPE and determine a bit mask of the following features. */
1884 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1885 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1886 #define SPCT_HAS_ARRAY 4
1887 #define SPCT_HAS_AGGREGATE 8
1889 static unsigned int
1890 stack_protect_classify_type (tree type)
1892 unsigned int ret = 0;
1893 tree t;
1895 switch (TREE_CODE (type))
1897 case ARRAY_TYPE:
1898 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1899 if (t == char_type_node
1900 || t == signed_char_type_node
1901 || t == unsigned_char_type_node)
1903 unsigned HOST_WIDE_INT max = param_ssp_buffer_size;
1904 unsigned HOST_WIDE_INT len;
1906 if (!TYPE_SIZE_UNIT (type)
1907 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1908 len = max;
1909 else
1910 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1912 if (len < max)
1913 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1914 else
1915 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1917 else
1918 ret = SPCT_HAS_ARRAY;
1919 break;
1921 case UNION_TYPE:
1922 case QUAL_UNION_TYPE:
1923 case RECORD_TYPE:
1924 ret = SPCT_HAS_AGGREGATE;
1925 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1926 if (TREE_CODE (t) == FIELD_DECL)
1927 ret |= stack_protect_classify_type (TREE_TYPE (t));
1928 break;
1930 default:
1931 break;
1934 return ret;
1937 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1938 part of the local stack frame. Remember if we ever return nonzero for
1939 any variable in this function. The return value is the phase number in
1940 which the variable should be allocated. */
1942 static int
1943 stack_protect_decl_phase (tree decl)
1945 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1946 int ret = 0;
1948 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1949 has_short_buffer = true;
1951 tree attribs = DECL_ATTRIBUTES (current_function_decl);
1952 if (!lookup_attribute ("no_stack_protector", attribs)
1953 && (flag_stack_protect == SPCT_FLAG_ALL
1954 || flag_stack_protect == SPCT_FLAG_STRONG
1955 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1956 && lookup_attribute ("stack_protect", attribs))))
1958 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1959 && !(bits & SPCT_HAS_AGGREGATE))
1960 ret = 1;
1961 else if (bits & SPCT_HAS_ARRAY)
1962 ret = 2;
1964 else
1965 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1967 if (ret)
1968 has_protected_decls = true;
1970 return ret;
1973 /* Two helper routines that check for phase 1 and phase 2. These are used
1974 as callbacks for expand_stack_vars. */
1976 static bool
1977 stack_protect_decl_phase_1 (size_t i)
1979 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1982 static bool
1983 stack_protect_decl_phase_2 (size_t i)
1985 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1988 /* And helper function that checks for asan phase (with stack protector
1989 it is phase 3). This is used as callback for expand_stack_vars.
1990 Returns true if any of the vars in the partition need to be protected. */
1992 static bool
1993 asan_decl_phase_3 (size_t i)
1995 while (i != EOC)
1997 if (asan_protect_stack_decl (stack_vars[i].decl))
1998 return true;
1999 i = stack_vars[i].next;
2001 return false;
2004 /* Ensure that variables in different stack protection phases conflict
2005 so that they are not merged and share the same stack slot.
2006 Return true if there are any address taken variables. */
2008 static bool
2009 add_stack_protection_conflicts (void)
2011 size_t i, j, n = stack_vars_num;
2012 unsigned char *phase;
2013 bool ret = false;
2015 phase = XNEWVEC (unsigned char, n);
2016 for (i = 0; i < n; ++i)
2018 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
2019 if (TREE_ADDRESSABLE (stack_vars[i].decl))
2020 ret = true;
2023 for (i = 0; i < n; ++i)
2025 unsigned char ph_i = phase[i];
2026 for (j = i + 1; j < n; ++j)
2027 if (ph_i != phase[j])
2028 add_stack_var_conflict (i, j);
2031 XDELETEVEC (phase);
2032 return ret;
2035 /* Create a decl for the guard at the top of the stack frame. */
2037 static void
2038 create_stack_guard (void)
2040 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
2041 VAR_DECL, NULL, ptr_type_node);
2042 TREE_THIS_VOLATILE (guard) = 1;
2043 TREE_USED (guard) = 1;
2044 expand_one_stack_var (guard);
2045 crtl->stack_protect_guard = guard;
2048 /* Prepare for expanding variables. */
2049 static void
2050 init_vars_expansion (void)
2052 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
2053 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
2055 /* A map from decl to stack partition. */
2056 decl_to_stack_part = new hash_map<tree, size_t>;
2058 /* Initialize local stack smashing state. */
2059 has_protected_decls = false;
2060 has_short_buffer = false;
2061 if (hwasan_sanitize_stack_p ())
2062 hwasan_record_frame_init ();
2065 /* Free up stack variable graph data. */
2066 static void
2067 fini_vars_expansion (void)
2069 bitmap_obstack_release (&stack_var_bitmap_obstack);
2070 if (stack_vars)
2071 XDELETEVEC (stack_vars);
2072 if (stack_vars_sorted)
2073 XDELETEVEC (stack_vars_sorted);
2074 stack_vars = NULL;
2075 stack_vars_sorted = NULL;
2076 stack_vars_alloc = stack_vars_num = 0;
2077 delete decl_to_stack_part;
2078 decl_to_stack_part = NULL;
2081 /* Make a fair guess for the size of the stack frame of the function
2082 in NODE. This doesn't have to be exact, the result is only used in
2083 the inline heuristics. So we don't want to run the full stack var
2084 packing algorithm (which is quadratic in the number of stack vars).
2085 Instead, we calculate the total size of all stack vars. This turns
2086 out to be a pretty fair estimate -- packing of stack vars doesn't
2087 happen very often. */
2089 HOST_WIDE_INT
2090 estimated_stack_frame_size (struct cgraph_node *node)
2092 poly_int64 size = 0;
2093 size_t i;
2094 tree var;
2095 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2097 push_cfun (fn);
2099 init_vars_expansion ();
2101 FOR_EACH_LOCAL_DECL (fn, i, var)
2102 if (auto_var_in_fn_p (var, fn->decl))
2103 size += expand_one_var (var, true, false);
2105 if (stack_vars_num > 0)
2107 /* Fake sorting the stack vars for account_stack_vars (). */
2108 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
2109 for (i = 0; i < stack_vars_num; ++i)
2110 stack_vars_sorted[i] = i;
2111 size += account_stack_vars ();
2114 fini_vars_expansion ();
2115 pop_cfun ();
2116 return estimated_poly_value (size);
2119 /* Check if the current function has calls that use a return slot. */
2121 static bool
2122 stack_protect_return_slot_p ()
2124 basic_block bb;
2126 FOR_ALL_BB_FN (bb, cfun)
2127 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2128 !gsi_end_p (gsi); gsi_next (&gsi))
2130 gimple *stmt = gsi_stmt (gsi);
2131 /* This assumes that calls to internal-only functions never
2132 use a return slot. */
2133 if (is_gimple_call (stmt)
2134 && !gimple_call_internal_p (stmt)
2135 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2136 gimple_call_fndecl (stmt)))
2137 return true;
2139 return false;
2142 /* Expand all variables used in the function. */
2144 static rtx_insn *
2145 expand_used_vars (bitmap forced_stack_vars)
2147 tree var, outer_block = DECL_INITIAL (current_function_decl);
2148 auto_vec<tree> maybe_local_decls;
2149 rtx_insn *var_end_seq = NULL;
2150 unsigned i;
2151 unsigned len;
2152 bool gen_stack_protect_signal = false;
2154 /* Compute the phase of the stack frame for this function. */
2156 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2157 int off = targetm.starting_frame_offset () % align;
2158 frame_phase = off ? align - off : 0;
2161 /* Set TREE_USED on all variables in the local_decls. */
2162 FOR_EACH_LOCAL_DECL (cfun, i, var)
2163 TREE_USED (var) = 1;
2164 /* Clear TREE_USED on all variables associated with a block scope. */
2165 clear_tree_used (DECL_INITIAL (current_function_decl));
2167 init_vars_expansion ();
2169 if (targetm.use_pseudo_pic_reg ())
2170 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2172 for (i = 0; i < SA.map->num_partitions; i++)
2174 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2175 continue;
2177 tree var = partition_to_var (SA.map, i);
2179 gcc_assert (!virtual_operand_p (var));
2181 expand_one_ssa_partition (var);
2184 if (flag_stack_protect == SPCT_FLAG_STRONG)
2185 gen_stack_protect_signal = stack_protect_return_slot_p ();
2187 /* At this point all variables on the local_decls with TREE_USED
2188 set are not associated with any block scope. Lay them out. */
2190 len = vec_safe_length (cfun->local_decls);
2191 FOR_EACH_LOCAL_DECL (cfun, i, var)
2193 bool expand_now = false;
2195 /* Expanded above already. */
2196 if (is_gimple_reg (var))
2198 TREE_USED (var) = 0;
2199 goto next;
2201 /* We didn't set a block for static or extern because it's hard
2202 to tell the difference between a global variable (re)declared
2203 in a local scope, and one that's really declared there to
2204 begin with. And it doesn't really matter much, since we're
2205 not giving them stack space. Expand them now. */
2206 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2207 expand_now = true;
2209 /* Expand variables not associated with any block now. Those created by
2210 the optimizers could be live anywhere in the function. Those that
2211 could possibly have been scoped originally and detached from their
2212 block will have their allocation deferred so we coalesce them with
2213 others when optimization is enabled. */
2214 else if (TREE_USED (var))
2215 expand_now = true;
2217 /* Finally, mark all variables on the list as used. We'll use
2218 this in a moment when we expand those associated with scopes. */
2219 TREE_USED (var) = 1;
2221 if (expand_now)
2222 expand_one_var (var, true, true, forced_stack_vars);
2224 next:
2225 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2227 rtx rtl = DECL_RTL_IF_SET (var);
2229 /* Keep artificial non-ignored vars in cfun->local_decls
2230 chain until instantiate_decls. */
2231 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2232 add_local_decl (cfun, var);
2233 else if (rtl == NULL_RTX)
2234 /* If rtl isn't set yet, which can happen e.g. with
2235 -fstack-protector, retry before returning from this
2236 function. */
2237 maybe_local_decls.safe_push (var);
2241 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2243 +-----------------+-----------------+
2244 | ...processed... | ...duplicates...|
2245 +-----------------+-----------------+
2247 +-- LEN points here.
2249 We just want the duplicates, as those are the artificial
2250 non-ignored vars that we want to keep until instantiate_decls.
2251 Move them down and truncate the array. */
2252 if (!vec_safe_is_empty (cfun->local_decls))
2253 cfun->local_decls->block_remove (0, len);
2255 /* At this point, all variables within the block tree with TREE_USED
2256 set are actually used by the optimized function. Lay them out. */
2257 expand_used_vars_for_block (outer_block, true, forced_stack_vars);
2259 tree attribs = DECL_ATTRIBUTES (current_function_decl);
2260 if (stack_vars_num > 0)
2262 bool has_addressable_vars = false;
2264 add_scope_conflicts ();
2266 /* If stack protection is enabled, we don't share space between
2267 vulnerable data and non-vulnerable data. */
2268 if (flag_stack_protect != 0
2269 && !lookup_attribute ("no_stack_protector", attribs)
2270 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2271 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2272 && lookup_attribute ("stack_protect", attribs))))
2273 has_addressable_vars = add_stack_protection_conflicts ();
2275 if (flag_stack_protect == SPCT_FLAG_STRONG && has_addressable_vars)
2276 gen_stack_protect_signal = true;
2278 /* Now that we have collected all stack variables, and have computed a
2279 minimal interference graph, attempt to save some stack space. */
2280 partition_stack_vars ();
2281 if (dump_file)
2282 dump_stack_var_partition ();
2286 if (!lookup_attribute ("no_stack_protector", attribs))
2287 switch (flag_stack_protect)
2289 case SPCT_FLAG_ALL:
2290 create_stack_guard ();
2291 break;
2293 case SPCT_FLAG_STRONG:
2294 if (gen_stack_protect_signal
2295 || cfun->calls_alloca
2296 || has_protected_decls
2297 || lookup_attribute ("stack_protect",
2298 DECL_ATTRIBUTES (current_function_decl)))
2299 create_stack_guard ();
2300 break;
2302 case SPCT_FLAG_DEFAULT:
2303 if (cfun->calls_alloca
2304 || has_protected_decls
2305 || lookup_attribute ("stack_protect",
2306 DECL_ATTRIBUTES (current_function_decl)))
2307 create_stack_guard ();
2308 break;
2310 case SPCT_FLAG_EXPLICIT:
2311 if (lookup_attribute ("stack_protect",
2312 DECL_ATTRIBUTES (current_function_decl)))
2313 create_stack_guard ();
2314 break;
2316 default:
2317 break;
2320 /* Assign rtl to each variable based on these partitions. */
2321 if (stack_vars_num > 0)
2323 class stack_vars_data data;
2325 data.asan_base = NULL_RTX;
2326 data.asan_alignb = 0;
2328 /* Reorder decls to be protected by iterating over the variables
2329 array multiple times, and allocating out of each phase in turn. */
2330 /* ??? We could probably integrate this into the qsort we did
2331 earlier, such that we naturally see these variables first,
2332 and thus naturally allocate things in the right order. */
2333 if (has_protected_decls)
2335 /* Phase 1 contains only character arrays. */
2336 expand_stack_vars (stack_protect_decl_phase_1, &data);
2338 /* Phase 2 contains other kinds of arrays. */
2339 if (!lookup_attribute ("no_stack_protector", attribs)
2340 && (flag_stack_protect == SPCT_FLAG_ALL
2341 || flag_stack_protect == SPCT_FLAG_STRONG
2342 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2343 && lookup_attribute ("stack_protect", attribs))))
2344 expand_stack_vars (stack_protect_decl_phase_2, &data);
2347 if (asan_sanitize_stack_p ())
2348 /* Phase 3, any partitions that need asan protection
2349 in addition to phase 1 and 2. */
2350 expand_stack_vars (asan_decl_phase_3, &data);
2352 /* ASAN description strings don't yet have a syntax for expressing
2353 polynomial offsets. */
2354 HOST_WIDE_INT prev_offset;
2355 if (!data.asan_vec.is_empty ()
2356 && frame_offset.is_constant (&prev_offset))
2358 HOST_WIDE_INT offset, sz, redzonesz;
2359 redzonesz = ASAN_RED_ZONE_SIZE;
2360 sz = data.asan_vec[0] - prev_offset;
2361 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2362 && data.asan_alignb <= 4096
2363 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2364 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2365 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2366 /* Allocating a constant amount of space from a constant
2367 starting offset must give a constant result. */
2368 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2369 .to_constant ());
2370 data.asan_vec.safe_push (prev_offset);
2371 data.asan_vec.safe_push (offset);
2372 /* Leave space for alignment if STRICT_ALIGNMENT. */
2373 if (STRICT_ALIGNMENT)
2374 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2375 << ASAN_SHADOW_SHIFT)
2376 / BITS_PER_UNIT, 1);
2378 var_end_seq
2379 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2380 data.asan_base,
2381 data.asan_alignb,
2382 data.asan_vec.address (),
2383 data.asan_decl_vec.address (),
2384 data.asan_vec.length ());
2387 expand_stack_vars (NULL, &data);
2390 if (hwasan_sanitize_stack_p ())
2391 hwasan_emit_prologue ();
2392 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2393 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2394 virtual_stack_vars_rtx,
2395 var_end_seq);
2396 else if (hwasan_sanitize_allocas_p () && cfun->calls_alloca)
2397 /* When using out-of-line instrumentation we only want to emit one function
2398 call for clearing the tags in a region of shadow stack. When there are
2399 alloca calls in this frame we want to emit a call using the
2400 virtual_stack_dynamic_rtx, but when not we use the hwasan_frame_extent
2401 rtx we created in expand_stack_vars. */
2402 var_end_seq = hwasan_emit_untag_frame (virtual_stack_dynamic_rtx,
2403 virtual_stack_vars_rtx);
2404 else if (hwasan_sanitize_stack_p ())
2405 /* If no variables were stored on the stack, `hwasan_get_frame_extent`
2406 will return NULL_RTX and hence `hwasan_emit_untag_frame` will return
2407 NULL (i.e. an empty sequence). */
2408 var_end_seq = hwasan_emit_untag_frame (hwasan_get_frame_extent (),
2409 virtual_stack_vars_rtx);
2411 fini_vars_expansion ();
2413 /* If there were any artificial non-ignored vars without rtl
2414 found earlier, see if deferred stack allocation hasn't assigned
2415 rtl to them. */
2416 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2418 rtx rtl = DECL_RTL_IF_SET (var);
2420 /* Keep artificial non-ignored vars in cfun->local_decls
2421 chain until instantiate_decls. */
2422 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2423 add_local_decl (cfun, var);
2426 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2427 if (STACK_ALIGNMENT_NEEDED)
2429 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2430 if (FRAME_GROWS_DOWNWARD)
2431 frame_offset = aligned_lower_bound (frame_offset, align);
2432 else
2433 frame_offset = aligned_upper_bound (frame_offset, align);
2436 return var_end_seq;
2440 /* If we need to produce a detailed dump, print the tree representation
2441 for STMT to the dump file. SINCE is the last RTX after which the RTL
2442 generated for STMT should have been appended. */
2444 static void
2445 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2447 if (dump_file && (dump_flags & TDF_DETAILS))
2449 fprintf (dump_file, "\n;; ");
2450 print_gimple_stmt (dump_file, stmt, 0,
2451 TDF_SLIM | (dump_flags & TDF_LINENO));
2452 fprintf (dump_file, "\n");
2454 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2458 /* Maps the blocks that do not contain tree labels to rtx labels. */
2460 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2462 /* Returns the label_rtx expression for a label starting basic block BB. */
2464 static rtx_code_label *
2465 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2467 gimple_stmt_iterator gsi;
2468 tree lab;
2470 if (bb->flags & BB_RTL)
2471 return block_label (bb);
2473 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2474 if (elt)
2475 return *elt;
2477 /* Find the tree label if it is present. */
2479 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2481 glabel *lab_stmt;
2483 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2484 if (!lab_stmt)
2485 break;
2487 lab = gimple_label_label (lab_stmt);
2488 if (DECL_NONLOCAL (lab))
2489 break;
2491 return jump_target_rtx (lab);
2494 rtx_code_label *l = gen_label_rtx ();
2495 lab_rtx_for_bb->put (bb, l);
2496 return l;
2500 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2501 of a basic block where we just expanded the conditional at the end,
2502 possibly clean up the CFG and instruction sequence. LAST is the
2503 last instruction before the just emitted jump sequence. */
2505 static void
2506 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2508 /* Special case: when jumpif decides that the condition is
2509 trivial it emits an unconditional jump (and the necessary
2510 barrier). But we still have two edges, the fallthru one is
2511 wrong. purge_dead_edges would clean this up later. Unfortunately
2512 we have to insert insns (and split edges) before
2513 find_many_sub_basic_blocks and hence before purge_dead_edges.
2514 But splitting edges might create new blocks which depend on the
2515 fact that if there are two edges there's no barrier. So the
2516 barrier would get lost and verify_flow_info would ICE. Instead
2517 of auditing all edge splitters to care for the barrier (which
2518 normally isn't there in a cleaned CFG), fix it here. */
2519 if (BARRIER_P (get_last_insn ()))
2521 rtx_insn *insn;
2522 remove_edge (e);
2523 /* Now, we have a single successor block, if we have insns to
2524 insert on the remaining edge we potentially will insert
2525 it at the end of this block (if the dest block isn't feasible)
2526 in order to avoid splitting the edge. This insertion will take
2527 place in front of the last jump. But we might have emitted
2528 multiple jumps (conditional and one unconditional) to the
2529 same destination. Inserting in front of the last one then
2530 is a problem. See PR 40021. We fix this by deleting all
2531 jumps except the last unconditional one. */
2532 insn = PREV_INSN (get_last_insn ());
2533 /* Make sure we have an unconditional jump. Otherwise we're
2534 confused. */
2535 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2536 for (insn = PREV_INSN (insn); insn != last;)
2538 insn = PREV_INSN (insn);
2539 if (JUMP_P (NEXT_INSN (insn)))
2541 if (!any_condjump_p (NEXT_INSN (insn)))
2543 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2544 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2546 delete_insn (NEXT_INSN (insn));
2552 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2553 Returns a new basic block if we've terminated the current basic
2554 block and created a new one. */
2556 static basic_block
2557 expand_gimple_cond (basic_block bb, gcond *stmt)
2559 basic_block new_bb, dest;
2560 edge true_edge;
2561 edge false_edge;
2562 rtx_insn *last2, *last;
2563 enum tree_code code;
2564 tree op0, op1;
2566 code = gimple_cond_code (stmt);
2567 op0 = gimple_cond_lhs (stmt);
2568 op1 = gimple_cond_rhs (stmt);
2569 /* We're sometimes presented with such code:
2570 D.123_1 = x < y;
2571 if (D.123_1 != 0)
2573 This would expand to two comparisons which then later might
2574 be cleaned up by combine. But some pattern matchers like if-conversion
2575 work better when there's only one compare, so make up for this
2576 here as special exception if TER would have made the same change. */
2577 if (SA.values
2578 && TREE_CODE (op0) == SSA_NAME
2579 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2580 && TREE_CODE (op1) == INTEGER_CST
2581 && ((gimple_cond_code (stmt) == NE_EXPR
2582 && integer_zerop (op1))
2583 || (gimple_cond_code (stmt) == EQ_EXPR
2584 && integer_onep (op1)))
2585 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2587 gimple *second = SSA_NAME_DEF_STMT (op0);
2588 if (gimple_code (second) == GIMPLE_ASSIGN)
2590 enum tree_code code2 = gimple_assign_rhs_code (second);
2591 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2593 code = code2;
2594 op0 = gimple_assign_rhs1 (second);
2595 op1 = gimple_assign_rhs2 (second);
2597 /* If jumps are cheap and the target does not support conditional
2598 compare, turn some more codes into jumpy sequences. */
2599 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2600 && targetm.gen_ccmp_first == NULL)
2602 if ((code2 == BIT_AND_EXPR
2603 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2604 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2605 || code2 == TRUTH_AND_EXPR)
2607 code = TRUTH_ANDIF_EXPR;
2608 op0 = gimple_assign_rhs1 (second);
2609 op1 = gimple_assign_rhs2 (second);
2611 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2613 code = TRUTH_ORIF_EXPR;
2614 op0 = gimple_assign_rhs1 (second);
2615 op1 = gimple_assign_rhs2 (second);
2621 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2622 into (x - C2) * C3 < C4. */
2623 if ((code == EQ_EXPR || code == NE_EXPR)
2624 && TREE_CODE (op0) == SSA_NAME
2625 && TREE_CODE (op1) == INTEGER_CST)
2626 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2628 /* Optimize (x - y) < 0 into x < y if x - y has undefined overflow. */
2629 if (!TYPE_UNSIGNED (TREE_TYPE (op0))
2630 && (code == LT_EXPR || code == LE_EXPR
2631 || code == GT_EXPR || code == GE_EXPR)
2632 && integer_zerop (op1)
2633 && TREE_CODE (op0) == SSA_NAME)
2634 maybe_optimize_sub_cmp_0 (code, &op0, &op1);
2636 last2 = last = get_last_insn ();
2638 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2639 set_curr_insn_location (gimple_location (stmt));
2641 /* These flags have no purpose in RTL land. */
2642 true_edge->flags &= ~EDGE_TRUE_VALUE;
2643 false_edge->flags &= ~EDGE_FALSE_VALUE;
2645 /* We can either have a pure conditional jump with one fallthru edge or
2646 two-way jump that needs to be decomposed into two basic blocks. */
2647 if (false_edge->dest == bb->next_bb)
2649 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2650 true_edge->probability);
2651 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2652 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2653 set_curr_insn_location (true_edge->goto_locus);
2654 false_edge->flags |= EDGE_FALLTHRU;
2655 maybe_cleanup_end_of_block (false_edge, last);
2656 return NULL;
2658 if (true_edge->dest == bb->next_bb)
2660 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2661 false_edge->probability);
2662 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2663 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2664 set_curr_insn_location (false_edge->goto_locus);
2665 true_edge->flags |= EDGE_FALLTHRU;
2666 maybe_cleanup_end_of_block (true_edge, last);
2667 return NULL;
2670 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2671 true_edge->probability);
2672 last = get_last_insn ();
2673 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2674 set_curr_insn_location (false_edge->goto_locus);
2675 emit_jump (label_rtx_for_bb (false_edge->dest));
2677 BB_END (bb) = last;
2678 if (BARRIER_P (BB_END (bb)))
2679 BB_END (bb) = PREV_INSN (BB_END (bb));
2680 update_bb_for_insn (bb);
2682 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2683 dest = false_edge->dest;
2684 redirect_edge_succ (false_edge, new_bb);
2685 false_edge->flags |= EDGE_FALLTHRU;
2686 new_bb->count = false_edge->count ();
2687 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2688 add_bb_to_loop (new_bb, loop);
2689 if (loop->latch == bb
2690 && loop->header == dest)
2691 loop->latch = new_bb;
2692 make_single_succ_edge (new_bb, dest, 0);
2693 if (BARRIER_P (BB_END (new_bb)))
2694 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2695 update_bb_for_insn (new_bb);
2697 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2699 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2701 set_curr_insn_location (true_edge->goto_locus);
2702 true_edge->goto_locus = curr_insn_location ();
2705 return new_bb;
2708 /* Mark all calls that can have a transaction restart. */
2710 static void
2711 mark_transaction_restart_calls (gimple *stmt)
2713 struct tm_restart_node dummy;
2714 tm_restart_node **slot;
2716 if (!cfun->gimple_df->tm_restart)
2717 return;
2719 dummy.stmt = stmt;
2720 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2721 if (slot)
2723 struct tm_restart_node *n = *slot;
2724 tree list = n->label_or_list;
2725 rtx_insn *insn;
2727 for (insn = next_real_insn (get_last_insn ());
2728 !CALL_P (insn);
2729 insn = next_real_insn (insn))
2730 continue;
2732 if (TREE_CODE (list) == LABEL_DECL)
2733 add_reg_note (insn, REG_TM, label_rtx (list));
2734 else
2735 for (; list ; list = TREE_CHAIN (list))
2736 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2740 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2741 statement STMT. */
2743 static void
2744 expand_call_stmt (gcall *stmt)
2746 tree exp, decl, lhs;
2747 bool builtin_p;
2748 size_t i;
2750 if (gimple_call_internal_p (stmt))
2752 expand_internal_call (stmt);
2753 return;
2756 /* If this is a call to a built-in function and it has no effect other
2757 than setting the lhs, try to implement it using an internal function
2758 instead. */
2759 decl = gimple_call_fndecl (stmt);
2760 if (gimple_call_lhs (stmt)
2761 && !gimple_has_side_effects (stmt)
2762 && (optimize || (decl && called_as_built_in (decl))))
2764 internal_fn ifn = replacement_internal_fn (stmt);
2765 if (ifn != IFN_LAST)
2767 expand_internal_call (ifn, stmt);
2768 return;
2772 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2774 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2775 builtin_p = decl && fndecl_built_in_p (decl);
2777 /* If this is not a builtin function, the function type through which the
2778 call is made may be different from the type of the function. */
2779 if (!builtin_p)
2780 CALL_EXPR_FN (exp)
2781 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2782 CALL_EXPR_FN (exp));
2784 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2785 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2787 for (i = 0; i < gimple_call_num_args (stmt); i++)
2789 tree arg = gimple_call_arg (stmt, i);
2790 gimple *def;
2791 /* TER addresses into arguments of builtin functions so we have a
2792 chance to infer more correct alignment information. See PR39954. */
2793 if (builtin_p
2794 && TREE_CODE (arg) == SSA_NAME
2795 && (def = get_gimple_for_ssa_name (arg))
2796 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2797 arg = gimple_assign_rhs1 (def);
2798 CALL_EXPR_ARG (exp, i) = arg;
2801 if (gimple_has_side_effects (stmt)
2802 /* ??? Downstream in expand_expr_real_1 we assume that expressions
2803 w/o side-effects do not throw so work around this here. */
2804 || stmt_could_throw_p (cfun, stmt))
2805 TREE_SIDE_EFFECTS (exp) = 1;
2807 if (gimple_call_nothrow_p (stmt))
2808 TREE_NOTHROW (exp) = 1;
2810 if (gimple_no_warning_p (stmt))
2811 TREE_NO_WARNING (exp) = 1;
2813 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2814 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2815 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2816 if (decl
2817 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2818 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2819 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2820 else
2821 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2822 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2823 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2824 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2826 /* Ensure RTL is created for debug args. */
2827 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2829 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2830 unsigned int ix;
2831 tree dtemp;
2833 if (debug_args)
2834 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2836 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2837 expand_debug_expr (dtemp);
2841 rtx_insn *before_call = get_last_insn ();
2842 lhs = gimple_call_lhs (stmt);
2843 if (lhs)
2844 expand_assignment (lhs, exp, false);
2845 else
2846 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2848 /* If the gimple call is an indirect call and has 'nocf_check'
2849 attribute find a generated CALL insn to mark it as no
2850 control-flow verification is needed. */
2851 if (gimple_call_nocf_check_p (stmt)
2852 && !gimple_call_fndecl (stmt))
2854 rtx_insn *last = get_last_insn ();
2855 while (!CALL_P (last)
2856 && last != before_call)
2857 last = PREV_INSN (last);
2859 if (last != before_call)
2860 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2863 mark_transaction_restart_calls (stmt);
2867 /* Generate RTL for an asm statement (explicit assembler code).
2868 STRING is a STRING_CST node containing the assembler code text,
2869 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2870 insn is volatile; don't optimize it. */
2872 static void
2873 expand_asm_loc (tree string, int vol, location_t locus)
2875 rtx body;
2877 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2878 ggc_strdup (TREE_STRING_POINTER (string)),
2879 locus);
2881 MEM_VOLATILE_P (body) = vol;
2883 /* Non-empty basic ASM implicitly clobbers memory. */
2884 if (TREE_STRING_LENGTH (string) != 0)
2886 rtx asm_op, clob;
2887 unsigned i, nclobbers;
2888 auto_vec<rtx> input_rvec, output_rvec;
2889 auto_vec<machine_mode> input_mode;
2890 auto_vec<const char *> constraints;
2891 auto_vec<rtx> clobber_rvec;
2892 HARD_REG_SET clobbered_regs;
2893 CLEAR_HARD_REG_SET (clobbered_regs);
2895 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2896 clobber_rvec.safe_push (clob);
2898 if (targetm.md_asm_adjust)
2899 targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
2900 constraints, clobber_rvec, clobbered_regs);
2902 asm_op = body;
2903 nclobbers = clobber_rvec.length ();
2904 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2906 XVECEXP (body, 0, 0) = asm_op;
2907 for (i = 0; i < nclobbers; i++)
2908 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2911 emit_insn (body);
/* Count how many characters of the NUL-terminated string S compare
   equal to C.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;

  for (const char *p = s; *p != '\0'; p++)
    if (*p == c)
      count++;

  return count;
}
2924 /* A subroutine of expand_asm_operands. Check that all operands have
2925 the same number of alternatives. Return true if so. */
2927 static bool
2928 check_operand_nalternatives (const vec<const char *> &constraints)
2930 unsigned len = constraints.length();
2931 if (len > 0)
2933 int nalternatives = n_occurrences (',', constraints[0]);
2935 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2937 error ("too many alternatives in %<asm%>");
2938 return false;
2941 for (unsigned i = 1; i < len; ++i)
2942 if (n_occurrences (',', constraints[i]) != nalternatives)
2944 error ("operand constraints for %<asm%> differ "
2945 "in number of alternatives");
2946 return false;
2949 return true;
2952 /* Check for overlap between registers marked in CLOBBERED_REGS and
2953 anything inappropriate in T. Emit error and return the register
2954 variable definition for error, NULL_TREE for ok. */
2956 static bool
2957 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2959 /* Conflicts between asm-declared register variables and the clobber
2960 list are not allowed. */
2961 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2963 if (overlap)
2965 error ("%<asm%> specifier for variable %qE conflicts with "
2966 "%<asm%> clobber list",
2967 DECL_NAME (overlap));
2969 /* Reset registerness to stop multiple errors emitted for a single
2970 variable. */
2971 DECL_REGISTER (overlap) = 0;
2972 return true;
2975 return false;
2978 /* Check that the given REGNO spanning NREGS is a valid
2979 asm clobber operand. Some HW registers cannot be
2980 saved/restored, hence they should not be clobbered by
2981 asm statements. */
2982 static bool
2983 asm_clobber_reg_is_valid (int regno, int nregs, const char *regname)
2985 bool is_valid = true;
2986 HARD_REG_SET regset;
2988 CLEAR_HARD_REG_SET (regset);
2990 add_range_to_hard_reg_set (&regset, regno, nregs);
2992 /* Clobbering the PIC register is an error. */
2993 if (PIC_OFFSET_TABLE_REGNUM != INVALID_REGNUM
2994 && overlaps_hard_reg_set_p (regset, Pmode, PIC_OFFSET_TABLE_REGNUM))
2996 /* ??? Diagnose during gimplification? */
2997 error ("PIC register clobbered by %qs in %<asm%>", regname);
2998 is_valid = false;
3000 else if (!in_hard_reg_set_p
3001 (accessible_reg_set, reg_raw_mode[regno], regno))
3003 /* ??? Diagnose during gimplification? */
3004 error ("the register %qs cannot be clobbered in %<asm%>"
3005 " for the current target", regname);
3006 is_valid = false;
3009 /* Clobbering the stack pointer register is deprecated. GCC expects
3010 the value of the stack pointer after an asm statement to be the same
3011 as it was before, so no asm can validly clobber the stack pointer in
3012 the usual sense. Adding the stack pointer to the clobber list has
3013 traditionally had some undocumented and somewhat obscure side-effects. */
3014 if (overlaps_hard_reg_set_p (regset, Pmode, STACK_POINTER_REGNUM))
3016 crtl->sp_is_clobbered_by_asm = true;
3017 if (warning (OPT_Wdeprecated, "listing the stack pointer register"
3018 " %qs in a clobber list is deprecated", regname))
3019 inform (input_location, "the value of the stack pointer after"
3020 " an %<asm%> statement must be the same as it was before"
3021 " the statement");
3024 return is_valid;
3027 /* Generate RTL for an asm statement with arguments.
3028 STRING is the instruction template.
3029 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
3030 Each output or input has an expression in the TREE_VALUE and
3031 a tree list in TREE_PURPOSE which in turn contains a constraint
3032 name in TREE_VALUE (or NULL_TREE) and a constraint string
3033 in TREE_PURPOSE.
3034 CLOBBERS is a list of STRING_CST nodes each naming a hard register
3035 that is clobbered by this insn.
3037 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
3038 should be the fallthru basic block of the asm goto.
3040 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
3041 Some elements of OUTPUTS may be replaced with trees representing temporary
3042 values. The caller should copy those temporary values to the originally
3043 specified lvalues.
3045 VOL nonzero means the insn is volatile; don't optimize it. */
3047 static void
3048 expand_asm_stmt (gasm *stmt)
/* Local helper: the constructor remembers the current input_location and
sets it to WHERE; the destructor puts the remembered value back. */
3050 class save_input_location
3052 location_t old;
3054 public:
3055 explicit save_input_location(location_t where)
3057 old = input_location;
3058 input_location = where;
3061 ~save_input_location()
3063 input_location = old;
3067 location_t locus = gimple_location (stmt);
/* A basic asm (no operands) is handed straight to expand_asm_loc. */
3069 if (gimple_asm_input_p (stmt))
3071 const char *s = gimple_asm_string (stmt);
3072 tree string = build_string (strlen (s), s);
3073 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
3074 return;
3077 /* Point input_location at the asm statement for the rest of this
3078 function: there are some legacy diagnostics in here, and it also avoids
an extra parameter to targetm.md_asm_adjust. */
3079 save_input_location s_i_l(locus);
3081 unsigned noutputs = gimple_asm_noutputs (stmt);
3082 unsigned ninputs = gimple_asm_ninputs (stmt);
3083 unsigned nlabels = gimple_asm_nlabels (stmt);
3084 unsigned i;
3086 /* ??? Diagnose during gimplification? */
3087 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
3089 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
3090 return;
3093 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
3094 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
3095 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
3097 /* Copy the gimple vectors into new vectors that we can manipulate.
CONSTRAINTS holds the output constraints first, followed by the input
constraints. */
3099 output_tvec.safe_grow (noutputs, true);
3100 input_tvec.safe_grow (ninputs, true);
3101 constraints.safe_grow (noutputs + ninputs, true);
3103 for (i = 0; i < noutputs; ++i)
3105 tree t = gimple_asm_output_op (stmt, i);
3106 output_tvec[i] = TREE_VALUE (t);
3107 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3109 for (i = 0; i < ninputs; i++)
3111 tree t = gimple_asm_input_op (stmt, i);
3112 input_tvec[i] = TREE_VALUE (t);
3113 constraints[i + noutputs]
3114 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3117 /* ??? Diagnose during gimplification? */
3118 if (! check_operand_nalternatives (constraints))
3119 return;
3121 /* Count the number of meaningful clobbered registers, ignoring what
3122 we would ignore later. */
3123 auto_vec<rtx> clobber_rvec;
3124 HARD_REG_SET clobbered_regs;
3125 CLEAR_HARD_REG_SET (clobbered_regs);
3127 if (unsigned n = gimple_asm_nclobbers (stmt))
3129 clobber_rvec.reserve (n);
3130 for (i = 0; i < n; i++)
3132 tree t = gimple_asm_clobber_op (stmt, i);
3133 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
3134 int nregs, j;
3136 j = decode_reg_name_and_count (regname, &nregs);
3137 if (j < 0)
3139 if (j == -2)
3141 /* ??? Diagnose during gimplification? */
3142 error ("unknown register name %qs in %<asm%>", regname);
3144 else if (j == -4)
/* A result of -4 is turned into a (mem:BLK (scratch)) clobber. */
3146 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
3147 clobber_rvec.safe_push (x);
3149 else
3151 /* Otherwise we should have -1 == empty string
3152 or -3 == cc, which is not a register. */
3153 gcc_assert (j == -1 || j == -3);
3156 else
3157 for (int reg = j; reg < j + nregs; reg++)
3159 if (!asm_clobber_reg_is_valid (reg, nregs, regname))
3160 return;
3162 SET_HARD_REG_BIT (clobbered_regs, reg);
3163 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
3164 clobber_rvec.safe_push (x);
3169 /* First pass over inputs and outputs checks validity and sets
3170 mark_addressable if needed. */
3171 /* ??? Diagnose during gimplification? */
3173 for (i = 0; i < noutputs; ++i)
3175 tree val = output_tvec[i];
3176 tree type = TREE_TYPE (val);
3177 const char *constraint;
3178 bool is_inout;
3179 bool allows_reg;
3180 bool allows_mem;
3182 /* Try to parse the output constraint. If that fails, there's
3183 no point in going further. */
3184 constraint = constraints[i];
3185 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3186 &allows_mem, &allows_reg, &is_inout))
3187 return;
3189 /* If the output is a hard register, verify it doesn't conflict with
3190 any other operand's possible hard register use. */
3191 if (DECL_P (val)
3192 && REG_P (DECL_RTL (val))
3193 && HARD_REGISTER_P (DECL_RTL (val)))
3195 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3196 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3197 unsigned long match;
3199 /* Verify the other outputs do not use the same hard register. */
3200 for (j = i + 1; j < noutputs; ++j)
3201 if (DECL_P (output_tvec[j])
3202 && REG_P (DECL_RTL (output_tvec[j]))
3203 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3204 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3205 error ("invalid hard register usage between output operands");
3207 /* Verify matching constraint operands use the same hard register
3208 and that the non-matching constraint operands do not use the same
3209 hard register if the output is an early clobber operand. */
3210 for (j = 0; j < ninputs; ++j)
3211 if (DECL_P (input_tvec[j])
3212 && REG_P (DECL_RTL (input_tvec[j]))
3213 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3215 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
/* MATCH is the operand number named by a leading-digit (matching)
constraint, or ULONG_MAX when the constraint does not start with a
digit. */
3216 switch (*constraints[j + noutputs])
3218 case '0': case '1': case '2': case '3': case '4':
3219 case '5': case '6': case '7': case '8': case '9':
3220 match = strtoul (constraints[j + noutputs], NULL, 10);
3221 break;
3222 default:
3223 match = ULONG_MAX;
3224 break;
3226 if (i == match
3227 && output_hregno != input_hregno)
3228 error ("invalid hard register usage between output operand "
3229 "and matching constraint operand");
3230 else if (early_clobber_p
3231 && i != match
3232 && output_hregno == input_hregno)
3233 error ("invalid hard register usage between earlyclobber "
3234 "operand and input operand");
3238 if (! allows_reg
3239 && (allows_mem
3240 || is_inout
3241 || (DECL_P (val)
3242 && REG_P (DECL_RTL (val))
3243 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3244 mark_addressable (val);
3247 for (i = 0; i < ninputs; ++i)
3249 bool allows_reg, allows_mem;
3250 const char *constraint;
3252 constraint = constraints[i + noutputs];
3253 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3254 constraints.address (),
3255 &allows_mem, &allows_reg))
3256 return;
3258 if (! allows_reg && allows_mem)
3259 mark_addressable (input_tvec[i]);
3262 /* Second pass evaluates arguments. */
3264 /* Make sure stack is consistent for asm goto. */
3265 if (nlabels > 0)
3266 do_pending_stack_adjust ();
3267 int old_generating_concat_p = generating_concat_p;
3269 /* Vector of RTX's of evaluated output operands. */
3270 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3271 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
/* Insns that copy temporaries back to the real output operands are
collected in this sequence and emitted after the asm. */
3272 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3274 output_rvec.safe_grow (noutputs, true);
3276 for (i = 0; i < noutputs; ++i)
3278 tree val = output_tvec[i];
3279 tree type = TREE_TYPE (val);
3280 bool is_inout, allows_reg, allows_mem, ok;
3281 rtx op;
3283 ok = parse_output_constraint (&constraints[i], i, ninputs,
3284 noutputs, &allows_mem, &allows_reg,
3285 &is_inout);
3286 gcc_assert (ok);
3288 /* If an output operand is not a decl or indirect ref and our constraint
3289 allows a register, make a temporary to act as an intermediate.
3290 Make the asm insn write into that, then we will copy it to
3291 the real output operand. Likewise for promoted variables. */
3293 generating_concat_p = 0;
3295 if ((TREE_CODE (val) == INDIRECT_REF && allows_mem)
3296 || (DECL_P (val)
3297 && (allows_mem || REG_P (DECL_RTL (val)))
3298 && ! (REG_P (DECL_RTL (val))
3299 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3300 || ! allows_reg
3301 || is_inout
3302 || TREE_ADDRESSABLE (type))
3304 op = expand_expr (val, NULL_RTX, VOIDmode,
3305 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3306 if (MEM_P (op))
3307 op = validize_mem (op);
3309 if (! allows_reg && !MEM_P (op))
3310 error ("output number %d not directly addressable", i);
3311 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3312 || GET_CODE (op) == CONCAT)
3314 rtx old_op = op;
3315 op = gen_reg_rtx (GET_MODE (op));
3317 generating_concat_p = old_generating_concat_p;
3319 if (is_inout)
3320 emit_move_insn (op, old_op);
3322 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3323 emit_move_insn (old_op, op);
3324 after_rtl_seq = get_insns ();
3325 after_rtl_end = get_last_insn ();
3326 end_sequence ();
3329 else
3331 op = assign_temp (type, 0, 1);
3332 op = validize_mem (op);
3333 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3334 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3336 generating_concat_p = old_generating_concat_p;
3338 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3339 expand_assignment (val, make_tree (type, op), false);
3340 after_rtl_seq = get_insns ();
3341 after_rtl_end = get_last_insn ();
3342 end_sequence ();
3344 output_rvec[i] = op;
3346 if (is_inout)
3347 inout_opnum.safe_push (i);
3350 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3351 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3353 input_rvec.safe_grow (ninputs, true);
3354 input_mode.safe_grow (ninputs, true);
3356 generating_concat_p = 0;
3358 for (i = 0; i < ninputs; ++i)
3360 tree val = input_tvec[i];
3361 tree type = TREE_TYPE (val);
3362 bool allows_reg, allows_mem, ok;
3363 const char *constraint;
3364 rtx op;
3366 constraint = constraints[i + noutputs];
3367 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3368 constraints.address (),
3369 &allows_mem, &allows_reg);
3370 gcc_assert (ok);
3372 /* EXPAND_INITIALIZER will not generate code for valid initializer
3373 constants, but will still generate code for other types of operand.
3374 This is the behavior we want for constant constraints. */
3375 op = expand_expr (val, NULL_RTX, VOIDmode,
3376 allows_reg ? EXPAND_NORMAL
3377 : allows_mem ? EXPAND_MEMORY
3378 : EXPAND_INITIALIZER);
3380 /* Never pass a CONCAT to an ASM. */
3381 if (GET_CODE (op) == CONCAT)
3382 op = force_reg (GET_MODE (op), op);
3383 else if (MEM_P (op))
3384 op = validize_mem (op);
3386 if (asm_operand_ok (op, constraint, NULL) <= 0)
3388 if (allows_reg && TYPE_MODE (type) != BLKmode)
3389 op = force_reg (TYPE_MODE (type), op);
3390 else if (!allows_mem)
3391 warning (0, "%<asm%> operand %d probably does not match "
3392 "constraints",
3393 i + noutputs);
3394 else if (MEM_P (op))
3396 /* We won't recognize either volatile memory or memory
3397 with a queued address as a valid memory_operand
3398 at this point. Ignore it: clearly this *is* a memory. */
3400 else
3401 gcc_unreachable ();
3403 input_rvec[i] = op;
3404 input_mode[i] = TYPE_MODE (type);
3407 /* For in-out operands, copy output rtx to input rtx. The new input
gets a matching constraint made of the output operand's number. */
3408 unsigned ninout = inout_opnum.length();
3409 for (i = 0; i < ninout; i++)
3411 int j = inout_opnum[i];
3412 rtx o = output_rvec[j];
3414 input_rvec.safe_push (o);
3415 input_mode.safe_push (GET_MODE (o));
3417 char buffer[16];
3418 sprintf (buffer, "%d", j);
3419 constraints.safe_push (ggc_strdup (buffer));
/* From here on NINPUTS also counts the in-out operands appended above;
loops that walk only the original inputs use NINPUTS - NINOUT. */
3421 ninputs += ninout;
3423 /* Sometimes we wish to automatically clobber registers across an asm.
3424 Case in point is when the i386 backend moved from cc0 to a hard reg --
3425 maintaining source-level compatibility means automatically clobbering
3426 the flags register. */
3427 rtx_insn *after_md_seq = NULL;
3428 if (targetm.md_asm_adjust)
3429 after_md_seq
3430 = targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
3431 constraints, clobber_rvec, clobbered_regs);
3433 /* Do not allow the hook to change the output and input count,
3434 lest it mess up the operand numbering. */
3435 gcc_assert (output_rvec.length() == noutputs);
3436 gcc_assert (input_rvec.length() == ninputs);
3437 gcc_assert (constraints.length() == noutputs + ninputs);
3439 /* But it certainly can adjust the clobbers. */
3440 unsigned nclobbers = clobber_rvec.length ();
3442 /* Third pass checks for easy conflicts. */
3443 /* ??? Why are we doing this on trees instead of rtx. */
3445 bool clobber_conflict_found = 0;
3446 for (i = 0; i < noutputs; ++i)
3447 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3448 clobber_conflict_found = 1;
3449 for (i = 0; i < ninputs - ninout; ++i)
3450 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3451 clobber_conflict_found = 1;
3453 /* Make vectors for the expression-rtx, constraint strings,
3454 and named operands. */
3456 rtvec argvec = rtvec_alloc (ninputs);
3457 rtvec constraintvec = rtvec_alloc (ninputs);
3458 rtvec labelvec = rtvec_alloc (nlabels);
3460 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3461 : GET_MODE (output_rvec[0])),
3462 ggc_strdup (gimple_asm_string (stmt)),
3463 "", 0, argvec, constraintvec,
3464 labelvec, locus);
3465 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3467 for (i = 0; i < ninputs; ++i)
3469 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3470 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3471 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3472 constraints[i + noutputs],
3473 locus);
3476 /* Copy labels to the vector. */
3477 rtx_code_label *fallthru_label = NULL;
3478 if (nlabels > 0)
3480 basic_block fallthru_bb = NULL;
3481 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3482 if (fallthru)
3483 fallthru_bb = fallthru->dest;
3485 for (i = 0; i < nlabels; ++i)
3487 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3488 rtx_insn *r;
3489 /* If asm goto has any labels in the fallthru basic block, use
3490 a label that we emit immediately after the asm goto. Expansion
3491 may insert further instructions into the same basic block after
3492 asm goto and if we don't do this, insertion of instructions on
3493 the fallthru edge might misbehave. See PR58670. */
3494 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3496 if (fallthru_label == NULL_RTX)
3497 fallthru_label = gen_label_rtx ();
3498 r = fallthru_label;
3500 else
3501 r = label_rtx (label);
3502 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3506 /* Now, for each output, construct an rtx
3507 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3508 ARGVEC CONSTRAINTS OPNAMES))
3509 If there is more than one, put them inside a PARALLEL. */
3511 if (noutputs == 0 && nclobbers == 0)
3513 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3514 if (nlabels > 0)
3515 emit_jump_insn (body);
3516 else
3517 emit_insn (body);
3519 else if (noutputs == 1 && nclobbers == 0)
3521 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3522 if (nlabels > 0)
3523 emit_jump_insn (gen_rtx_SET (output_rvec[0], body));
3524 else
3525 emit_insn (gen_rtx_SET (output_rvec[0], body));
3527 else
3529 rtx obody = body;
3530 int num = noutputs;
3532 if (num == 0)
3533 num = 1;
3535 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3537 /* For each output operand, store a SET. */
3538 for (i = 0; i < noutputs; ++i)
3540 rtx src, o = output_rvec[i];
3541 if (i == 0)
3543 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3544 src = obody;
3546 else
3548 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3549 ASM_OPERANDS_TEMPLATE (obody),
3550 constraints[i], i, argvec,
3551 constraintvec, labelvec, locus);
3552 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3554 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3557 /* If there are no outputs (but there are some clobbers)
3558 store the bare ASM_OPERANDS into the PARALLEL. */
3559 if (i == 0)
3560 XVECEXP (body, 0, i++) = obody;
3562 /* Store (clobber REG) for each clobbered register specified. */
3563 for (unsigned j = 0; j < nclobbers; ++j)
3565 rtx clobbered_reg = clobber_rvec[j];
3567 /* Sanity-check for overlap between this clobber and the inputs and
3568 outputs that has not already been handled. Such overlap
3569 should have been detected and reported above. */
3570 if (!clobber_conflict_found && REG_P (clobbered_reg))
3572 /* The checks below look at the operand vectors (output_rvec and
3573 input_rvec), not at the under-construction body. */
3574 for (unsigned k = 0; k < noutputs; ++k)
3575 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3576 internal_error ("%<asm%> clobber conflict with "
3577 "output operand");
3579 for (unsigned k = 0; k < ninputs - ninout; ++k)
3580 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3581 internal_error ("%<asm%> clobber conflict with "
3582 "input operand");
3585 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3588 if (nlabels > 0)
3589 emit_jump_insn (body);
3590 else
3591 emit_insn (body);
3594 generating_concat_p = old_generating_concat_p;
3596 if (fallthru_label)
3597 emit_label (fallthru_label);
3599 if (after_md_seq)
3600 emit_insn (after_md_seq);
3601 if (after_rtl_seq)
3603 if (nlabels == 0)
3604 emit_insn (after_rtl_seq);
3605 else
/* For asm goto, a copy of the output copy-back sequence is inserted on
every successor edge of the statement's basic block. */
3607 edge e;
3608 edge_iterator ei;
3610 FOR_EACH_EDGE (e, ei, gimple_bb (stmt)->succs)
3612 start_sequence ();
3613 for (rtx_insn *curr = after_rtl_seq;
3614 curr != NULL_RTX;
3615 curr = NEXT_INSN (curr))
3616 emit_insn (copy_insn (PATTERN (curr)));
3617 rtx_insn *copy = get_insns ();
3618 end_sequence ();
3619 insert_insn_on_edge (copy, e);
3624 free_temp_slots ();
3625 crtl->has_asm_statement = 1;
3628 /* Emit code to jump to the address
3629 specified by the pointer expression EXP. EXP is expanded with
expand_normal, then do_pending_stack_adjust is called before the jump
is emitted with emit_indirect_jump. */
3631 static void
3632 expand_computed_goto (tree exp)
3634 rtx x = expand_normal (exp);
3636 do_pending_stack_adjust ();
3637 emit_indirect_jump (x);
3640 /* Generate RTL code for a `goto' statement with target label LABEL.
3641 LABEL should be a LABEL_DECL tree node that was or will later be
3642 defined with `expand_label'. When flag_checking is set, this also
asserts that LABEL's function context is either null or the current
function. */
3644 static void
3645 expand_goto (tree label)
3647 if (flag_checking)
3649 /* Check for a nonlocal goto to a containing function. Such a goto
3650 should have been translated to __builtin_nonlocal_goto. */
3651 tree context = decl_function_context (label);
3652 gcc_assert (!context || context == current_function_decl);
3655 emit_jump (jump_target_rtx (label));
3658 /* Output a return with no value: call clear_pending_stack_adjust and
do_pending_stack_adjust, then emit a jump to return_label. */
3660 static void
3661 expand_null_return_1 (void)
3663 clear_pending_stack_adjust ();
3664 do_pending_stack_adjust ();
3665 emit_jump (return_label);
3668 /* Generate RTL to return from the current function, with no value.
3669 (That is, we do not do anything about returning any value.) The
return registers are clobbered first, then expand_null_return_1 emits
the actual return jump. */
3671 void
3672 expand_null_return (void)
3674 /* If this function was declared to return a value, but we
3675 didn't, clobber the return registers so that they are not
3676 propagated live to the rest of the function. */
3677 clobber_return_register ();
3679 expand_null_return_1 ();
3682 /* Generate RTL to return from the current function, with value VAL.
VAL is copied into the DECL_RTL of the function's DECL_RESULT (after
conversion to the promoted return mode when that differs from the
decl's mode), and then the return jump is emitted through
expand_null_return_1. */
3684 static void
3685 expand_value_return (rtx val)
3687 /* Copy the value to the return location unless it's already there. */
3689 tree decl = DECL_RESULT (current_function_decl);
3690 rtx return_reg = DECL_RTL (decl);
3691 if (return_reg != val)
3693 tree funtype = TREE_TYPE (current_function_decl);
3694 tree type = TREE_TYPE (decl);
3695 int unsignedp = TYPE_UNSIGNED (type);
3696 machine_mode old_mode = DECL_MODE (decl);
3697 machine_mode mode;
/* NOTE(review): the last argument (2 vs. 1) presumably selects how
promote_function_mode treats a result returned by reference -- confirm
against that function's documentation. */
3698 if (DECL_BY_REFERENCE (decl))
3699 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3700 else
3701 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3703 if (mode != old_mode)
3704 val = convert_modes (mode, old_mode, val, unsignedp);
/* A PARALLEL return location is filled with emit_group_load; anything
else gets a plain move. */
3706 if (GET_CODE (return_reg) == PARALLEL)
3707 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3708 else
3709 emit_move_insn (return_reg, val);
3712 expand_null_return_1 ();
3715 /* Generate RTL to evaluate the expression RETVAL and return it
3716 from the current function. RETVAL may be error_mark_node, or a
MODIFY_EXPR / INIT_EXPR whose left-hand side is the RESULT_DECL, in which
case only its right-hand side is treated as the value to return. */
3718 static void
3719 expand_return (tree retval)
3721 rtx result_rtl;
3722 rtx val = 0;
3723 tree retval_rhs;
3725 /* If function wants no value, give it none. RETVAL is still expanded
before the null return is emitted. */
3726 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3728 expand_normal (retval);
3729 expand_null_return ();
3730 return;
3733 if (retval == error_mark_node)
3735 /* Treat this like a return of no value from a function that
3736 returns a value. */
3737 expand_null_return ();
3738 return;
3740 else if ((TREE_CODE (retval) == MODIFY_EXPR
3741 || TREE_CODE (retval) == INIT_EXPR)
3742 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3743 retval_rhs = TREE_OPERAND (retval, 1);
3744 else
3745 retval_rhs = retval;
3747 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3749 /* If we are returning the RESULT_DECL, then the value has already
3750 been stored into it, so we don't have to do anything special. */
3751 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3752 expand_value_return (result_rtl);
3754 /* If the result is an aggregate that is being returned in one (or more)
3755 registers, load the registers here. */
3757 else if (retval_rhs != 0
3758 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3759 && REG_P (result_rtl))
3761 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3762 if (val)
3764 /* Use the mode of the result value on the return register. */
3765 PUT_MODE (result_rtl, GET_MODE (val));
3766 expand_value_return (val);
3768 else
3769 expand_null_return ();
3771 else if (retval_rhs != 0
3772 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3773 && (REG_P (result_rtl)
3774 || (GET_CODE (result_rtl) == PARALLEL)))
3776 /* Compute the return value into a temporary (usually a pseudo reg).
NOTE(review): the assignment target line (presumably `val') that should
precede the next line is not visible in this listing. */
3778 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3779 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3780 val = force_not_mem (val);
3781 expand_value_return (val);
3783 else
3785 /* No hard reg used; calculate value into hard return reg. */
3786 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3787 expand_value_return (result_rtl);
3791 /* Expand a clobber of LHS. If LHS is stored in a multi-part
3792 register, tell the rtl optimizers that its value is no longer
3793 needed. Nothing is emitted unless LHS is a decl whose DECL_RTL is
already set to a REG whose mode is larger than REGMODE_NATURAL_SIZE
of that mode. */
3795 static void
3796 expand_clobber (tree lhs)
3798 if (DECL_P (lhs))
3800 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3801 if (decl_rtl && REG_P (decl_rtl))
3803 machine_mode decl_mode = GET_MODE (decl_rtl);
3804 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3805 REGMODE_NATURAL_SIZE (decl_mode)))
3806 emit_clobber (decl_rtl);
3811 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3812 STMT that doesn't require special handling for outgoing edges. That
3813 is, no tailcalls and no GIMPLE_COND. The current insn location is set
from STMT's location before dispatching on the statement code; any
statement code not handled below hits gcc_unreachable. */
3815 static void
3816 expand_gimple_stmt_1 (gimple *stmt)
3818 tree op0;
3820 set_curr_insn_location (gimple_location (stmt));
3822 switch (gimple_code (stmt))
3824 case GIMPLE_GOTO:
/* A LABEL_DECL destination is a direct goto; anything else is expanded
as a computed goto. */
3825 op0 = gimple_goto_dest (stmt);
3826 if (TREE_CODE (op0) == LABEL_DECL)
3827 expand_goto (op0);
3828 else
3829 expand_computed_goto (op0);
3830 break;
3831 case GIMPLE_LABEL:
3832 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3833 break;
3834 case GIMPLE_NOP:
3835 case GIMPLE_PREDICT:
3836 break;
3837 case GIMPLE_SWITCH:
/* A switch with a single label (the default) is just a goto to it. */
3839 gswitch *swtch = as_a <gswitch *> (stmt);
3840 if (gimple_switch_num_labels (swtch) == 1)
3841 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3842 else
3843 expand_case (swtch);
3845 break;
3846 case GIMPLE_ASM:
3847 expand_asm_stmt (as_a <gasm *> (stmt));
3848 break;
3849 case GIMPLE_CALL:
3850 expand_call_stmt (as_a <gcall *> (stmt));
3851 break;
3853 case GIMPLE_RETURN:
3855 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3857 /* If a return doesn't have a location, it very likely represents
3858 multiple user returns so we cannot let it inherit the location
3859 of the last statement of the previous basic block in RTL. */
3860 if (!gimple_has_location (stmt))
3861 set_curr_insn_location (cfun->function_end_locus);
3863 if (op0 && op0 != error_mark_node)
3865 tree result = DECL_RESULT (current_function_decl);
3867 /* If we are not returning the current function's RESULT_DECL,
3868 build an assignment to it. */
3869 if (op0 != result)
3871 /* I believe that a function's RESULT_DECL is unique. */
3872 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3874 /* ??? We'd like to use simply expand_assignment here,
3875 but this fails if the value is of BLKmode but the return
3876 decl is a register. expand_return has special handling
3877 for this combination, which eventually should move
3878 to common code. See comments there. Until then, let's
3879 build a modify expression :-/ */
3880 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3881 result, op0);
3885 if (!op0)
3886 expand_null_return ();
3887 else
3888 expand_return (op0);
3890 break;
3892 case GIMPLE_ASSIGN:
3894 gassign *assign_stmt = as_a <gassign *> (stmt);
3895 tree lhs = gimple_assign_lhs (assign_stmt);
3897 /* Tree expand used to fiddle with |= and &= of two bitfield
3898 COMPONENT_REFs here. This can't happen with gimple, the LHS
3899 of binary assigns must be a gimple reg. */
3901 if (TREE_CODE (lhs) != SSA_NAME
3902 || gimple_assign_rhs_class (assign_stmt) == GIMPLE_SINGLE_RHS)
3904 tree rhs = gimple_assign_rhs1 (assign_stmt);
3905 gcc_assert (gimple_assign_rhs_class (assign_stmt)
3906 == GIMPLE_SINGLE_RHS);
3907 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3908 /* Do not put locations on possibly shared trees. */
3909 && !is_gimple_min_invariant (rhs))
3910 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3911 if (TREE_CLOBBER_P (rhs))
3912 /* This is a clobber to mark the going out of scope for
3913 this LHS. */
3914 expand_clobber (lhs);
3915 else
3916 expand_assignment (lhs, rhs,
3917 gimple_assign_nontemporal_move_p (
3918 assign_stmt));
3920 else
/* SSA_NAME destination with a unary, binary or ternary right-hand side:
collect the operands into OPS and expand them with expand_expr_real_2. */
3922 rtx target, temp;
3923 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3924 struct separate_ops ops;
3925 bool promoted = false;
3927 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3928 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3929 promoted = true;
3931 ops.code = gimple_assign_rhs_code (assign_stmt);
3932 ops.type = TREE_TYPE (lhs);
/* The cases deliberately fall through so that a ternary RHS fills op2,
op1 and op0, a binary RHS op1 and op0, and a unary RHS op0 only. */
3933 switch (get_gimple_rhs_class (ops.code))
3935 case GIMPLE_TERNARY_RHS:
3936 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3937 /* Fallthru */
3938 case GIMPLE_BINARY_RHS:
3939 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3940 /* Fallthru */
3941 case GIMPLE_UNARY_RHS:
3942 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3943 break;
3944 default:
3945 gcc_unreachable ();
3947 ops.location = gimple_location (stmt);
3949 /* If we want to use a nontemporal store, force the value to
3950 register first. If we store into a promoted register,
3951 don't directly expand to target. */
3952 temp = nontemporal || promoted ? NULL_RTX : target;
3953 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3954 EXPAND_NORMAL);
3956 if (temp == target)
/* NOTE(review): no body is visible for this test in this listing;
presumably an empty statement follows, i.e. nothing is left to do when
the value was expanded straight into TARGET. */
3958 else if (promoted)
3960 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3961 /* If TEMP is a VOIDmode constant, use convert_modes to make
3962 sure that we properly convert it. */
3963 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3965 temp = convert_modes (GET_MODE (target),
3966 TYPE_MODE (ops.type),
3967 temp, unsignedp);
3968 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3969 GET_MODE (target), temp, unsignedp);
3972 convert_move (SUBREG_REG (target), temp, unsignedp);
3974 else if (nontemporal && emit_storent_insn (target, temp))
/* NOTE(review): likewise no body is visible here; presumably an empty
statement, the store having been emitted by emit_storent_insn. */
3976 else
3978 temp = force_operand (temp, target);
3979 if (temp != target)
3980 emit_move_insn (target, temp);
3984 break;
3986 default:
3987 gcc_unreachable ();
3991 /* Expand one gimple statement STMT and return the last RTL instruction
3992 before any of the newly generated ones (i.e. the value of
get_last_insn on entry).
3994 In addition to generating the necessary RTL instructions this also
3995 sets REG_EH_REGION notes if necessary and sets the current source
3996 location for diagnostics. input_location is restored to its previous
value before returning. */
3998 static rtx_insn *
3999 expand_gimple_stmt (gimple *stmt)
4001 location_t saved_location = input_location;
4002 rtx_insn *last = get_last_insn ();
4003 int lp_nr;
4005 gcc_assert (cfun);
4007 /* We need to save and restore the current source location so that errors
4008 discovered during expansion are emitted with the right location. But
4009 it would be better if the diagnostic routines used the source location
4010 embedded in the tree nodes rather than globals. */
4011 if (gimple_has_location (stmt))
4012 input_location = gimple_location (stmt);
4014 expand_gimple_stmt_1 (stmt);
4016 /* Free any temporaries used to evaluate this statement. */
4017 free_temp_slots ();
4019 input_location = saved_location;
4021 /* Mark all insns that may trap. Only done when STMT has a nonzero
landing-pad number; the walk covers the real insns following LAST. */
4022 lp_nr = lookup_stmt_eh_lp (stmt);
4023 if (lp_nr)
4025 rtx_insn *insn;
4026 for (insn = next_real_insn (last); insn;
4027 insn = next_real_insn (insn))
4029 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
4030 /* If we want exceptions for non-call insns, any
4031 may_trap_p instruction may throw. */
4032 && GET_CODE (PATTERN (insn)) != CLOBBER
4033 && GET_CODE (PATTERN (insn)) != USE
4034 && insn_could_throw_p (insn))
4035 make_reg_eh_region_note (insn, 0, lp_nr);
4039 return last;
4042 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
4043 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
4044 generated a tail call (something that might be denied by the ABI
4045 rules governing the call; see calls.c). When no sibling call insn was
generated, NULL is returned and *CAN_FALLTHRU is set to true.
4047 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
4048 can still reach the rest of BB. The case here is __builtin_sqrt,
4049 where the NaN result goes through the external function (with a
4050 tailcall) and the normal result happens via a sqrt instruction. */
4052 static basic_block
4053 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
4055 rtx_insn *last2, *last;
4056 edge e;
4057 edge_iterator ei;
4058 profile_probability probability;
4060 last2 = last = expand_gimple_stmt (stmt);
/* Look for a sibling call among the insns just generated. */
4062 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
4063 if (CALL_P (last) && SIBLING_CALL_P (last))
4064 goto found;
4066 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4068 *can_fallthru = true;
4069 return NULL;
4071 found:
4072 /* ??? Wouldn't it be better to just reset any pending stack adjust?
4073 Any instructions emitted here are about to be deleted. */
4074 do_pending_stack_adjust ();
4076 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
4077 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
4078 EH or abnormal edges, we shouldn't have created a tail call in
4079 the first place. So it seems to me we should just be removing
4080 all edges here, or redirecting the existing fallthru edge to
4081 the exit block. */
4083 probability = profile_probability::never ();
/* The iterator is only advanced when the edge is kept; after
remove_edge the same iterator position is examined again. The
probabilities of the removed edges are summed for the new exit edge. */
4085 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
4087 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
4089 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
4090 e->dest->count -= e->count ();
4091 probability += e->probability;
4092 remove_edge (e);
4094 else
4095 ei_next (&ei);
4098 /* This is somewhat ugly: the call_expr expander often emits instructions
4099 after the sibcall (to perform the function return). These confuse the
4100 find_many_sub_basic_blocks code, so we need to get rid of these. */
4101 last = NEXT_INSN (last);
4102 gcc_assert (BARRIER_P (last));
4104 *can_fallthru = false;
4105 while (NEXT_INSN (last))
4107 /* For instance, the sqrt builtin expander expands to an `if' with
4108 the sibcall in the `then' arm and a label for the `else' arm. */
4109 if (LABEL_P (NEXT_INSN (last)))
4111 *can_fallthru = true;
4112 break;
4114 delete_insn (NEXT_INSN (last));
4117 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
4118 | EDGE_SIBCALL);
4119 e->probability = probability;
4120 BB_END (bb) = last;
4121 update_bb_for_insn (bb);
/* Insns remaining after the barrier (the conditional-tailcall case) are
placed in a new basic block, which becomes the returned block. */
4123 if (NEXT_INSN (last))
4125 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
4127 last = BB_END (bb);
4128 if (BARRIER_P (last))
4129 BB_END (bb) = PREV_INSN (last);
4132 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4134 return bb;
4137 /* Return the difference between the floor and the truncated result of
4138 a signed division by OP1 with remainder MOD. The difference is
returned as an IF_THEN_ELSE rtx of mode MODE evaluating to -1 or 0. */
4139 static rtx
4140 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4142 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
4143 return gen_rtx_IF_THEN_ELSE
4144 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4145 gen_rtx_IF_THEN_ELSE
4146 (mode, gen_rtx_LT (BImode,
4147 gen_rtx_DIV (mode, op1, mod),
4148 const0_rtx),
4149 constm1_rtx, const0_rtx),
4150 const0_rtx);
4153 /* Return the difference between the ceil and the truncated result of
4154 a signed division by OP1 with remainder MOD. The difference is
returned as an IF_THEN_ELSE rtx of mode MODE evaluating to 1 or 0. */
4155 static rtx
4156 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4158 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
4159 return gen_rtx_IF_THEN_ELSE
4160 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4161 gen_rtx_IF_THEN_ELSE
4162 (mode, gen_rtx_GT (BImode,
4163 gen_rtx_DIV (mode, op1, mod),
4164 const0_rtx),
4165 const1_rtx, const0_rtx),
4166 const0_rtx);
4169 /* Return the difference between the ceil and the truncated result of
4170 an unsigned division by OP1 with remainder MOD. OP1 is not used: the
adjustment is 1 whenever MOD is nonzero and 0 otherwise, returned as an
IF_THEN_ELSE rtx of mode MODE. */
4171 static rtx
4172 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
4174 /* (mod != 0 ? 1 : 0) */
4175 return gen_rtx_IF_THEN_ELSE
4176 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4177 const1_rtx, const0_rtx);
4180 /* Return the difference between the rounded and the truncated result
4181 of a signed division by OP1 with remainder MOD. Halfway cases are
4182 rounded away from zero, rather than to the nearest even number. The
difference is returned as an IF_THEN_ELSE rtx of mode MODE evaluating
to 1, -1 or 0. */
4183 static rtx
4184 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4186 /* (abs (mod) >= abs (op1) - abs (mod)
4187 ? (op1 / mod > 0 ? 1 : -1)
4188 : 0) */
4189 return gen_rtx_IF_THEN_ELSE
4190 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
4191 gen_rtx_MINUS (mode,
4192 gen_rtx_ABS (mode, op1),
4193 gen_rtx_ABS (mode, mod))),
4194 gen_rtx_IF_THEN_ELSE
4195 (mode, gen_rtx_GT (BImode,
4196 gen_rtx_DIV (mode, op1, mod),
4197 const0_rtx),
4198 const1_rtx, constm1_rtx),
4199 const0_rtx);
4202 /* Return the difference between the rounded and the truncated result
4203 of an unsigned division by OP1 with remainder MOD. Halfway cases
4204 are rounded away from zero, rather than to the nearest even
4205 number. The difference is returned as an IF_THEN_ELSE rtx of mode
MODE evaluating to 1 or 0. */
4206 static rtx
4207 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4209 /* (mod >= op1 - mod ? 1 : 0) */
4210 return gen_rtx_IF_THEN_ELSE
4211 (mode, gen_rtx_GE (BImode, mod,
4212 gen_rtx_MINUS (mode, op1, mod)),
4213 const1_rtx, const0_rtx);
4216 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4217 any rtl. */
4219 static rtx
4220 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4221 addr_space_t as)
4223 #ifndef POINTERS_EXTEND_UNSIGNED
4224 gcc_assert (mode == Pmode
4225 || mode == targetm.addr_space.address_mode (as));
4226 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4227 #else
4228 rtx temp;
4230 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
4232 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4233 return x;
4235 /* X must have some form of address mode already. */
4236 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
4237 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4238 x = lowpart_subreg (mode, x, xmode);
4239 else if (POINTERS_EXTEND_UNSIGNED > 0)
4240 x = gen_rtx_ZERO_EXTEND (mode, x);
4241 else if (!POINTERS_EXTEND_UNSIGNED)
4242 x = gen_rtx_SIGN_EXTEND (mode, x);
4243 else
4245 switch (GET_CODE (x))
4247 case SUBREG:
4248 if ((SUBREG_PROMOTED_VAR_P (x)
4249 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4250 || (GET_CODE (SUBREG_REG (x)) == PLUS
4251 && REG_P (XEXP (SUBREG_REG (x), 0))
4252 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4253 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4254 && GET_MODE (SUBREG_REG (x)) == mode)
4255 return SUBREG_REG (x);
4256 break;
4257 case LABEL_REF:
4258 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4259 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4260 return temp;
4261 case SYMBOL_REF:
4262 temp = shallow_copy_rtx (x);
4263 PUT_MODE (temp, mode);
4264 return temp;
4265 case CONST:
4266 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4267 if (temp)
4268 temp = gen_rtx_CONST (mode, temp);
4269 return temp;
4270 case PLUS:
4271 case MINUS:
4272 if (CONST_INT_P (XEXP (x, 1)))
4274 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4275 if (temp)
4276 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4278 break;
4279 default:
4280 break;
4282 /* Don't know how to express ptr_extend as operation in debug info. */
4283 return NULL;
4285 #endif /* POINTERS_EXTEND_UNSIGNED */
4287 return x;
4290 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4291 by avoid_deep_ter_for_debug. */
4293 static hash_map<tree, tree> *deep_ter_debug_map;
4295 /* Split too deep TER chains for debug stmts using debug temporaries. */
4297 static void
4298 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4300 use_operand_p use_p;
4301 ssa_op_iter iter;
4302 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4304 tree use = USE_FROM_PTR (use_p);
4305 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4306 continue;
4307 gimple *g = get_gimple_for_ssa_name (use);
4308 if (g == NULL)
4309 continue;
4310 if (depth > 6 && !stmt_ends_bb_p (g))
4312 if (deep_ter_debug_map == NULL)
4313 deep_ter_debug_map = new hash_map<tree, tree>;
4315 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4316 if (vexpr != NULL)
4317 continue;
4318 vexpr = make_node (DEBUG_EXPR_DECL);
4319 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4320 DECL_ARTIFICIAL (vexpr) = 1;
4321 TREE_TYPE (vexpr) = TREE_TYPE (use);
4322 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4323 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4324 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4325 avoid_deep_ter_for_debug (def_temp, 0);
4327 else
4328 avoid_deep_ter_for_debug (g, depth + 1);
4332 /* Return an RTX equivalent to the value of the parameter DECL. */
4334 static rtx
4335 expand_debug_parm_decl (tree decl)
4337 rtx incoming = DECL_INCOMING_RTL (decl);
4339 if (incoming
4340 && GET_MODE (incoming) != BLKmode
4341 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4342 || (MEM_P (incoming)
4343 && REG_P (XEXP (incoming, 0))
4344 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4346 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4348 #ifdef HAVE_window_save
4349 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4350 If the target machine has an explicit window save instruction, the
4351 actual entry value is the corresponding OUTGOING_REGNO instead. */
4352 if (REG_P (incoming)
4353 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4354 incoming
4355 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4356 OUTGOING_REGNO (REGNO (incoming)), 0);
4357 else if (MEM_P (incoming))
4359 rtx reg = XEXP (incoming, 0);
4360 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4362 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4363 incoming = replace_equiv_address_nv (incoming, reg);
4365 else
4366 incoming = copy_rtx (incoming);
4368 #endif
4370 ENTRY_VALUE_EXP (rtl) = incoming;
4371 return rtl;
4374 if (incoming
4375 && GET_MODE (incoming) != BLKmode
4376 && !TREE_ADDRESSABLE (decl)
4377 && MEM_P (incoming)
4378 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4379 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4380 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4381 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4382 return copy_rtx (incoming);
4384 return NULL_RTX;
4387 /* Return an RTX equivalent to the value of the tree expression EXP. */
4389 static rtx
4390 expand_debug_expr (tree exp)
4392 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4393 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4394 machine_mode inner_mode = VOIDmode;
4395 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4396 addr_space_t as;
4397 scalar_int_mode op0_mode, op1_mode, addr_mode;
4399 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4401 case tcc_expression:
4402 switch (TREE_CODE (exp))
4404 case COND_EXPR:
4405 case DOT_PROD_EXPR:
4406 case SAD_EXPR:
4407 case WIDEN_MULT_PLUS_EXPR:
4408 case WIDEN_MULT_MINUS_EXPR:
4409 goto ternary;
4411 case TRUTH_ANDIF_EXPR:
4412 case TRUTH_ORIF_EXPR:
4413 case TRUTH_AND_EXPR:
4414 case TRUTH_OR_EXPR:
4415 case TRUTH_XOR_EXPR:
4416 goto binary;
4418 case TRUTH_NOT_EXPR:
4419 goto unary;
4421 default:
4422 break;
4424 break;
4426 ternary:
4427 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4428 if (!op2)
4429 return NULL_RTX;
4430 /* Fall through. */
4432 binary:
4433 case tcc_binary:
4434 if (mode == BLKmode)
4435 return NULL_RTX;
4436 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4437 if (!op1)
4438 return NULL_RTX;
4439 switch (TREE_CODE (exp))
4441 case LSHIFT_EXPR:
4442 case RSHIFT_EXPR:
4443 case LROTATE_EXPR:
4444 case RROTATE_EXPR:
4445 case WIDEN_LSHIFT_EXPR:
4446 /* Ensure second operand isn't wider than the first one. */
4447 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4448 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4449 && (GET_MODE_UNIT_PRECISION (mode)
4450 < GET_MODE_PRECISION (op1_mode)))
4451 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4452 break;
4453 default:
4454 break;
4456 /* Fall through. */
4458 unary:
4459 case tcc_unary:
4460 if (mode == BLKmode)
4461 return NULL_RTX;
4462 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4463 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4464 if (!op0)
4465 return NULL_RTX;
4466 break;
4468 case tcc_comparison:
4469 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4470 goto binary;
4472 case tcc_type:
4473 case tcc_statement:
4474 gcc_unreachable ();
4476 case tcc_constant:
4477 case tcc_exceptional:
4478 case tcc_declaration:
4479 case tcc_reference:
4480 case tcc_vl_exp:
4481 break;
4484 switch (TREE_CODE (exp))
4486 case STRING_CST:
4487 if (!lookup_constant_def (exp))
4489 if (strlen (TREE_STRING_POINTER (exp)) + 1
4490 != (size_t) TREE_STRING_LENGTH (exp))
4491 return NULL_RTX;
4492 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4493 op0 = gen_rtx_MEM (BLKmode, op0);
4494 set_mem_attributes (op0, exp, 0);
4495 return op0;
4497 /* Fall through. */
4499 case INTEGER_CST:
4500 case REAL_CST:
4501 case FIXED_CST:
4502 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4503 return op0;
4505 case POLY_INT_CST:
4506 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4508 case COMPLEX_CST:
4509 gcc_assert (COMPLEX_MODE_P (mode));
4510 op0 = expand_debug_expr (TREE_REALPART (exp));
4511 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4512 return gen_rtx_CONCAT (mode, op0, op1);
4514 case DEBUG_EXPR_DECL:
4515 op0 = DECL_RTL_IF_SET (exp);
4517 if (op0)
4519 if (GET_MODE (op0) != mode)
4520 gcc_assert (VECTOR_TYPE_P (TREE_TYPE (exp)));
4521 else
4522 return op0;
4525 op0 = gen_rtx_DEBUG_EXPR (mode);
4526 DEBUG_EXPR_TREE_DECL (op0) = exp;
4527 SET_DECL_RTL (exp, op0);
4529 return op0;
4531 case VAR_DECL:
4532 case PARM_DECL:
4533 case FUNCTION_DECL:
4534 case LABEL_DECL:
4535 case CONST_DECL:
4536 case RESULT_DECL:
4537 op0 = DECL_RTL_IF_SET (exp);
4539 /* This decl was probably optimized away. */
4540 if (!op0
4541 /* At least label RTXen are sometimes replaced by
4542 NOTE_INSN_DELETED_LABEL. Any notes here are not
4543 handled by copy_rtx. */
4544 || NOTE_P (op0))
4546 if (!VAR_P (exp)
4547 || DECL_EXTERNAL (exp)
4548 || !TREE_STATIC (exp)
4549 || !DECL_NAME (exp)
4550 || DECL_HARD_REGISTER (exp)
4551 || DECL_IN_CONSTANT_POOL (exp)
4552 || mode == VOIDmode)
4553 return NULL;
4555 op0 = make_decl_rtl_for_debug (exp);
4556 if (!MEM_P (op0)
4557 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4558 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4559 return NULL;
4561 else
4562 op0 = copy_rtx (op0);
4564 if (GET_MODE (op0) == BLKmode
4565 /* If op0 is not BLKmode, but mode is, adjust_mode
4566 below would ICE. While it is likely a FE bug,
4567 try to be robust here. See PR43166. */
4568 || mode == BLKmode
4569 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4571 gcc_assert (MEM_P (op0));
4572 op0 = adjust_address_nv (op0, mode, 0);
4573 return op0;
4576 /* Fall through. */
4578 adjust_mode:
4579 case PAREN_EXPR:
4580 CASE_CONVERT:
4582 inner_mode = GET_MODE (op0);
4584 if (mode == inner_mode)
4585 return op0;
4587 if (inner_mode == VOIDmode)
4589 if (TREE_CODE (exp) == SSA_NAME)
4590 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4591 else
4592 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4593 if (mode == inner_mode)
4594 return op0;
4597 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4599 if (GET_MODE_UNIT_BITSIZE (mode)
4600 == GET_MODE_UNIT_BITSIZE (inner_mode))
4601 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4602 else if (GET_MODE_UNIT_BITSIZE (mode)
4603 < GET_MODE_UNIT_BITSIZE (inner_mode))
4604 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4605 else
4606 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4608 else if (FLOAT_MODE_P (mode))
4610 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4611 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4612 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4613 else
4614 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4616 else if (FLOAT_MODE_P (inner_mode))
4618 if (unsignedp)
4619 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4620 else
4621 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4623 else if (GET_MODE_UNIT_PRECISION (mode)
4624 == GET_MODE_UNIT_PRECISION (inner_mode))
4625 op0 = lowpart_subreg (mode, op0, inner_mode);
4626 else if (GET_MODE_UNIT_PRECISION (mode)
4627 < GET_MODE_UNIT_PRECISION (inner_mode))
4628 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4629 else if (UNARY_CLASS_P (exp)
4630 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4631 : unsignedp)
4632 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4633 else
4634 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4636 return op0;
4639 case MEM_REF:
4640 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4642 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4643 TREE_OPERAND (exp, 0),
4644 TREE_OPERAND (exp, 1));
4645 if (newexp)
4646 return expand_debug_expr (newexp);
4648 /* FALLTHROUGH */
4649 case INDIRECT_REF:
4650 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4651 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4652 if (!op0)
4653 return NULL;
4655 if (TREE_CODE (exp) == MEM_REF)
4657 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4658 || (GET_CODE (op0) == PLUS
4659 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4660 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4661 Instead just use get_inner_reference. */
4662 goto component_ref;
4664 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4665 poly_int64 offset;
4666 if (!op1 || !poly_int_rtx_p (op1, &offset))
4667 return NULL;
4669 op0 = plus_constant (inner_mode, op0, offset);
4672 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4674 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4675 op0, as);
4676 if (op0 == NULL_RTX)
4677 return NULL;
4679 op0 = gen_rtx_MEM (mode, op0);
4680 set_mem_attributes (op0, exp, 0);
4681 if (TREE_CODE (exp) == MEM_REF
4682 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4683 set_mem_expr (op0, NULL_TREE);
4684 set_mem_addr_space (op0, as);
4686 return op0;
4688 case TARGET_MEM_REF:
4689 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4690 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4691 return NULL;
4693 op0 = expand_debug_expr
4694 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4695 if (!op0)
4696 return NULL;
4698 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4699 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4700 op0, as);
4701 if (op0 == NULL_RTX)
4702 return NULL;
4704 op0 = gen_rtx_MEM (mode, op0);
4706 set_mem_attributes (op0, exp, 0);
4707 set_mem_addr_space (op0, as);
4709 return op0;
4711 component_ref:
4712 case ARRAY_REF:
4713 case ARRAY_RANGE_REF:
4714 case COMPONENT_REF:
4715 case BIT_FIELD_REF:
4716 case REALPART_EXPR:
4717 case IMAGPART_EXPR:
4718 case VIEW_CONVERT_EXPR:
4720 machine_mode mode1;
4721 poly_int64 bitsize, bitpos;
4722 tree offset;
4723 int reversep, volatilep = 0;
4724 tree tem
4725 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4726 &unsignedp, &reversep, &volatilep);
4727 rtx orig_op0;
4729 if (known_eq (bitsize, 0))
4730 return NULL;
4732 orig_op0 = op0 = expand_debug_expr (tem);
4734 if (!op0)
4735 return NULL;
4737 if (offset)
4739 machine_mode addrmode, offmode;
4741 if (!MEM_P (op0))
4742 return NULL;
4744 op0 = XEXP (op0, 0);
4745 addrmode = GET_MODE (op0);
4746 if (addrmode == VOIDmode)
4747 addrmode = Pmode;
4749 op1 = expand_debug_expr (offset);
4750 if (!op1)
4751 return NULL;
4753 offmode = GET_MODE (op1);
4754 if (offmode == VOIDmode)
4755 offmode = TYPE_MODE (TREE_TYPE (offset));
4757 if (addrmode != offmode)
4758 op1 = lowpart_subreg (addrmode, op1, offmode);
4760 /* Don't use offset_address here, we don't need a
4761 recognizable address, and we don't want to generate
4762 code. */
4763 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4764 op0, op1));
4767 if (MEM_P (op0))
4769 if (mode1 == VOIDmode)
4771 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4772 return NULL;
4773 /* Bitfield. */
4774 mode1 = smallest_int_mode_for_size (bitsize);
4776 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4777 if (maybe_ne (bytepos, 0))
4779 op0 = adjust_address_nv (op0, mode1, bytepos);
4780 bitpos = num_trailing_bits (bitpos);
4782 else if (known_eq (bitpos, 0)
4783 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4784 op0 = adjust_address_nv (op0, mode, 0);
4785 else if (GET_MODE (op0) != mode1)
4786 op0 = adjust_address_nv (op0, mode1, 0);
4787 else
4788 op0 = copy_rtx (op0);
4789 if (op0 == orig_op0)
4790 op0 = shallow_copy_rtx (op0);
4791 if (TREE_CODE (tem) != SSA_NAME)
4792 set_mem_attributes (op0, exp, 0);
4795 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4796 return op0;
4798 if (maybe_lt (bitpos, 0))
4799 return NULL;
4801 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4802 return NULL;
4804 poly_int64 bytepos;
4805 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4806 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4808 machine_mode opmode = GET_MODE (op0);
4810 if (opmode == VOIDmode)
4811 opmode = TYPE_MODE (TREE_TYPE (tem));
4813 /* This condition may hold if we're expanding the address
4814 right past the end of an array that turned out not to
4815 be addressable (i.e., the address was only computed in
4816 debug stmts). The gen_subreg below would rightfully
4817 crash, and the address doesn't really exist, so just
4818 drop it. */
4819 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4820 return NULL;
4822 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4823 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4826 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4827 && TYPE_UNSIGNED (TREE_TYPE (exp))
4828 ? SIGN_EXTRACT
4829 : ZERO_EXTRACT, mode,
4830 GET_MODE (op0) != VOIDmode
4831 ? GET_MODE (op0)
4832 : TYPE_MODE (TREE_TYPE (tem)),
4833 op0, gen_int_mode (bitsize, word_mode),
4834 gen_int_mode (bitpos, word_mode));
4837 case ABS_EXPR:
4838 case ABSU_EXPR:
4839 return simplify_gen_unary (ABS, mode, op0, mode);
4841 case NEGATE_EXPR:
4842 return simplify_gen_unary (NEG, mode, op0, mode);
4844 case BIT_NOT_EXPR:
4845 return simplify_gen_unary (NOT, mode, op0, mode);
4847 case FLOAT_EXPR:
4848 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4849 0)))
4850 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4851 inner_mode);
4853 case FIX_TRUNC_EXPR:
4854 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4855 inner_mode);
4857 case POINTER_PLUS_EXPR:
4858 /* For the rare target where pointers are not the same size as
4859 size_t, we need to check for mis-matched modes and correct
4860 the addend. */
4861 if (op0 && op1
4862 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4863 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4864 && op0_mode != op1_mode)
4866 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4867 /* If OP0 is a partial mode, then we must truncate, even
4868 if it has the same bitsize as OP1 as GCC's
4869 representation of partial modes is opaque. */
4870 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4871 && (GET_MODE_BITSIZE (op0_mode)
4872 == GET_MODE_BITSIZE (op1_mode))))
4873 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4874 else
4875 /* We always sign-extend, regardless of the signedness of
4876 the operand, because the operand is always unsigned
4877 here even if the original C expression is signed. */
4878 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4880 /* Fall through. */
4881 case PLUS_EXPR:
4882 return simplify_gen_binary (PLUS, mode, op0, op1);
4884 case MINUS_EXPR:
4885 case POINTER_DIFF_EXPR:
4886 return simplify_gen_binary (MINUS, mode, op0, op1);
4888 case MULT_EXPR:
4889 return simplify_gen_binary (MULT, mode, op0, op1);
4891 case RDIV_EXPR:
4892 case TRUNC_DIV_EXPR:
4893 case EXACT_DIV_EXPR:
4894 if (unsignedp)
4895 return simplify_gen_binary (UDIV, mode, op0, op1);
4896 else
4897 return simplify_gen_binary (DIV, mode, op0, op1);
4899 case TRUNC_MOD_EXPR:
4900 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4902 case FLOOR_DIV_EXPR:
4903 if (unsignedp)
4904 return simplify_gen_binary (UDIV, mode, op0, op1);
4905 else
4907 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4908 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4909 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4910 return simplify_gen_binary (PLUS, mode, div, adj);
4913 case FLOOR_MOD_EXPR:
4914 if (unsignedp)
4915 return simplify_gen_binary (UMOD, mode, op0, op1);
4916 else
4918 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4919 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4920 adj = simplify_gen_unary (NEG, mode,
4921 simplify_gen_binary (MULT, mode, adj, op1),
4922 mode);
4923 return simplify_gen_binary (PLUS, mode, mod, adj);
4926 case CEIL_DIV_EXPR:
4927 if (unsignedp)
4929 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4930 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4931 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4932 return simplify_gen_binary (PLUS, mode, div, adj);
4934 else
4936 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4937 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4938 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4939 return simplify_gen_binary (PLUS, mode, div, adj);
4942 case CEIL_MOD_EXPR:
4943 if (unsignedp)
4945 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4946 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4947 adj = simplify_gen_unary (NEG, mode,
4948 simplify_gen_binary (MULT, mode, adj, op1),
4949 mode);
4950 return simplify_gen_binary (PLUS, mode, mod, adj);
4952 else
4954 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4955 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4956 adj = simplify_gen_unary (NEG, mode,
4957 simplify_gen_binary (MULT, mode, adj, op1),
4958 mode);
4959 return simplify_gen_binary (PLUS, mode, mod, adj);
4962 case ROUND_DIV_EXPR:
4963 if (unsignedp)
4965 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4966 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4967 rtx adj = round_udiv_adjust (mode, mod, op1);
4968 return simplify_gen_binary (PLUS, mode, div, adj);
4970 else
4972 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4973 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4974 rtx adj = round_sdiv_adjust (mode, mod, op1);
4975 return simplify_gen_binary (PLUS, mode, div, adj);
4978 case ROUND_MOD_EXPR:
4979 if (unsignedp)
4981 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4982 rtx adj = round_udiv_adjust (mode, mod, op1);
4983 adj = simplify_gen_unary (NEG, mode,
4984 simplify_gen_binary (MULT, mode, adj, op1),
4985 mode);
4986 return simplify_gen_binary (PLUS, mode, mod, adj);
4988 else
4990 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4991 rtx adj = round_sdiv_adjust (mode, mod, op1);
4992 adj = simplify_gen_unary (NEG, mode,
4993 simplify_gen_binary (MULT, mode, adj, op1),
4994 mode);
4995 return simplify_gen_binary (PLUS, mode, mod, adj);
4998 case LSHIFT_EXPR:
4999 return simplify_gen_binary (ASHIFT, mode, op0, op1);
5001 case RSHIFT_EXPR:
5002 if (unsignedp)
5003 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
5004 else
5005 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
5007 case LROTATE_EXPR:
5008 return simplify_gen_binary (ROTATE, mode, op0, op1);
5010 case RROTATE_EXPR:
5011 return simplify_gen_binary (ROTATERT, mode, op0, op1);
5013 case MIN_EXPR:
5014 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
5016 case MAX_EXPR:
5017 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
5019 case BIT_AND_EXPR:
5020 case TRUTH_AND_EXPR:
5021 return simplify_gen_binary (AND, mode, op0, op1);
5023 case BIT_IOR_EXPR:
5024 case TRUTH_OR_EXPR:
5025 return simplify_gen_binary (IOR, mode, op0, op1);
5027 case BIT_XOR_EXPR:
5028 case TRUTH_XOR_EXPR:
5029 return simplify_gen_binary (XOR, mode, op0, op1);
5031 case TRUTH_ANDIF_EXPR:
5032 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
5034 case TRUTH_ORIF_EXPR:
5035 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
5037 case TRUTH_NOT_EXPR:
5038 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
5040 case LT_EXPR:
5041 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
5042 op0, op1);
5044 case LE_EXPR:
5045 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
5046 op0, op1);
5048 case GT_EXPR:
5049 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
5050 op0, op1);
5052 case GE_EXPR:
5053 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
5054 op0, op1);
5056 case EQ_EXPR:
5057 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
5059 case NE_EXPR:
5060 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
5062 case UNORDERED_EXPR:
5063 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
5065 case ORDERED_EXPR:
5066 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
5068 case UNLT_EXPR:
5069 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
5071 case UNLE_EXPR:
5072 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
5074 case UNGT_EXPR:
5075 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
5077 case UNGE_EXPR:
5078 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
5080 case UNEQ_EXPR:
5081 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
5083 case LTGT_EXPR:
5084 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
5086 case COND_EXPR:
5087 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
5089 case COMPLEX_EXPR:
5090 gcc_assert (COMPLEX_MODE_P (mode));
5091 if (GET_MODE (op0) == VOIDmode)
5092 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
5093 if (GET_MODE (op1) == VOIDmode)
5094 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
5095 return gen_rtx_CONCAT (mode, op0, op1);
5097 case CONJ_EXPR:
5098 if (GET_CODE (op0) == CONCAT)
5099 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
5100 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
5101 XEXP (op0, 1),
5102 GET_MODE_INNER (mode)));
5103 else
5105 scalar_mode imode = GET_MODE_INNER (mode);
5106 rtx re, im;
5108 if (MEM_P (op0))
5110 re = adjust_address_nv (op0, imode, 0);
5111 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
5113 else
5115 scalar_int_mode ifmode;
5116 scalar_int_mode ihmode;
5117 rtx halfsize;
5118 if (!int_mode_for_mode (mode).exists (&ifmode)
5119 || !int_mode_for_mode (imode).exists (&ihmode))
5120 return NULL;
5121 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
5122 re = op0;
5123 if (mode != ifmode)
5124 re = gen_rtx_SUBREG (ifmode, re, 0);
5125 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
5126 if (imode != ihmode)
5127 re = gen_rtx_SUBREG (imode, re, 0);
5128 im = copy_rtx (op0);
5129 if (mode != ifmode)
5130 im = gen_rtx_SUBREG (ifmode, im, 0);
5131 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
5132 if (imode != ihmode)
5133 im = gen_rtx_SUBREG (imode, im, 0);
5135 im = gen_rtx_NEG (imode, im);
5136 return gen_rtx_CONCAT (mode, re, im);
5139 case ADDR_EXPR:
5140 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
5141 if (!op0 || !MEM_P (op0))
5143 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
5144 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
5145 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
5146 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
5147 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
5148 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
5150 if (handled_component_p (TREE_OPERAND (exp, 0)))
5152 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
5153 bool reverse;
5154 tree decl
5155 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
5156 &bitsize, &maxsize, &reverse);
5157 if ((VAR_P (decl)
5158 || TREE_CODE (decl) == PARM_DECL
5159 || TREE_CODE (decl) == RESULT_DECL)
5160 && (!TREE_ADDRESSABLE (decl)
5161 || target_for_debug_bind (decl))
5162 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
5163 && known_gt (bitsize, 0)
5164 && known_eq (bitsize, maxsize))
5166 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
5167 return plus_constant (mode, base, byteoffset);
5171 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
5172 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
5173 == ADDR_EXPR)
5175 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5176 0));
5177 if (op0 != NULL
5178 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
5179 || (GET_CODE (op0) == PLUS
5180 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
5181 && CONST_INT_P (XEXP (op0, 1)))))
5183 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5184 1));
5185 poly_int64 offset;
5186 if (!op1 || !poly_int_rtx_p (op1, &offset))
5187 return NULL;
5189 return plus_constant (mode, op0, offset);
5193 return NULL;
5196 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
5197 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
5198 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
5200 return op0;
5202 case VECTOR_CST:
5204 unsigned HOST_WIDE_INT i, nelts;
5206 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
5207 return NULL;
5209 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5211 for (i = 0; i < nelts; ++i)
5213 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5214 if (!op1)
5215 return NULL;
5216 XVECEXP (op0, 0, i) = op1;
5219 return op0;
5222 case CONSTRUCTOR:
5223 if (TREE_CLOBBER_P (exp))
5224 return NULL;
5225 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5227 unsigned i;
5228 unsigned HOST_WIDE_INT nelts;
5229 tree val;
5231 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5232 goto flag_unsupported;
5234 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5236 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5238 op1 = expand_debug_expr (val);
5239 if (!op1)
5240 return NULL;
5241 XVECEXP (op0, 0, i) = op1;
5244 if (i < nelts)
5246 op1 = expand_debug_expr
5247 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5249 if (!op1)
5250 return NULL;
5252 for (; i < nelts; i++)
5253 XVECEXP (op0, 0, i) = op1;
5256 return op0;
5258 else
5259 goto flag_unsupported;
5261 case CALL_EXPR:
5262 /* ??? Maybe handle some builtins? */
5263 return NULL;
5265 case SSA_NAME:
5267 gimple *g = get_gimple_for_ssa_name (exp);
5268 if (g)
5270 tree t = NULL_TREE;
5271 if (deep_ter_debug_map)
5273 tree *slot = deep_ter_debug_map->get (exp);
5274 if (slot)
5275 t = *slot;
5277 if (t == NULL_TREE)
5278 t = gimple_assign_rhs_to_tree (g);
5279 op0 = expand_debug_expr (t);
5280 if (!op0)
5281 return NULL;
5283 else
5285 /* If this is a reference to an incoming value of
5286 parameter that is never used in the code or where the
5287 incoming value is never used in the code, use
5288 PARM_DECL's DECL_RTL if set. */
5289 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5290 && SSA_NAME_VAR (exp)
5291 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5292 && has_zero_uses (exp))
5294 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5295 if (op0)
5296 goto adjust_mode;
5297 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5298 if (op0)
5299 goto adjust_mode;
5302 int part = var_to_partition (SA.map, exp);
5304 if (part == NO_PARTITION)
5305 return NULL;
5307 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5309 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5311 goto adjust_mode;
5314 case ERROR_MARK:
5315 return NULL;
5317 /* Vector stuff. For most of the codes we don't have rtl codes. */
5318 case REALIGN_LOAD_EXPR:
5319 case VEC_COND_EXPR:
5320 case VEC_PACK_FIX_TRUNC_EXPR:
5321 case VEC_PACK_FLOAT_EXPR:
5322 case VEC_PACK_SAT_EXPR:
5323 case VEC_PACK_TRUNC_EXPR:
5324 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5325 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5326 case VEC_UNPACK_FLOAT_HI_EXPR:
5327 case VEC_UNPACK_FLOAT_LO_EXPR:
5328 case VEC_UNPACK_HI_EXPR:
5329 case VEC_UNPACK_LO_EXPR:
5330 case VEC_WIDEN_MULT_HI_EXPR:
5331 case VEC_WIDEN_MULT_LO_EXPR:
5332 case VEC_WIDEN_MULT_EVEN_EXPR:
5333 case VEC_WIDEN_MULT_ODD_EXPR:
5334 case VEC_WIDEN_LSHIFT_HI_EXPR:
5335 case VEC_WIDEN_LSHIFT_LO_EXPR:
5336 case VEC_PERM_EXPR:
5337 case VEC_DUPLICATE_EXPR:
5338 case VEC_SERIES_EXPR:
5339 case SAD_EXPR:
5340 return NULL;
5342 /* Misc codes. */
5343 case ADDR_SPACE_CONVERT_EXPR:
5344 case FIXED_CONVERT_EXPR:
5345 case OBJ_TYPE_REF:
5346 case WITH_SIZE_EXPR:
5347 case BIT_INSERT_EXPR:
5348 return NULL;
5350 case DOT_PROD_EXPR:
5351 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5352 && SCALAR_INT_MODE_P (mode))
5355 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5356 0)))
5357 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5358 inner_mode);
5360 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5361 1)))
5362 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5363 inner_mode);
5364 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5365 return simplify_gen_binary (PLUS, mode, op0, op2);
5367 return NULL;
5369 case WIDEN_MULT_EXPR:
5370 case WIDEN_MULT_PLUS_EXPR:
5371 case WIDEN_MULT_MINUS_EXPR:
5372 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5373 && SCALAR_INT_MODE_P (mode))
5375 inner_mode = GET_MODE (op0);
5376 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5377 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5378 else
5379 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5380 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5381 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5382 else
5383 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5384 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5385 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5386 return op0;
5387 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5388 return simplify_gen_binary (PLUS, mode, op0, op2);
5389 else
5390 return simplify_gen_binary (MINUS, mode, op2, op0);
5392 return NULL;
5394 case MULT_HIGHPART_EXPR:
5395 /* ??? Similar to the above. */
5396 return NULL;
5398 case WIDEN_SUM_EXPR:
5399 case WIDEN_LSHIFT_EXPR:
5400 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5401 && SCALAR_INT_MODE_P (mode))
5404 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5405 0)))
5406 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5407 inner_mode);
5408 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5409 ? ASHIFT : PLUS, mode, op0, op1);
5411 return NULL;
5413 default:
5414 flag_unsupported:
5415 if (flag_checking)
5417 debug_tree (exp);
5418 gcc_unreachable ();
5420 return NULL;
5424 /* Return an RTX equivalent to the source bind value of the tree expression
5425 EXP. */
5427 static rtx
5428 expand_debug_source_expr (tree exp)
5430 rtx op0 = NULL_RTX;
5431 machine_mode mode = VOIDmode, inner_mode;
5433 switch (TREE_CODE (exp))
5435 case VAR_DECL:
5436 if (DECL_ABSTRACT_ORIGIN (exp))
5437 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5438 break;
5439 case PARM_DECL:
5441 mode = DECL_MODE (exp);
5442 op0 = expand_debug_parm_decl (exp);
5443 if (op0)
5444 break;
5445 /* See if this isn't an argument that has been completely
5446 optimized out. */
5447 if (!DECL_RTL_SET_P (exp)
5448 && !DECL_INCOMING_RTL (exp)
5449 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5451 tree aexp = DECL_ORIGIN (exp);
5452 if (DECL_CONTEXT (aexp)
5453 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5455 vec<tree, va_gc> **debug_args;
5456 unsigned int ix;
5457 tree ddecl;
5458 debug_args = decl_debug_args_lookup (current_function_decl);
5459 if (debug_args != NULL)
5461 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5462 ix += 2)
5463 if (ddecl == aexp)
5464 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5468 break;
5470 default:
5471 break;
5474 if (op0 == NULL_RTX)
5475 return NULL_RTX;
5477 inner_mode = GET_MODE (op0);
5478 if (mode == inner_mode)
5479 return op0;
5481 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5483 if (GET_MODE_UNIT_BITSIZE (mode)
5484 == GET_MODE_UNIT_BITSIZE (inner_mode))
5485 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5486 else if (GET_MODE_UNIT_BITSIZE (mode)
5487 < GET_MODE_UNIT_BITSIZE (inner_mode))
5488 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5489 else
5490 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5492 else if (FLOAT_MODE_P (mode))
5493 gcc_unreachable ();
5494 else if (FLOAT_MODE_P (inner_mode))
5496 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5497 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5498 else
5499 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5501 else if (GET_MODE_UNIT_PRECISION (mode)
5502 == GET_MODE_UNIT_PRECISION (inner_mode))
5503 op0 = lowpart_subreg (mode, op0, inner_mode);
5504 else if (GET_MODE_UNIT_PRECISION (mode)
5505 < GET_MODE_UNIT_PRECISION (inner_mode))
5506 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5507 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5508 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5509 else
5510 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5512 return op0;
5515 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5516 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5517 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5519 static void
5520 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5522 rtx exp = *exp_p;
5524 if (exp == NULL_RTX)
5525 return;
5527 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5528 return;
5530 if (depth == 4)
5532 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5533 rtx dval = make_debug_expr_from_rtl (exp);
5535 /* Emit a debug bind insn before INSN. */
5536 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5537 DEBUG_EXPR_TREE_DECL (dval), exp,
5538 VAR_INIT_STATUS_INITIALIZED);
5540 emit_debug_insn_before (bind, insn);
5541 *exp_p = dval;
5542 return;
5545 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5546 int i, j;
5547 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5548 switch (*format_ptr++)
5550 case 'e':
5551 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5552 break;
5554 case 'E':
5555 case 'V':
5556 for (j = 0; j < XVECLEN (exp, i); j++)
5557 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5558 break;
5560 default:
5561 break;
5565 /* Expand the _LOCs in debug insns. We run this after expanding all
5566 regular insns, so that any variables referenced in the function
5567 will have their DECL_RTLs set. */
5569 static void
5570 expand_debug_locations (void)
5572 rtx_insn *insn;
5573 rtx_insn *last = get_last_insn ();
5574 int save_strict_alias = flag_strict_aliasing;
5576 /* New alias sets while setting up memory attributes cause
5577 -fcompare-debug failures, even though it doesn't bring about any
5578 codegen changes. */
5579 flag_strict_aliasing = 0;
5581 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5582 if (DEBUG_BIND_INSN_P (insn))
5584 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5585 rtx val;
5586 rtx_insn *prev_insn, *insn2;
5587 machine_mode mode;
5589 if (value == NULL_TREE)
5590 val = NULL_RTX;
5591 else
5593 if (INSN_VAR_LOCATION_STATUS (insn)
5594 == VAR_INIT_STATUS_UNINITIALIZED)
5595 val = expand_debug_source_expr (value);
5596 /* The avoid_deep_ter_for_debug function inserts
5597 debug bind stmts after SSA_NAME definition, with the
5598 SSA_NAME as the whole bind location. Disable temporarily
5599 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5600 being defined in this DEBUG_INSN. */
5601 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5603 tree *slot = deep_ter_debug_map->get (value);
5604 if (slot)
5606 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5607 *slot = NULL_TREE;
5608 else
5609 slot = NULL;
5611 val = expand_debug_expr (value);
5612 if (slot)
5613 *slot = INSN_VAR_LOCATION_DECL (insn);
5615 else
5616 val = expand_debug_expr (value);
5617 gcc_assert (last == get_last_insn ());
5620 if (!val)
5621 val = gen_rtx_UNKNOWN_VAR_LOC ();
5622 else
5624 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5626 gcc_assert (mode == GET_MODE (val)
5627 || (GET_MODE (val) == VOIDmode
5628 && (CONST_SCALAR_INT_P (val)
5629 || GET_CODE (val) == CONST_FIXED
5630 || GET_CODE (val) == LABEL_REF)));
5633 INSN_VAR_LOCATION_LOC (insn) = val;
5634 prev_insn = PREV_INSN (insn);
5635 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5636 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5639 flag_strict_aliasing = save_strict_alias;
5642 /* Performs swapping operands of commutative operations to expand
5643 the expensive one first. */
5645 static void
5646 reorder_operands (basic_block bb)
5648 unsigned int *lattice; /* Hold cost of each statement. */
5649 unsigned int i = 0, n = 0;
5650 gimple_stmt_iterator gsi;
5651 gimple_seq stmts;
5652 gimple *stmt;
5653 bool swap;
5654 tree op0, op1;
5655 ssa_op_iter iter;
5656 use_operand_p use_p;
5657 gimple *def0, *def1;
5659 /* Compute cost of each statement using estimate_num_insns. */
5660 stmts = bb_seq (bb);
5661 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5663 stmt = gsi_stmt (gsi);
5664 if (!is_gimple_debug (stmt))
5665 gimple_set_uid (stmt, n++);
5667 lattice = XNEWVEC (unsigned int, n);
5668 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5670 unsigned cost;
5671 stmt = gsi_stmt (gsi);
5672 if (is_gimple_debug (stmt))
5673 continue;
5674 cost = estimate_num_insns (stmt, &eni_size_weights);
5675 lattice[i] = cost;
5676 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5678 tree use = USE_FROM_PTR (use_p);
5679 gimple *def_stmt;
5680 if (TREE_CODE (use) != SSA_NAME)
5681 continue;
5682 def_stmt = get_gimple_for_ssa_name (use);
5683 if (!def_stmt)
5684 continue;
5685 lattice[i] += lattice[gimple_uid (def_stmt)];
5687 i++;
5688 if (!is_gimple_assign (stmt)
5689 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5690 continue;
5691 op0 = gimple_op (stmt, 1);
5692 op1 = gimple_op (stmt, 2);
5693 if (TREE_CODE (op0) != SSA_NAME
5694 || TREE_CODE (op1) != SSA_NAME)
5695 continue;
5696 /* Swap operands if the second one is more expensive. */
5697 def0 = get_gimple_for_ssa_name (op0);
5698 def1 = get_gimple_for_ssa_name (op1);
5699 if (!def1)
5700 continue;
5701 swap = false;
5702 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5703 swap = true;
5704 if (swap)
5706 if (dump_file && (dump_flags & TDF_DETAILS))
5708 fprintf (dump_file, "Swap operands in stmt:\n");
5709 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5710 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5711 def0 ? lattice[gimple_uid (def0)] : 0,
5712 lattice[gimple_uid (def1)]);
5714 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5715 gimple_assign_rhs2_ptr (stmt));
5718 XDELETE (lattice);
5721 /* Expand basic block BB from GIMPLE trees to RTL. */
/* BB's GIMPLE statement sequence is detached from the block and expanded
   statement by statement.  When DISABLE_TAIL_CALLS is true, the tail-call
   flag is cleared on a call statement before it is expanded.  The function
   returns early with the block handed back by expand_gimple_cond when that
   is non-null, or with the block handed back by expand_gimple_tailcall when
   that is non-null and cannot fall through.  Otherwise it returns the block
   being expanded, after recording its BB_END.  */
5723 static basic_block
5724 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5726 gimple_stmt_iterator gsi;
5727 gimple_seq stmts;
5728 gimple *stmt = NULL;
5729 rtx_note *note = NULL;
5730 rtx_insn *last;
5731 edge e;
5732 edge_iterator ei;
5734 if (dump_file)
5735 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5736 bb->index);
5738 /* Note that since we are now transitioning from GIMPLE to RTL, we
5739 cannot use the gsi_*_bb() routines because they expect the basic
5740 block to be in GIMPLE, instead of RTL. Therefore, we need to
5741 access the BB sequence directly. */
5742 if (optimize)
5743 reorder_operands (bb);
5744 stmts = bb_seq (bb);
5745 bb->il.gimple.seq = NULL;
5746 bb->il.gimple.phi_nodes = NULL;
5747 rtl_profile_for_bb (bb);
5748 init_rtl_bb_info (bb);
5749 bb->flags |= BB_RTL;
5751 /* Remove the RETURN_EXPR if we may fall through to the exit
5752 instead. */
5753 gsi = gsi_last (stmts);
5754 if (!gsi_end_p (gsi)
5755 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5757 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5759 gcc_assert (single_succ_p (bb));
5760 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5762 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5763 && !gimple_return_retval (ret_stmt))
5765 gsi_remove (&gsi, false);
5766 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
/* STMT is kept only if the first statement is a GIMPLE_LABEL; that label,
   and any label recorded for BB in lab_rtx_for_bb, is emitted first so
   that the block head is a label followed by the basic block note.  */
5770 gsi = gsi_start (stmts);
5771 if (!gsi_end_p (gsi))
5773 stmt = gsi_stmt (gsi);
5774 if (gimple_code (stmt) != GIMPLE_LABEL)
5775 stmt = NULL;
5778 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5780 if (stmt || elt)
5782 gcc_checking_assert (!note);
5783 last = get_last_insn ();
5785 if (stmt)
5787 expand_gimple_stmt (stmt);
5788 gsi_next (&gsi);
5791 if (elt)
5792 emit_label (*elt);
5794 BB_HEAD (bb) = NEXT_INSN (last);
5795 if (NOTE_P (BB_HEAD (bb)))
5796 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5797 gcc_assert (LABEL_P (BB_HEAD (bb)));
5798 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5800 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5802 else
5803 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5805 if (note)
5806 NOTE_BASIC_BLOCK (note) = bb;
5808 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5810 basic_block new_bb;
5812 stmt = gsi_stmt (gsi);
5814 /* If this statement is a non-debug one, and we generate debug
5815 insns, then this one might be the last real use of a TERed
5816 SSA_NAME, but where there are still some debug uses further
5817 down. Expanding the current SSA name in such further debug
5818 uses by their RHS might lead to wrong debug info, as coalescing
5819 might make the operands of such RHS be placed into the same
5820 pseudo as something else. Like so:
5821 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5822 use(a_1);
5823 a_2 = ...
5824 #DEBUG ... => a_1
5825 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5826 If we now would expand a_1 by its RHS (a_0 + 1) in the debug use,
5827 the write to a_2 would actually have clobbered the place which
5828 formerly held a_0.
5830 So, instead of that, we recognize the situation, and generate
5831 debug temporaries at the last real use of TERed SSA names:
5832 a_1 = a_0 + 1;
5833 #DEBUG #D1 => a_1
5834 use(a_1);
5835 a_2 = ...
5836 #DEBUG ... => #D1
5838 if (MAY_HAVE_DEBUG_BIND_INSNS
5839 && SA.values
5840 && !is_gimple_debug (stmt))
5842 ssa_op_iter iter;
5843 tree op;
5844 gimple *def;
5846 location_t sloc = curr_insn_location ();
5848 /* Look for SSA names that have their last use here (TERed
5849 names always have only one real use). */
5850 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5851 if ((def = get_gimple_for_ssa_name (op)))
5853 imm_use_iterator imm_iter;
5854 use_operand_p use_p;
5855 bool have_debug_uses = false;
5857 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5859 if (gimple_debug_bind_p (USE_STMT (use_p)))
5861 have_debug_uses = true;
5862 break;
5866 if (have_debug_uses)
5868 /* OP is a TERed SSA name, with DEF its defining
5869 statement, and where OP is used in further debug
5870 instructions. Generate a debug temporary, and
5871 replace all uses of OP in debug insns with that
5872 temporary. */
5873 gimple *debugstmt;
5874 tree value = gimple_assign_rhs_to_tree (def);
5875 tree vexpr = make_node (DEBUG_EXPR_DECL);
5876 rtx val;
5877 machine_mode mode;
5879 set_curr_insn_location (gimple_location (def));
5881 DECL_ARTIFICIAL (vexpr) = 1;
5882 TREE_TYPE (vexpr) = TREE_TYPE (value);
5883 if (DECL_P (value))
5884 mode = DECL_MODE (value);
5885 else
5886 mode = TYPE_MODE (TREE_TYPE (value));
5887 SET_DECL_MODE (vexpr, mode);
/* The location operand temporarily holds the tree VALUE cast to rtx.  */
5889 val = gen_rtx_VAR_LOCATION
5890 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5892 emit_debug_insn (val);
5894 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5896 if (!gimple_debug_bind_p (debugstmt))
5897 continue;
5899 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5900 SET_USE (use_p, vexpr);
5902 update_stmt (debugstmt);
5906 set_curr_insn_location (sloc);
5909 currently_expanding_gimple_stmt = stmt;
5911 /* Expand this statement, then evaluate the resulting RTL and
5912 fixup the CFG accordingly. */
5913 if (gimple_code (stmt) == GIMPLE_COND)
5915 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5916 if (new_bb)
5917 return new_bb;
5919 else if (is_gimple_debug (stmt))
5921 location_t sloc = curr_insn_location ();
5922 gimple_stmt_iterator nsi = gsi;
/* Handle this debug statement and every debug statement that directly
   follows it in one go; NSI runs one statement ahead of GSI.  */
5924 for (;;)
5926 tree var;
5927 tree value = NULL_TREE;
5928 rtx val = NULL_RTX;
5929 machine_mode mode;
5931 if (!gimple_debug_nonbind_marker_p (stmt))
5933 if (gimple_debug_bind_p (stmt))
5935 var = gimple_debug_bind_get_var (stmt);
5937 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5938 && TREE_CODE (var) != LABEL_DECL
5939 && !target_for_debug_bind (var))
5940 goto delink_debug_stmt;
5942 if (DECL_P (var) && !VECTOR_TYPE_P (TREE_TYPE (var)))
5943 mode = DECL_MODE (var);
5944 else
5945 mode = TYPE_MODE (TREE_TYPE (var));
5947 if (gimple_debug_bind_has_value_p (stmt))
5948 value = gimple_debug_bind_get_value (stmt);
5950 val = gen_rtx_VAR_LOCATION
5951 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5953 else if (gimple_debug_source_bind_p (stmt))
5955 var = gimple_debug_source_bind_get_var (stmt);
5957 value = gimple_debug_source_bind_get_value (stmt);
5959 if (!VECTOR_TYPE_P (TREE_TYPE (var)))
5960 mode = DECL_MODE (var);
5961 else
5962 mode = TYPE_MODE (TREE_TYPE (var));
5964 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5965 VAR_INIT_STATUS_UNINITIALIZED);
5967 else
5968 gcc_unreachable ();
5970 /* If this function was first compiled with markers
5971 enabled, but they're now disabled (e.g. LTO), drop
5972 them on the floor. */
5973 else if (gimple_debug_nonbind_marker_p (stmt)
5974 && !MAY_HAVE_DEBUG_MARKER_INSNS)
5975 goto delink_debug_stmt;
5976 else if (gimple_debug_begin_stmt_p (stmt))
5977 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
5978 else if (gimple_debug_inline_entry_p (stmt))
5979 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
5980 else
5981 gcc_unreachable ();
5983 last = get_last_insn ();
5985 set_curr_insn_location (gimple_location (stmt));
5987 emit_debug_insn (val);
5989 if (dump_file && (dump_flags & TDF_DETAILS))
5991 /* We can't dump the insn with a TREE where an RTX
5992 is expected. */
5993 if (GET_CODE (val) == VAR_LOCATION)
5995 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
5996 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5998 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5999 if (GET_CODE (val) == VAR_LOCATION)
6000 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
6003 delink_debug_stmt:
6004 /* In order not to generate too many debug temporaries,
6005 we delink all uses of debug statements we already expanded.
6006 Therefore debug statements between definition and real
6007 use of TERed SSA names will continue to use the SSA name,
6008 and not be replaced with debug temps. */
6009 delink_stmt_imm_use (stmt);
/* Advance; leave the loop at the end of the sequence or at the first
   statement that is not a debug statement, with GSI still pointing at
   the last debug statement handled.  */
6011 gsi = nsi;
6012 gsi_next (&nsi);
6013 if (gsi_end_p (nsi))
6014 break;
6015 stmt = gsi_stmt (nsi);
6016 if (!is_gimple_debug (stmt))
6017 break;
6020 set_curr_insn_location (sloc);
6022 else
6024 gcall *call_stmt = dyn_cast <gcall *> (stmt);
6025 if (call_stmt
6026 && gimple_call_tail_p (call_stmt)
6027 && disable_tail_calls)
6028 gimple_call_set_tail (call_stmt, false);
6030 if (call_stmt && gimple_call_tail_p (call_stmt))
6032 bool can_fallthru;
6033 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
6034 if (new_bb)
6036 if (can_fallthru)
6037 bb = new_bb;
6038 else
6039 return new_bb;
6042 else
6044 def_operand_p def_p;
6045 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
6047 if (def_p != NULL)
6049 /* Ignore this stmt if it is in the list of
6050 replaceable expressions. */
6051 if (SA.values
6052 && bitmap_bit_p (SA.values,
6053 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
6054 continue;
6056 last = expand_gimple_stmt (stmt);
6057 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6062 currently_expanding_gimple_stmt = NULL;
6064 /* Expand implicit goto and convert goto_locus. */
6065 FOR_EACH_EDGE (e, ei, bb->succs)
6067 if (e->goto_locus != UNKNOWN_LOCATION || !stmt)
6068 set_curr_insn_location (e->goto_locus);
6069 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
6071 emit_jump (label_rtx_for_bb (e->dest));
6072 e->flags &= ~EDGE_FALLTHRU;
6076 /* Expanded RTL can create a jump in the last instruction of block.
6077 This later might be assumed to be a jump to successor and break edge insertion.
6078 We need to insert dummy move to prevent this. PR41440. */
6079 if (single_succ_p (bb)
6080 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
6081 && (last = get_last_insn ())
6082 && (JUMP_P (last)
6083 || (DEBUG_INSN_P (last)
6084 && JUMP_P (prev_nondebug_insn (last)))))
6086 rtx dummy = gen_reg_rtx (SImode);
6087 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
6090 do_pending_stack_adjust ();
6092 /* Find the block tail. The last insn in the block is the insn
6093 before a barrier and/or table jump insn. */
6094 last = get_last_insn ();
6095 if (BARRIER_P (last))
6096 last = PREV_INSN (last);
6097 if (JUMP_TABLE_DATA_P (last))
6098 last = PREV_INSN (PREV_INSN (last));
6099 if (BARRIER_P (last))
6100 last = PREV_INSN (last);
6101 BB_END (bb) = last;
6103 update_bb_for_insn (bb);
6105 return bb;
6109 /* Create a basic block for initialization code. */
6111 static basic_block
6112 construct_init_block (void)
6114 basic_block init_block, first_block;
6115 edge e = NULL;
6116 int flags;
6118 /* Multiple entry points not supported yet. */
6119 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
6120 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
6121 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
6122 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6123 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6125 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
6127 /* When entry edge points to first basic block, we don't need jump,
6128 otherwise we have to jump into proper target. */
6129 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
6131 tree label = gimple_block_label (e->dest);
6133 emit_jump (jump_target_rtx (label));
6134 flags = 0;
6136 else
6137 flags = EDGE_FALLTHRU;
6139 init_block = create_basic_block (NEXT_INSN (get_insns ()),
6140 get_last_insn (),
6141 ENTRY_BLOCK_PTR_FOR_FN (cfun));
6142 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
6143 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6144 if (e)
6146 first_block = e->dest;
6147 redirect_edge_succ (e, init_block);
6148 make_single_succ_edge (init_block, first_block, flags);
6150 else
6151 make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6152 EDGE_FALLTHRU);
6154 update_bb_for_insn (init_block);
6155 return init_block;
6158 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
6159 found in the block tree. */
6161 static void
6162 set_block_levels (tree block, int level)
6164 while (block)
6166 BLOCK_NUMBER (block) = level;
6167 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
6168 block = BLOCK_CHAIN (block);
6172 /* Create a block containing landing pads and similar stuff. */
6174 static void
6175 construct_exit_block (void)
6177 rtx_insn *head = get_last_insn ();
6178 rtx_insn *end;
6179 basic_block exit_block;
6180 edge e, e2;
6181 unsigned ix;
6182 edge_iterator ei;
6183 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
6184 rtx_insn *orig_end = BB_END (prev_bb);
6186 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
6188 /* Make sure the locus is set to the end of the function, so that
6189 epilogue line numbers and warnings are set properly. */
6190 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
6191 input_location = cfun->function_end_locus;
6193 /* Generate rtl for function exit. */
6194 expand_function_end ();
6196 end = get_last_insn ();
6197 if (head == end)
6198 return;
6199 /* While emitting the function end we could move end of the last basic
6200 block. */
6201 BB_END (prev_bb) = orig_end;
6202 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
6203 head = NEXT_INSN (head);
6204 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
6205 bb count counting will be confused. Any instructions before that
6206 label are emitted for the case where PREV_BB falls through into the
6207 exit block, so append those instructions to prev_bb in that case. */
6208 if (NEXT_INSN (head) != return_label)
6210 while (NEXT_INSN (head) != return_label)
6212 if (!NOTE_P (NEXT_INSN (head)))
6213 BB_END (prev_bb) = NEXT_INSN (head);
6214 head = NEXT_INSN (head);
6217 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6218 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6219 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6221 ix = 0;
6222 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6224 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6225 if (!(e->flags & EDGE_ABNORMAL))
6226 redirect_edge_succ (e, exit_block);
6227 else
6228 ix++;
6231 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6232 EDGE_FALLTHRU);
6233 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6234 if (e2 != e)
6236 exit_block->count -= e2->count ();
6238 update_bb_for_insn (exit_block);
6241 /* Helper function for discover_nonconstant_array_refs.
6242 Look for ARRAY_REF nodes with non-constant indexes and mark them
6243 addressable. */
6245 static tree
6246 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6247 void *data)
6249 tree t = *tp;
6250 bitmap forced_stack_vars = (bitmap)((walk_stmt_info *)data)->info;
6252 if (IS_TYPE_OR_DECL_P (t))
6253 *walk_subtrees = 0;
6254 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6256 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6257 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6258 && (!TREE_OPERAND (t, 2)
6259 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6260 || (TREE_CODE (t) == COMPONENT_REF
6261 && (!TREE_OPERAND (t,2)
6262 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6263 || TREE_CODE (t) == BIT_FIELD_REF
6264 || TREE_CODE (t) == REALPART_EXPR
6265 || TREE_CODE (t) == IMAGPART_EXPR
6266 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6267 || CONVERT_EXPR_P (t))
6268 t = TREE_OPERAND (t, 0);
6270 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6272 t = get_base_address (t);
6273 if (t && DECL_P (t)
6274 && DECL_MODE (t) != BLKmode
6275 && !TREE_ADDRESSABLE (t))
6276 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6279 *walk_subtrees = 0;
6281 /* References of size POLY_INT_CST to a fixed-size object must go
6282 through memory. It's more efficient to force that here than
6283 to create temporary slots on the fly.
6284 RTL expansion expectes TARGET_MEM_REF to always address actual memory. */
6285 else if (TREE_CODE (t) == TARGET_MEM_REF
6286 || (TREE_CODE (t) == MEM_REF
6287 && TYPE_SIZE (TREE_TYPE (t))
6288 && POLY_INT_CST_P (TYPE_SIZE (TREE_TYPE (t)))))
6290 tree base = get_base_address (t);
6291 if (base
6292 && DECL_P (base)
6293 && !TREE_ADDRESSABLE (base)
6294 && DECL_MODE (base) != BLKmode
6295 && GET_MODE_SIZE (DECL_MODE (base)).is_constant ())
6296 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6297 *walk_subtrees = 0;
6300 return NULL_TREE;
6303 /* If there's a chance to get a pseudo for t then if it would be of float mode
6304 and the actual access is via an integer mode (lowered memcpy or similar
6305 access) then avoid the register expansion if the mode likely is not storage
6306 suitable for raw bits processing (like XFmode on i?86). */
6308 static void
6309 avoid_type_punning_on_regs (tree t, bitmap forced_stack_vars)
6311 machine_mode access_mode = TYPE_MODE (TREE_TYPE (t));
6312 if (access_mode != BLKmode
6313 && !SCALAR_INT_MODE_P (access_mode))
6314 return;
6315 tree base = get_base_address (t);
6316 if (DECL_P (base)
6317 && !TREE_ADDRESSABLE (base)
6318 && FLOAT_MODE_P (DECL_MODE (base))
6319 && maybe_lt (GET_MODE_PRECISION (DECL_MODE (base)),
6320 GET_MODE_BITSIZE (GET_MODE_INNER (DECL_MODE (base))))
6321 /* Double check in the expensive way we really would get a pseudo. */
6322 && use_register_for_decl (base))
6323 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6326 /* RTL expansion is not able to compile array references with variable
6327 offsets for arrays stored in single register. Discover such
6328 expressions and mark variables as addressable to avoid this
6329 scenario. */
6331 static void
6332 discover_nonconstant_array_refs (bitmap forced_stack_vars)
6334 basic_block bb;
6335 gimple_stmt_iterator gsi;
6337 walk_stmt_info wi = {};
6338 wi.info = forced_stack_vars;
6339 FOR_EACH_BB_FN (bb, cfun)
6340 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6342 gimple *stmt = gsi_stmt (gsi);
6343 if (!is_gimple_debug (stmt))
6345 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, &wi);
6346 gcall *call = dyn_cast <gcall *> (stmt);
6347 if (call && gimple_call_internal_p (call))
6349 tree cand = NULL_TREE;
6350 switch (gimple_call_internal_fn (call))
6352 case IFN_LOAD_LANES:
6353 /* The source must be a MEM. */
6354 cand = gimple_call_arg (call, 0);
6355 break;
6356 case IFN_STORE_LANES:
6357 /* The destination must be a MEM. */
6358 cand = gimple_call_lhs (call);
6359 break;
6360 default:
6361 break;
6363 if (cand)
6364 cand = get_base_address (cand);
6365 if (cand
6366 && DECL_P (cand)
6367 && use_register_for_decl (cand))
6368 bitmap_set_bit (forced_stack_vars, DECL_UID (cand));
6370 if (gimple_vdef (stmt))
6372 tree t = gimple_get_lhs (stmt);
6373 if (t && REFERENCE_CLASS_P (t))
6374 avoid_type_punning_on_regs (t, forced_stack_vars);
6380 /* This function sets crtl->args.internal_arg_pointer to a virtual
6381 register if DRAP is needed. Local register allocator will replace
6382 virtual_incoming_args_rtx with the virtual register. */
6384 static void
6385 expand_stack_alignment (void)
6387 rtx drap_rtx;
6388 unsigned int preferred_stack_boundary;
6390 if (! SUPPORTS_STACK_ALIGNMENT)
6391 return;
6393 if (cfun->calls_alloca
6394 || cfun->has_nonlocal_label
6395 || crtl->has_nonlocal_goto)
6396 crtl->need_drap = true;
6398 /* Call update_stack_boundary here again to update incoming stack
6399 boundary. It may set incoming stack alignment to a different
6400 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6401 use the minimum incoming stack alignment to check if it is OK
6402 to perform sibcall optimization since sibcall optimization will
6403 only align the outgoing stack to incoming stack boundary. */
6404 if (targetm.calls.update_stack_boundary)
6405 targetm.calls.update_stack_boundary ();
6407 /* The incoming stack frame has to be aligned at least at
6408 parm_stack_boundary. */
6409 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6411 /* Update crtl->stack_alignment_estimated and use it later to align
6412 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6413 exceptions since callgraph doesn't collect incoming stack alignment
6414 in this case. */
6415 if (cfun->can_throw_non_call_exceptions
6416 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6417 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6418 else
6419 preferred_stack_boundary = crtl->preferred_stack_boundary;
6420 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6421 crtl->stack_alignment_estimated = preferred_stack_boundary;
6422 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6423 crtl->stack_alignment_needed = preferred_stack_boundary;
6425 gcc_assert (crtl->stack_alignment_needed
6426 <= crtl->stack_alignment_estimated);
6428 crtl->stack_realign_needed
6429 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6430 crtl->stack_realign_tried = crtl->stack_realign_needed;
6432 crtl->stack_realign_processed = true;
6434 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6435 alignment. */
6436 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6437 drap_rtx = targetm.calls.get_drap_rtx ();
6439 /* stack_realign_drap and drap_rtx must match. */
6440 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6442 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6443 if (drap_rtx != NULL)
6445 crtl->args.internal_arg_pointer = drap_rtx;
6447 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6448 needed. */
6449 fixup_tail_calls ();
6454 static void
6455 expand_main_function (void)
6457 #if (defined(INVOKE__main) \
6458 || (!defined(HAS_INIT_SECTION) \
6459 && !defined(INIT_SECTION_ASM_OP) \
6460 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6461 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6462 #endif
6466 /* Expand code to initialize the stack_protect_guard. This is invoked at
6467 the beginning of a function to be protected. */
6469 static void
6470 stack_protect_prologue (void)
6472 tree guard_decl = targetm.stack_protect_guard ();
6473 rtx x, y;
6475 crtl->stack_protect_guard_decl = guard_decl;
6476 x = expand_normal (crtl->stack_protect_guard);
6478 if (targetm.have_stack_protect_combined_set () && guard_decl)
6480 gcc_assert (DECL_P (guard_decl));
6481 y = DECL_RTL (guard_decl);
6483 /* Allow the target to compute address of Y and copy it to X without
6484 leaking Y into a register. This combined address + copy pattern
6485 allows the target to prevent spilling of any intermediate results by
6486 splitting it after register allocator. */
6487 if (rtx_insn *insn = targetm.gen_stack_protect_combined_set (x, y))
6489 emit_insn (insn);
6490 return;
6494 if (guard_decl)
6495 y = expand_normal (guard_decl);
6496 else
6497 y = const0_rtx;
6499 /* Allow the target to copy from Y to X without leaking Y into a
6500 register. */
6501 if (targetm.have_stack_protect_set ())
6502 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6504 emit_insn (insn);
6505 return;
6508 /* Otherwise do a straight move. */
6509 emit_move_insn (x, y);
6512 /* Translate the intermediate representation contained in the CFG
6513 from GIMPLE trees to RTL.
6515 We do conversion per basic block and preserve/update the tree CFG.
6516 This implies we have to do some magic as the CFG can simultaneously
6517 consist of basic blocks containing RTL and GIMPLE trees. This can
6518 confuse the CFG hooks, so be careful to not manipulate CFG during
6519 the expansion. */
6521 namespace {
6523 const pass_data pass_data_expand =
6525 RTL_PASS, /* type */
6526 "expand", /* name */
6527 OPTGROUP_NONE, /* optinfo_flags */
6528 TV_EXPAND, /* tv_id */
6529 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6530 | PROP_gimple_lcx
6531 | PROP_gimple_lvec
6532 | PROP_gimple_lva), /* properties_required */
6533 PROP_rtl, /* properties_provided */
6534 ( PROP_ssa | PROP_gimple ), /* properties_destroyed */
6535 0, /* todo_flags_start */
6536 0, /* todo_flags_finish */
6539 class pass_expand : public rtl_opt_pass
6541 public:
6542 pass_expand (gcc::context *ctxt)
6543 : rtl_opt_pass (pass_data_expand, ctxt)
6546 /* opt_pass methods: */
6547 virtual unsigned int execute (function *);
6549 }; // class pass_expand
6551 unsigned int
6552 pass_expand::execute (function *fun)
6554 basic_block bb, init_block;
6555 edge_iterator ei;
6556 edge e;
6557 rtx_insn *var_seq, *var_ret_seq;
6558 unsigned i;
6560 timevar_push (TV_OUT_OF_SSA);
6561 rewrite_out_of_ssa (&SA);
6562 timevar_pop (TV_OUT_OF_SSA);
6563 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6565 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6567 gimple_stmt_iterator gsi;
6568 FOR_EACH_BB_FN (bb, cfun)
6569 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6570 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6571 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6574 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6575 auto_bitmap forced_stack_vars;
6576 discover_nonconstant_array_refs (forced_stack_vars);
6578 /* Make sure all values used by the optimization passes have sane
6579 defaults. */
6580 reg_renumber = 0;
6582 /* Some backends want to know that we are expanding to RTL. */
6583 currently_expanding_to_rtl = 1;
6584 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6585 free_dominance_info (CDI_DOMINATORS);
6587 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6589 insn_locations_init ();
6590 if (!DECL_IS_UNDECLARED_BUILTIN (current_function_decl))
6592 /* Eventually, all FEs should explicitly set function_start_locus. */
6593 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6594 set_curr_insn_location
6595 (DECL_SOURCE_LOCATION (current_function_decl));
6596 else
6597 set_curr_insn_location (fun->function_start_locus);
6599 else
6600 set_curr_insn_location (UNKNOWN_LOCATION);
6601 prologue_location = curr_insn_location ();
6603 #ifdef INSN_SCHEDULING
6604 init_sched_attrs ();
6605 #endif
6607 /* Make sure first insn is a note even if we don't want linenums.
6608 This makes sure the first insn will never be deleted.
6609 Also, final expects a note to appear there. */
6610 emit_note (NOTE_INSN_DELETED);
6612 targetm.expand_to_rtl_hook ();
6613 crtl->init_stack_alignment ();
6614 fun->cfg->max_jumptable_ents = 0;
6616 /* Resovle the function section. Some targets, like ARM EABI rely on knowledge
6617 of the function section at exapnsion time to predict distance of calls. */
6618 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6620 /* Expand the variables recorded during gimple lowering. */
6621 timevar_push (TV_VAR_EXPAND);
6622 start_sequence ();
6624 var_ret_seq = expand_used_vars (forced_stack_vars);
6626 var_seq = get_insns ();
6627 end_sequence ();
6628 timevar_pop (TV_VAR_EXPAND);
6630 /* Honor stack protection warnings. */
6631 if (warn_stack_protect)
6633 if (fun->calls_alloca)
6634 warning (OPT_Wstack_protector,
6635 "stack protector not protecting local variables: "
6636 "variable length buffer");
6637 if (has_short_buffer && !crtl->stack_protect_guard)
6638 warning (OPT_Wstack_protector,
6639 "stack protector not protecting function: "
6640 "all local arrays are less than %d bytes long",
6641 (int) param_ssp_buffer_size);
6644 /* Temporarily mark PARM_DECLs and RESULT_DECLs we need to expand to
6645 memory addressable so expand_function_start can emit the required
6646 copies. */
6647 auto_vec<tree, 16> marked_parms;
6648 for (tree parm = DECL_ARGUMENTS (current_function_decl); parm;
6649 parm = DECL_CHAIN (parm))
6650 if (!TREE_ADDRESSABLE (parm)
6651 && bitmap_bit_p (forced_stack_vars, DECL_UID (parm)))
6653 TREE_ADDRESSABLE (parm) = 1;
6654 marked_parms.safe_push (parm);
6656 if (DECL_RESULT (current_function_decl)
6657 && !TREE_ADDRESSABLE (DECL_RESULT (current_function_decl))
6658 && bitmap_bit_p (forced_stack_vars,
6659 DECL_UID (DECL_RESULT (current_function_decl))))
6661 TREE_ADDRESSABLE (DECL_RESULT (current_function_decl)) = 1;
6662 marked_parms.safe_push (DECL_RESULT (current_function_decl));
6665 /* Set up parameters and prepare for return, for the function. */
6666 expand_function_start (current_function_decl);
6668 /* Clear TREE_ADDRESSABLE again. */
6669 while (!marked_parms.is_empty ())
6670 TREE_ADDRESSABLE (marked_parms.pop ()) = 0;
6672 /* If we emitted any instructions for setting up the variables,
6673 emit them before the FUNCTION_START note. */
6674 if (var_seq)
6676 emit_insn_before (var_seq, parm_birth_insn);
6678 /* In expand_function_end we'll insert the alloca save/restore
6679 before parm_birth_insn. We've just insertted an alloca call.
6680 Adjust the pointer to match. */
6681 parm_birth_insn = var_seq;
6684 /* Now propagate the RTL assignment of each partition to the
6685 underlying var of each SSA_NAME. */
6686 tree name;
6688 FOR_EACH_SSA_NAME (i, name, cfun)
6690 /* We might have generated new SSA names in
6691 update_alias_info_with_stack_vars. They will have a NULL
6692 defining statements, and won't be part of the partitioning,
6693 so ignore those. */
6694 if (!SSA_NAME_DEF_STMT (name))
6695 continue;
6697 adjust_one_expanded_partition_var (name);
6700 /* Clean up RTL of variables that straddle across multiple
6701 partitions, and check that the rtl of any PARM_DECLs that are not
6702 cleaned up is that of their default defs. */
6703 FOR_EACH_SSA_NAME (i, name, cfun)
6705 int part;
6707 /* We might have generated new SSA names in
6708 update_alias_info_with_stack_vars. They will have a NULL
6709 defining statements, and won't be part of the partitioning,
6710 so ignore those. */
6711 if (!SSA_NAME_DEF_STMT (name))
6712 continue;
6713 part = var_to_partition (SA.map, name);
6714 if (part == NO_PARTITION)
6715 continue;
6717 /* If this decl was marked as living in multiple places, reset
6718 this now to NULL. */
6719 tree var = SSA_NAME_VAR (name);
6720 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6721 SET_DECL_RTL (var, NULL);
6722 /* Check that the pseudos chosen by assign_parms are those of
6723 the corresponding default defs. */
6724 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6725 && (TREE_CODE (var) == PARM_DECL
6726 || TREE_CODE (var) == RESULT_DECL))
6728 rtx in = DECL_RTL_IF_SET (var);
6729 gcc_assert (in);
6730 rtx out = SA.partition_to_pseudo[part];
6731 gcc_assert (in == out);
6733 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6734 those expected by debug backends for each parm and for
6735 the result. This is particularly important for stabs,
6736 whose register elimination from parm's DECL_RTL may cause
6737 -fcompare-debug differences as SET_DECL_RTL changes reg's
6738 attrs. So, make sure the RTL already has the parm as the
6739 EXPR, so that it won't change. */
6740 SET_DECL_RTL (var, NULL_RTX);
6741 if (MEM_P (in))
6742 set_mem_attributes (in, var, true);
6743 SET_DECL_RTL (var, in);
6747 /* If this function is `main', emit a call to `__main'
6748 to run global initializers, etc. */
6749 if (DECL_NAME (current_function_decl)
6750 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6751 && DECL_FILE_SCOPE_P (current_function_decl))
6752 expand_main_function ();
6754 /* Initialize the stack_protect_guard field. This must happen after the
6755 call to __main (if any) so that the external decl is initialized. */
6756 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6757 stack_protect_prologue ();
6759 expand_phi_nodes (&SA);
6761 /* Release any stale SSA redirection data. */
6762 redirect_edge_var_map_empty ();
6764 /* Register rtl specific functions for cfg. */
6765 rtl_register_cfg_hooks ();
6767 init_block = construct_init_block ();
6769 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6770 remaining edges later. */
6771 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6772 e->flags &= ~EDGE_EXECUTABLE;
6774 /* If the function has too many markers, drop them while expanding. */
6775 if (cfun->debug_marker_count
6776 >= param_max_debug_marker_count)
6777 cfun->debug_nonbind_markers = false;
6779 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6780 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6781 next_bb)
6782 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6784 if (MAY_HAVE_DEBUG_BIND_INSNS)
6785 expand_debug_locations ();
6787 if (deep_ter_debug_map)
6789 delete deep_ter_debug_map;
6790 deep_ter_debug_map = NULL;
6793 /* Free stuff we no longer need after GIMPLE optimizations. */
6794 free_dominance_info (CDI_DOMINATORS);
6795 free_dominance_info (CDI_POST_DOMINATORS);
6796 delete_tree_cfg_annotations (fun);
6798 timevar_push (TV_OUT_OF_SSA);
6799 finish_out_of_ssa (&SA);
6800 timevar_pop (TV_OUT_OF_SSA);
6802 timevar_push (TV_POST_EXPAND);
6803 /* We are no longer in SSA form. */
6804 fun->gimple_df->in_ssa_p = false;
6805 loops_state_clear (LOOP_CLOSED_SSA);
6807 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6808 conservatively to true until they are all profile aware. */
6809 delete lab_rtx_for_bb;
6810 free_histograms (fun);
6812 construct_exit_block ();
6813 insn_locations_finalize ();
6815 if (var_ret_seq)
6817 rtx_insn *after = return_label;
6818 rtx_insn *next = NEXT_INSN (after);
6819 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6820 after = next;
6821 emit_insn_after (var_ret_seq, after);
6824 if (hwasan_sanitize_stack_p ())
6825 hwasan_maybe_emit_frame_base_init ();
6827 /* Zap the tree EH table. */
6828 set_eh_throw_stmt_table (fun, NULL);
6830 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6831 split edges which edge insertions might do. */
6832 rebuild_jump_labels (get_insns ());
6834 /* If we have a single successor to the entry block, put the pending insns
6835 after parm birth, but before NOTE_INSNS_FUNCTION_BEG. */
6836 if (single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6838 edge e = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (fun));
6839 if (e->insns.r)
6841 rtx_insn *insns = e->insns.r;
6842 e->insns.r = NULL;
6843 rebuild_jump_labels_chain (insns);
6844 if (NOTE_P (parm_birth_insn)
6845 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6846 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6847 else
6848 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6852 /* Otherwise, as well as for other edges, take the usual way. */
6853 commit_edge_insertions ();
6855 /* We're done expanding trees to RTL. */
6856 currently_expanding_to_rtl = 0;
6858 flush_mark_addressable_queue ();
6860 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6861 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6863 edge e;
6864 edge_iterator ei;
6865 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6867 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6868 e->flags &= ~EDGE_EXECUTABLE;
6870 /* At the moment not all abnormal edges match the RTL
6871 representation. It is safe to remove them here as
6872 find_many_sub_basic_blocks will rediscover them.
6873 In the future we should get this fixed properly. */
6874 if ((e->flags & EDGE_ABNORMAL)
6875 && !(e->flags & EDGE_SIBCALL))
6876 remove_edge (e);
6877 else
6878 ei_next (&ei);
6882 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6883 bitmap_ones (blocks);
6884 find_many_sub_basic_blocks (blocks);
6885 purge_all_dead_edges ();
6887 /* After initial rtl generation, call back to finish generating
6888 exception support code. We need to do this before cleaning up
6889 the CFG as the code does not expect dead landing pads. */
6890 if (fun->eh->region_tree != NULL)
6891 finish_eh_generation ();
6893 /* Call expand_stack_alignment after finishing all
6894 updates to crtl->preferred_stack_boundary. */
6895 expand_stack_alignment ();
6897 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6898 function. */
6899 if (crtl->tail_call_emit)
6900 fixup_tail_calls ();
6902 HOST_WIDE_INT patch_area_size, patch_area_entry;
6903 parse_and_check_patch_area (flag_patchable_function_entry, false,
6904 &patch_area_size, &patch_area_entry);
6906 tree patchable_function_entry_attr
6907 = lookup_attribute ("patchable_function_entry",
6908 DECL_ATTRIBUTES (cfun->decl));
6909 if (patchable_function_entry_attr)
6911 tree pp_val = TREE_VALUE (patchable_function_entry_attr);
6912 tree patchable_function_entry_value1 = TREE_VALUE (pp_val);
6914 patch_area_size = tree_to_uhwi (patchable_function_entry_value1);
6915 patch_area_entry = 0;
6916 if (TREE_CHAIN (pp_val) != NULL_TREE)
6918 tree patchable_function_entry_value2
6919 = TREE_VALUE (TREE_CHAIN (pp_val));
6920 patch_area_entry = tree_to_uhwi (patchable_function_entry_value2);
6924 if (patch_area_entry > patch_area_size)
6926 if (patch_area_size > 0)
6927 warning (OPT_Wattributes,
6928 "patchable function entry %wu exceeds size %wu",
6929 patch_area_entry, patch_area_size);
6930 patch_area_entry = 0;
6933 crtl->patch_area_size = patch_area_size;
6934 crtl->patch_area_entry = patch_area_entry;
6936 /* BB subdivision may have created basic blocks that are only reachable
6937 from unlikely bbs but not marked as such in the profile. */
6938 if (optimize)
6939 propagate_unlikely_bbs_forward ();
6941 /* Remove unreachable blocks, otherwise we cannot compute dominators
6942 which are needed for loop state verification. As a side-effect
6943 this also compacts blocks.
6944 ??? We cannot remove trivially dead insns here as for example
6945 the DRAP reg on i?86 is not magically live at this point.
6946 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6947 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6949 checking_verify_flow_info ();
6951 /* Initialize pseudos allocated for hard registers. */
6952 emit_initial_value_sets ();
6954 /* And finally unshare all RTL. */
6955 unshare_all_rtl ();
6957 /* There's no need to defer outputting this function any more; we
6958 know we want to output it. */
6959 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6961 /* Now that we're done expanding trees to RTL, we shouldn't have any
6962 more CONCATs anywhere. */
6963 generating_concat_p = 0;
6965 if (dump_file)
6967 fprintf (dump_file,
6968 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6969 /* And the pass manager will dump RTL for us. */
6972 /* If we're emitting a nested function, make sure its parent gets
6973 emitted as well. Doing otherwise confuses debug info. */
6975 tree parent;
6976 for (parent = DECL_CONTEXT (current_function_decl);
6977 parent != NULL_TREE;
6978 parent = get_containing_scope (parent))
6979 if (TREE_CODE (parent) == FUNCTION_DECL)
6980 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6983 TREE_ASM_WRITTEN (current_function_decl) = 1;
6985 /* After expanding, the return labels are no longer needed. */
6986 return_label = NULL;
6987 naked_return_label = NULL;
6989 /* After expanding, the tm_restart map is no longer needed. */
6990 if (fun->gimple_df->tm_restart)
6991 fun->gimple_df->tm_restart = NULL;
6993 /* Tag the blocks with a depth number so that change_scope can find
6994 the common parent easily. */
6995 set_block_levels (DECL_INITIAL (fun->decl), 0);
6996 default_rtl_profile ();
6998 /* For -dx discard loops now, otherwise IL verify in clean_state will
6999 ICE. */
7000 if (rtl_dump_and_exit)
7002 cfun->curr_properties &= ~PROP_loops;
7003 loop_optimizer_finalize ();
7006 timevar_pop (TV_POST_EXPAND);
7008 return 0;
7011 } // anon namespace
7013 rtl_opt_pass *
7014 make_pass_expand (gcc::context *ctxt)
7016 return new pass_expand (ctxt);