fix single argument static_assert
[official-gcc.git] / gcc / cfgexpand.cc
blobafee064aa154fd5c97c6e85152b6aa61a3c87eb3
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2024 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "tree-inline.h"
65 #include "value-prof.h"
66 #include "tree-ssa-live.h"
67 #include "tree-outof-ssa.h"
68 #include "cfgloop.h"
69 #include "insn-attr.h" /* For INSN_SCHEDULING. */
70 #include "stringpool.h"
71 #include "attribs.h"
72 #include "asan.h"
73 #include "tree-ssa-address.h"
74 #include "output.h"
75 #include "builtins.h"
76 #include "opts.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
/* Fall back to the quoted symbol "__main" when NAME__MAIN has not been
   defined already. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
/* Forward declarations of file-local (static) helper functions. */
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 switch (gimple_assign_rhs_class (stmt))
109 case GIMPLE_TERNARY_RHS:
110 t = build3 (gimple_assign_rhs_code (stmt),
111 TREE_TYPE (gimple_assign_lhs (stmt)),
112 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt),
113 gimple_assign_rhs3 (stmt));
114 break;
115 case GIMPLE_BINARY_RHS:
116 t = build2 (gimple_assign_rhs_code (stmt),
117 TREE_TYPE (gimple_assign_lhs (stmt)),
118 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt));
119 break;
120 case GIMPLE_UNARY_RHS:
121 t = build1 (gimple_assign_rhs_code (stmt),
122 TREE_TYPE (gimple_assign_lhs (stmt)),
123 gimple_assign_rhs1 (stmt));
124 break;
125 case GIMPLE_SINGLE_RHS:
127 t = gimple_assign_rhs1 (stmt);
128 /* Avoid modifying this tree in place below. */
129 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
130 && gimple_location (stmt) != EXPR_LOCATION (t))
131 || (gimple_block (stmt) && currently_expanding_to_rtl
132 && EXPR_P (t)))
133 t = copy_node (t);
134 break;
136 default:
137 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
/* Default STACK_ALIGNMENT_NEEDED to 1 when nothing has defined it yet.  */
#ifndef STACK_ALIGNMENT_NEEDED
#define STACK_ALIGNMENT_NEEDED 1
#endif

/* For an SSA_NAME X yield SSA_NAME_VAR (X); any other tree is yielded
   unchanged.  X is expanded more than once, so it must not have side
   effects.  Every use of the argument is parenthesized so that an
   arbitrary expression can be passed safely.  */
#define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : (x))
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
/* Check the shape of X: for an SSA name or gimple register, a decl that
   use_register_for_decl accepts must get a REG, a CONCAT of REG/SUBREG
   halves or (for RESULT_DECLs) a PARALLEL; anything else must get a MEM,
   pc_rtx or a CONCAT of two MEMs. */
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESULT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
/* Fetch the tree currently recorded in X's MEM/REG attributes, looking
   through SUBREG, CONCAT and PARALLEL wrappers, merge it with T's decl
   via leader_merge, and refresh the attributes when the leader changes.
   pc_rtx carries no attributes and is skipped. */
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
/* For an SSA name, record X as the rtx of T's partition.  A partition
   that already has an rtx must be given that same rtx again, and pc_rtx
   is never stored as a partition's rtx. */
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly choose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
/* Anything that is not an SSA name gets X as its DECL_RTL directly. */
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 class stack_var
310 public:
311 /* The Variable. */
312 tree decl;
314 /* Initially, the size of the variable. Later, the size of the partition,
315 if this variable becomes its partition's representative. */
316 poly_uint64 size;
318 /* The *byte* alignment required for this variable. Or as, with the
319 size, the alignment for this partition. */
320 unsigned int alignb;
322 /* The partition representative. */
323 size_t representative;
325 /* The next stack variable in the partition, or EOC. */
326 size_t next;
328 /* The numbers of conflicting stack variables. */
329 bitmap conflicts;
/* End-of-chain marker stored in stack_var::next. */
332 #define EOC ((size_t)-1)
334 /* We have an array of such objects while deciding allocation. */
335 static class stack_var *stack_vars;
/* Number of elements allocated for stack_vars. */
336 static size_t stack_vars_alloc;
/* Number of elements of stack_vars currently in use. */
337 static size_t stack_vars_num;
/* Maps a decl (or SSA name) to its index in stack_vars. */
338 static hash_map<tree, size_t> *decl_to_stack_part;
340 /* Conflict bitmaps go on this obstack. This allows us to destroy
341 all of them in one big sweep. */
342 static bitmap_obstack stack_var_bitmap_obstack;
344 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
345 is non-decreasing.
NOTE(review): the comments in stack_var_cmp describe the size key as
sorted in decreasing order - confirm which description is right. */
346 static size_t *stack_vars_sorted;
348 /* The phase of the stack frame. This is the known misalignment of
349 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
350 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
351 static int frame_phase;
353 /* Used during expand_used_vars to remember if we saw any decls for
354 which we'd like to enable stack smashing protection. */
355 static bool has_protected_decls;
357 /* Used during expand_used_vars. Remember if we saw a character buffer
358 smaller than our cutoff threshold. Used for -Wstack-protector. */
359 static bool has_short_buffer;
361 /* Compute the byte alignment to use for DECL. Ignore alignment
362 we can't do with expected alignment of the stack boundary. */
364 static unsigned int
365 align_local_variable (tree decl, bool really_expand)
367 unsigned int align;
369 if (TREE_CODE (decl) == SSA_NAME)
371 tree type = TREE_TYPE (decl);
372 machine_mode mode = TYPE_MODE (type);
374 align = TYPE_ALIGN (type);
375 if (mode != BLKmode
376 && align < GET_MODE_ALIGNMENT (mode))
377 align = GET_MODE_ALIGNMENT (mode);
379 else
380 align = LOCAL_DECL_ALIGNMENT (decl);
382 if (hwasan_sanitize_stack_p ())
383 align = MAX (align, (unsigned) HWASAN_TAG_GRANULE_SIZE * BITS_PER_UNIT);
385 if (TREE_CODE (decl) != SSA_NAME && really_expand)
386 /* Don't change DECL_ALIGN when called from estimated_stack_frame_size.
387 That is done before IPA and could bump alignment based on host
388 backend even for offloaded code which wants different
389 LOCAL_DECL_ALIGNMENT. */
390 SET_DECL_ALIGN (decl, align);
392 return align / BITS_PER_UNIT;
395 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
396 down otherwise. Return truncated BASE value. */
398 static inline unsigned HOST_WIDE_INT
399 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
401 return align_up ? (base + align - 1) & -align : base & -align;
404 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
405 Return the frame offset. */
407 static poly_int64
408 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
410 poly_int64 offset, new_frame_offset;
412 if (FRAME_GROWS_DOWNWARD)
414 new_frame_offset
415 = aligned_lower_bound (frame_offset - frame_phase - size,
416 align) + frame_phase;
417 offset = new_frame_offset;
419 else
421 new_frame_offset
422 = aligned_upper_bound (frame_offset - frame_phase,
423 align) + frame_phase;
424 offset = new_frame_offset;
425 new_frame_offset += size;
427 frame_offset = new_frame_offset;
429 if (frame_offset_overflow (frame_offset, cfun->decl))
430 frame_offset = offset = 0;
432 return offset;
435 /* Ensure that the stack is aligned to ALIGN bytes.
436 Return the new frame offset. */
437 static poly_int64
438 align_frame_offset (unsigned HOST_WIDE_INT align)
440 return alloc_stack_frame_space (0, align);
443 /* Accumulate DECL into STACK_VARS. */
445 static void
446 add_stack_var (tree decl, bool really_expand)
448 class stack_var *v;
450 if (stack_vars_num >= stack_vars_alloc)
452 if (stack_vars_alloc)
453 stack_vars_alloc = stack_vars_alloc * 3 / 2;
454 else
455 stack_vars_alloc = 32;
456 stack_vars
457 = XRESIZEVEC (class stack_var, stack_vars, stack_vars_alloc);
459 if (!decl_to_stack_part)
460 decl_to_stack_part = new hash_map<tree, size_t>;
462 v = &stack_vars[stack_vars_num];
463 decl_to_stack_part->put (decl, stack_vars_num);
465 v->decl = decl;
466 tree size = TREE_CODE (decl) == SSA_NAME
467 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
468 : DECL_SIZE_UNIT (decl);
469 v->size = tree_to_poly_uint64 (size);
470 /* Ensure that all variables have size, so that &a != &b for any two
471 variables that are simultaneously live. */
472 if (known_eq (v->size, 0U))
473 v->size = 1;
474 v->alignb = align_local_variable (decl, really_expand);
475 /* An alignment of zero can mightily confuse us later. */
476 gcc_assert (v->alignb != 0);
478 /* All variables are initially in their own partition. */
479 v->representative = stack_vars_num;
480 v->next = EOC;
482 /* All variables initially conflict with no other. */
483 v->conflicts = NULL;
485 /* Ensure that this decl doesn't get put onto the list twice. */
486 set_rtl (decl, pc_rtx);
488 stack_vars_num++;
491 /* Make the decls associated with luid's X and Y conflict. */
493 static void
494 add_stack_var_conflict (size_t x, size_t y)
496 class stack_var *a = &stack_vars[x];
497 class stack_var *b = &stack_vars[y];
498 if (x == y)
499 return;
500 if (!a->conflicts)
501 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
502 if (!b->conflicts)
503 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
504 bitmap_set_bit (a->conflicts, y);
505 bitmap_set_bit (b->conflicts, x);
508 /* Check whether the decls associated with luid's X and Y conflict. */
510 static bool
511 stack_var_conflict_p (size_t x, size_t y)
513 class stack_var *a = &stack_vars[x];
514 class stack_var *b = &stack_vars[y];
515 if (x == y)
516 return false;
517 /* Partitions containing an SSA name result from gimple registers
518 with things like unsupported modes. They are top-level and
519 hence conflict with everything else. */
520 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
521 return true;
523 if (!a->conflicts || !b->conflicts)
524 return false;
525 return bitmap_bit_p (a->conflicts, y);
528 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
529 enter its partition number into bitmap DATA. */
531 static bool
532 visit_op (gimple *, tree op, tree, void *data)
534 bitmap active = (bitmap)data;
535 op = get_base_address (op);
536 if (op
537 && DECL_P (op)
538 && DECL_RTL_IF_SET (op) == pc_rtx)
540 size_t *v = decl_to_stack_part->get (op);
541 if (v)
542 bitmap_set_bit (active, *v);
544 return false;
547 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
548 record conflicts between it and all currently active other partitions
549 from bitmap DATA. */
551 static bool
552 visit_conflict (gimple *, tree op, tree, void *data)
554 bitmap active = (bitmap)data;
555 op = get_base_address (op);
556 if (op
557 && DECL_P (op)
558 && DECL_RTL_IF_SET (op) == pc_rtx)
560 size_t *v = decl_to_stack_part->get (op);
561 if (v && bitmap_set_bit (active, *v))
563 size_t num = *v;
564 bitmap_iterator bi;
565 unsigned i;
566 gcc_assert (num < stack_vars_num);
567 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
568 add_stack_var_conflict (num, i);
571 return false;
574 /* Helper function for add_scope_conflicts_1. For USE on
575 a stmt, if it is a SSA_NAME and in its SSA_NAME_DEF_STMT is known to be
576 based on some ADDR_EXPR, invoke VISIT on that ADDR_EXPR. */
578 static inline void
579 add_scope_conflicts_2 (tree use, bitmap work,
580 walk_stmt_load_store_addr_fn visit)
582 if (TREE_CODE (use) == SSA_NAME
583 && (POINTER_TYPE_P (TREE_TYPE (use))
584 || INTEGRAL_TYPE_P (TREE_TYPE (use))))
586 gimple *g = SSA_NAME_DEF_STMT (use);
587 if (is_gimple_assign (g))
588 if (tree op = gimple_assign_rhs1 (g))
589 if (TREE_CODE (op) == ADDR_EXPR)
590 visit (g, TREE_OPERAND (op, 0), op, work);
594 /* Helper routine for add_scope_conflicts, calculating the active partitions
595 at the end of BB, leaving the result in WORK. We're called to generate
596 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
597 liveness. */
599 static void
600 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
602 edge e;
603 edge_iterator ei;
604 gimple_stmt_iterator gsi;
605 walk_stmt_load_store_addr_fn visit;
606 use_operand_p use_p;
607 ssa_op_iter iter;
609 bitmap_clear (work);
610 FOR_EACH_EDGE (e, ei, bb->preds)
611 bitmap_ior_into (work, (bitmap)e->src->aux);
613 visit = visit_op;
615 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
617 gimple *stmt = gsi_stmt (gsi);
618 gphi *phi = as_a <gphi *> (stmt);
619 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
620 FOR_EACH_PHI_ARG (use_p, phi, iter, SSA_OP_USE)
621 add_scope_conflicts_2 (USE_FROM_PTR (use_p), work, visit);
623 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
625 gimple *stmt = gsi_stmt (gsi);
627 if (gimple_clobber_p (stmt))
629 tree lhs = gimple_assign_lhs (stmt);
630 size_t *v;
631 /* Nested function lowering might introduce LHSs
632 that are COMPONENT_REFs. */
633 if (!VAR_P (lhs))
634 continue;
635 if (DECL_RTL_IF_SET (lhs) == pc_rtx
636 && (v = decl_to_stack_part->get (lhs)))
637 bitmap_clear_bit (work, *v);
639 else if (!is_gimple_debug (stmt))
641 if (for_conflict && visit == visit_op)
643 /* When we are inheriting live variables from our predecessors
644 through a CFG merge we might not see an actual mention of
645 the variables to record the approprate conflict as defs/uses
646 might be through indirect stores/loads. For this reason
647 we have to make sure each live variable conflicts with
648 each other. When there's just a single predecessor the
649 set of conflicts is already up-to-date.
650 We perform this delayed at the first real instruction to
651 allow clobbers starting this block to remove variables from
652 the set of live variables. */
653 bitmap_iterator bi;
654 unsigned i;
655 if (EDGE_COUNT (bb->preds) > 1)
656 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
658 class stack_var *a = &stack_vars[i];
659 if (!a->conflicts)
660 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
661 bitmap_ior_into (a->conflicts, work);
663 visit = visit_conflict;
665 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
666 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
667 add_scope_conflicts_2 (USE_FROM_PTR (use_p), work, visit);
671 /* When there was no real instruction but there's a CFG merge we need
672 to add the conflicts now. */
673 if (for_conflict && visit == visit_op && EDGE_COUNT (bb->preds) > 1)
675 bitmap_iterator bi;
676 unsigned i;
677 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
679 class stack_var *a = &stack_vars[i];
680 if (!a->conflicts)
681 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
682 bitmap_ior_into (a->conflicts, work);
687 /* Generate stack partition conflicts between all partitions that are
688 simultaneously live. */
690 static void
691 add_scope_conflicts (void)
693 basic_block bb;
694 bool changed;
695 bitmap work = BITMAP_ALLOC (NULL);
696 int *rpo;
697 int n_bbs;
699 /* We approximate the live range of a stack variable by taking the first
700 mention of its name as starting point(s), and by the end-of-scope
701 death clobber added by gimplify as ending point(s) of the range.
702 This overapproximates in the case we for instance moved an address-taken
703 operation upward, without also moving a dereference to it upwards.
704 But it's conservatively correct as a variable never can hold values
705 before its name is mentioned at least once.
707 We then do a mostly classical bitmap liveness algorithm. */
709 FOR_ALL_BB_FN (bb, cfun)
710 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
712 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
713 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
715 changed = true;
716 while (changed)
718 int i;
719 changed = false;
720 for (i = 0; i < n_bbs; i++)
722 bitmap active;
723 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
724 active = (bitmap)bb->aux;
725 add_scope_conflicts_1 (bb, work, false);
726 if (bitmap_ior_into (active, work))
727 changed = true;
731 FOR_EACH_BB_FN (bb, cfun)
732 add_scope_conflicts_1 (bb, work, true);
734 free (rpo);
735 BITMAP_FREE (work);
736 FOR_ALL_BB_FN (bb, cfun)
737 BITMAP_FREE (bb->aux);
740 /* A subroutine of partition_stack_vars. A comparison function for qsort,
741 sorting an array of indices by the properties of the object. */
743 static int
744 stack_var_cmp (const void *a, const void *b)
746 size_t ia = *(const size_t *)a;
747 size_t ib = *(const size_t *)b;
748 unsigned int aligna = stack_vars[ia].alignb;
749 unsigned int alignb = stack_vars[ib].alignb;
750 poly_int64 sizea = stack_vars[ia].size;
751 poly_int64 sizeb = stack_vars[ib].size;
752 tree decla = stack_vars[ia].decl;
753 tree declb = stack_vars[ib].decl;
754 bool largea, largeb;
755 unsigned int uida, uidb;
757 /* Primary compare on "large" alignment. Large comes first. */
758 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
759 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
760 if (largea != largeb)
761 return (int)largeb - (int)largea;
763 /* Secondary compare on size, decreasing */
764 int diff = compare_sizes_for_sort (sizeb, sizea);
765 if (diff != 0)
766 return diff;
768 /* Tertiary compare on true alignment, decreasing. */
769 if (aligna < alignb)
770 return -1;
771 if (aligna > alignb)
772 return 1;
774 /* Final compare on ID for sort stability, increasing.
775 Two SSA names are compared by their version, SSA names come before
776 non-SSA names, and two normal decls are compared by their DECL_UID. */
777 if (TREE_CODE (decla) == SSA_NAME)
779 if (TREE_CODE (declb) == SSA_NAME)
780 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
781 else
782 return -1;
784 else if (TREE_CODE (declb) == SSA_NAME)
785 return 1;
786 else
787 uida = DECL_UID (decla), uidb = DECL_UID (declb);
788 if (uida < uidb)
789 return 1;
790 if (uida > uidb)
791 return -1;
792 return 0;
/* Hash map from a size_t key to a bitmap.  In this file it is keyed by
   DECL_PT_UID and maps each partitioned decl to the bitmap of all
   members of its partition. */
795 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
796 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
798 /* If the points-to solution *PI points to variables that are in a partition
799 together with other variables add all partition members to the pointed-to
800 variables bitmap. */
802 static void
803 add_partitioned_vars_to_ptset (struct pt_solution *pt,
804 part_hashmap *decls_to_partitions,
805 hash_set<bitmap> *visited, bitmap temp)
807 bitmap_iterator bi;
808 unsigned i;
809 bitmap *part;
811 if (pt->anything
812 || pt->vars == NULL
813 /* The pointed-to vars bitmap is shared, it is enough to
814 visit it once. */
815 || visited->add (pt->vars))
816 return;
818 bitmap_clear (temp);
820 /* By using a temporary bitmap to store all members of the partitions
821 we have to add we make sure to visit each of the partitions only
822 once. */
823 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
824 if ((!temp
825 || !bitmap_bit_p (temp, i))
826 && (part = decls_to_partitions->get (i)))
827 bitmap_ior_into (temp, *part);
828 if (!bitmap_empty_p (temp))
829 bitmap_ior_into (pt->vars, temp);
832 /* Update points-to sets based on partition info, so we can use them on RTL.
833 The bitmaps representing stack partitions will be saved until expand,
834 where partitioned decls used as bases in memory expressions will be
835 rewritten.
837 It is not necessary to update TBAA info on accesses to the coalesced
838 storage since our memory model doesn't allow TBAA to be used for
839 WAW or WAR dependences. For RAW when the write is to an old object
840 the new object would not have been initialized at the point of the
841 read, invoking undefined behavior. */
843 static void
844 update_alias_info_with_stack_vars (void)
846 part_hashmap *decls_to_partitions = NULL;
847 size_t i, j;
848 tree var = NULL_TREE;
850 for (i = 0; i < stack_vars_num; i++)
852 bitmap part = NULL;
853 tree name;
854 struct ptr_info_def *pi;
856 /* Not interested in partitions with single variable. */
857 if (stack_vars[i].representative != i
858 || stack_vars[i].next == EOC)
859 continue;
/* Create both maps lazily, on the first partition that has more than
   one member. */
861 if (!decls_to_partitions)
863 decls_to_partitions = new part_hashmap;
864 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
867 /* Create an SSA_NAME that points to the partition for use
868 as base during alias-oracle queries on RTL for bases that
869 have been partitioned. */
870 if (var == NULL_TREE)
871 var = create_tmp_var (ptr_type_node);
872 name = make_ssa_name (var);
874 /* Create bitmaps representing partitions. They will be used for
875 points-to sets later, so use GGC alloc. */
876 part = BITMAP_GGC_ALLOC ();
/* Walk the partition's member chain: enter each member's DECL_PT_UID
   into PART, map the UID to PART and the decl to NAME. */
877 for (j = i; j != EOC; j = stack_vars[j].next)
879 tree decl = stack_vars[j].decl;
880 unsigned int uid = DECL_PT_UID (decl);
881 bitmap_set_bit (part, uid);
882 decls_to_partitions->put (uid, part);
883 cfun->gimple_df->decls_to_pointers->put (decl, name);
884 if (TREE_ADDRESSABLE (decl))
885 TREE_ADDRESSABLE (name) = 1;
888 /* Make the SSA name point to all partition members. */
889 pi = get_ptr_info (name);
890 pt_solution_set (&pi->pt, part, false);
893 /* Make all points-to sets that contain one member of a partition
894 contain all members of the partition. */
895 if (decls_to_partitions)
/* NOTE(review): this I shadows the size_t I declared at function scope. */
897 unsigned i;
898 tree name;
899 hash_set<bitmap> visited;
900 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
902 FOR_EACH_SSA_NAME (i, name, cfun)
904 struct ptr_info_def *pi;
906 if (POINTER_TYPE_P (TREE_TYPE (name))
907 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
908 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
909 &visited, temp);
/* The function-wide escaped solutions get the same treatment. */
912 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
913 decls_to_partitions, &visited, temp);
914 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped_return,
915 decls_to_partitions, &visited, temp);
916 delete decls_to_partitions;
917 BITMAP_FREE (temp);
921 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
922 partitioning algorithm. Partitions A and B are known to be non-conflicting.
923 Merge them into a single partition A. */
925 static void
926 union_stack_vars (size_t a, size_t b)
928 class stack_var *vb = &stack_vars[b];
929 bitmap_iterator bi;
930 unsigned u;
932 gcc_assert (stack_vars[b].next == EOC);
933 /* Add B to A's partition. */
934 stack_vars[b].next = stack_vars[a].next;
935 stack_vars[b].representative = a;
936 stack_vars[a].next = b;
938 /* Make sure A is big enough to hold B. */
939 stack_vars[a].size = upper_bound (stack_vars[a].size, stack_vars[b].size);
941 /* Update the required alignment of partition A to account for B. */
942 if (stack_vars[a].alignb < stack_vars[b].alignb)
943 stack_vars[a].alignb = stack_vars[b].alignb;
945 /* Update the interference graph and merge the conflicts. */
946 if (vb->conflicts)
948 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
949 add_stack_var_conflict (a, stack_vars[u].representative);
950 BITMAP_FREE (vb->conflicts);
954 /* A subroutine of expand_used_vars. Binpack the variables into
955 partitions constrained by the interference graph. The overall
956 algorithm used is as follows:
958 Sort the objects by size in descending order.
959 For each object A {
960 S = size(A)
961 O = 0
962 loop {
963 Look for the largest non-conflicting object B with size <= S.
964 UNION (A, B)
969 static void
970 partition_stack_vars (void)
972 size_t si, sj, n = stack_vars_num;
974 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
975 for (si = 0; si < n; ++si)
976 stack_vars_sorted[si] = si;
978 if (n == 1)
979 return;
981 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
983 for (si = 0; si < n; ++si)
985 size_t i = stack_vars_sorted[si];
986 unsigned int ialign = stack_vars[i].alignb;
987 poly_int64 isize = stack_vars[i].size;
989 /* Ignore objects that aren't partition representatives. If we
990 see a var that is not a partition representative, it must
991 have been merged earlier. */
992 if (stack_vars[i].representative != i)
993 continue;
995 for (sj = si + 1; sj < n; ++sj)
997 size_t j = stack_vars_sorted[sj];
998 unsigned int jalign = stack_vars[j].alignb;
999 poly_int64 jsize = stack_vars[j].size;
1001 /* Ignore objects that aren't partition representatives. */
1002 if (stack_vars[j].representative != j)
1003 continue;
1005 /* Do not mix objects of "small" (supported) alignment
1006 and "large" (unsupported) alignment. */
1007 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1008 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
1009 break;
1011 /* For Address Sanitizer do not mix objects with different
1012 sizes, as the shorter vars wouldn't be adequately protected.
1013 Don't do that for "large" (unsupported) alignment objects,
1014 those aren't protected anyway. */
1015 if (asan_sanitize_stack_p ()
1016 && maybe_ne (isize, jsize)
1017 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1018 break;
1020 /* Ignore conflicting objects. */
1021 if (stack_var_conflict_p (i, j))
1022 continue;
1024 /* UNION the objects, placing J at OFFSET. */
1025 union_stack_vars (i, j);
1029 update_alias_info_with_stack_vars ();
1032 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
1034 static void
1035 dump_stack_var_partition (void)
1037 size_t si, i, j, n = stack_vars_num;
1039 for (si = 0; si < n; ++si)
1041 i = stack_vars_sorted[si];
1043 /* Skip variables that aren't partition representatives, for now. */
1044 if (stack_vars[i].representative != i)
1045 continue;
1047 fprintf (dump_file, "Partition " HOST_SIZE_T_PRINT_UNSIGNED ": size ",
1048 (fmt_size_t) i);
1049 print_dec (stack_vars[i].size, dump_file);
1050 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
1052 for (j = i; j != EOC; j = stack_vars[j].next)
1054 fputc ('\t', dump_file);
1055 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
1057 fputc ('\n', dump_file);
1061 /* Assign rtl to DECL at BASE + OFFSET. */
1063 static void
1064 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
1065 poly_int64 offset)
1067 unsigned align;
1068 rtx x;
1070 /* If this fails, we've overflowed the stack frame. Error nicely? */
1071 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
1073 if (hwasan_sanitize_stack_p ())
1074 x = targetm.memtag.add_tag (base, offset,
1075 hwasan_current_frame_tag ());
1076 else
1077 x = plus_constant (Pmode, base, offset);
1079 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
1080 ? TYPE_MODE (TREE_TYPE (decl))
1081 : DECL_MODE (decl), x);
1083 /* Set alignment we actually gave this decl if it isn't an SSA name.
1084 If it is we generate stack slots only accidentally so it isn't as
1085 important, we'll simply set the alignment directly on the MEM. */
1087 if (stack_vars_base_reg_p (base))
1088 offset -= frame_phase;
1089 align = known_alignment (offset);
1090 align *= BITS_PER_UNIT;
1091 if (align == 0 || align > base_align)
1092 align = base_align;
1094 if (TREE_CODE (decl) != SSA_NAME)
1096 /* One would think that we could assert that we're not decreasing
1097 alignment here, but (at least) the i386 port does exactly this
1098 via the MINIMUM_ALIGNMENT hook. */
1100 SET_DECL_ALIGN (decl, align);
1101 DECL_USER_ALIGN (decl) = 0;
1104 set_rtl (decl, x);
1106 set_mem_align (x, align);
1109 class stack_vars_data
1111 public:
1112 /* Vector of offset pairs, always end of some padding followed
1113 by start of the padding that needs Address Sanitizer protection.
1114 The vector is in reversed, highest offset pairs come first. */
1115 auto_vec<HOST_WIDE_INT> asan_vec;
1117 /* Vector of partition representative decls in between the paddings. */
1118 auto_vec<tree> asan_decl_vec;
1120 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1121 rtx asan_base;
1123 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1124 unsigned int asan_alignb;
1127 /* A subroutine of expand_used_vars. Give each partition representative
1128 a unique location within the stack frame. Update each partition member
1129 with that location.
   PRED, when non-null, is called with a stack_vars index and only the
   partitions it accepts are allocated in this call; partitions with
   "large" alignment are handled only when PRED is null.  DATA collects
   the Address Sanitizer offsets, representative decls, base register
   and alignment for the partitions allocated here. */
1130 static void
1131 expand_stack_vars (bool (*pred) (size_t), class stack_vars_data *data)
1133 size_t si, i, j, n = stack_vars_num;
/* LARGE_SIZE is the total computed by the first walk; LARGE_ALLOC is the
   running offset handed out by the second walk.  They are asserted equal
   at the end. */
1134 poly_uint64 large_size = 0, large_alloc = 0;
1135 rtx large_base = NULL;
1136 rtx large_untagged_base = NULL;
1137 unsigned large_align = 0;
1138 bool large_allocation_done = false;
1139 tree decl;
1141 /* Determine if there are any variables requiring "large" alignment.
1142 Since these are dynamically allocated, we only process these if
1143 no predicate involved. */
/* NOTE(review): this reads stack_vars_sorted[0] unconditionally --
   presumably callers guarantee stack_vars_num > 0; confirm. */
1144 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1145 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1147 /* Find the total size of these variables. */
1148 for (si = 0; si < n; ++si)
1150 unsigned alignb;
1152 i = stack_vars_sorted[si];
1153 alignb = stack_vars[i].alignb;
1155 /* All "large" alignment decls come before all "small" alignment
1156 decls, but "large" alignment decls are not sorted based on
1157 their alignment. Increase large_align to track the largest
1158 required alignment. */
1159 if ((alignb * BITS_PER_UNIT) > large_align)
1160 large_align = alignb * BITS_PER_UNIT;
1162 /* Stop when we get to the first decl with "small" alignment. */
1163 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1164 break;
1166 /* Skip variables that aren't partition representatives. */
1167 if (stack_vars[i].representative != i)
1168 continue;
1170 /* Skip variables that have already had rtl assigned. See also
1171 add_stack_var where we perpetrate this pc_rtx hack. */
1172 decl = stack_vars[i].decl;
1173 if (TREE_CODE (decl) == SSA_NAME
1174 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1175 : DECL_RTL (decl) != pc_rtx)
1176 continue;
1178 large_size = aligned_upper_bound (large_size, alignb);
1179 large_size += stack_vars[i].size;
/* Second walk: pick a base and offset for every representative that is
   still unplaced and accepted by PRED, then give that location to all
   members of its partition. */
1183 for (si = 0; si < n; ++si)
1185 rtx base;
1186 unsigned base_align, alignb;
1187 poly_int64 offset = 0;
1189 i = stack_vars_sorted[si];
1191 /* Skip variables that aren't partition representatives, for now. */
1192 if (stack_vars[i].representative != i)
1193 continue;
1195 /* Skip variables that have already had rtl assigned. See also
1196 add_stack_var where we perpetrate this pc_rtx hack. */
1197 decl = stack_vars[i].decl;
1198 if (TREE_CODE (decl) == SSA_NAME
1199 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1200 : DECL_RTL (decl) != pc_rtx)
1201 continue;
1203 /* Check the predicate to see whether this variable should be
1204 allocated in this pass. */
1205 if (pred && !pred (i))
1206 continue;
1208 base = (hwasan_sanitize_stack_p ()
1209 ? hwasan_frame_base ()
1210 : virtual_stack_vars_rtx);
1211 alignb = stack_vars[i].alignb;
1212 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1214 poly_int64 hwasan_orig_offset;
1215 if (hwasan_sanitize_stack_p ())
1217 /* There must be no tag granule "shared" between different
1218 objects. This means that no HWASAN_TAG_GRANULE_SIZE byte
1219 chunk can have more than one object in it.
1221 We ensure this by forcing the end of the last bit of data to
1222 be aligned to HWASAN_TAG_GRANULE_SIZE bytes here, and setting
1223 the start of each variable to be aligned to
1224 HWASAN_TAG_GRANULE_SIZE bytes in `align_local_variable`.
1226 We can't align just one of the start or end, since there are
1227 untagged things stored on the stack which we do not align to
1228 HWASAN_TAG_GRANULE_SIZE bytes. If we only aligned the start
1229 or the end of tagged objects then untagged objects could end
1230 up sharing the first granule of a tagged object or sharing the
1231 last granule of a tagged object respectively. */
1232 hwasan_orig_offset = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1233 gcc_assert (stack_vars[i].alignb >= HWASAN_TAG_GRANULE_SIZE);
1235 /* ASAN description strings don't yet have a syntax for expressing
1236 polynomial offsets. */
1237 HOST_WIDE_INT prev_offset;
1238 if (asan_sanitize_stack_p ()
1239 && pred
1240 && frame_offset.is_constant (&prev_offset)
1241 && stack_vars[i].size.is_constant ())
/* The first protected variable starts on an ASAN_RED_ZONE_SIZE boundary,
   and PREV_OFFSET is re-read after that alignment. */
1243 if (data->asan_vec.is_empty ())
1245 align_frame_offset (ASAN_RED_ZONE_SIZE);
1246 prev_offset = frame_offset.to_constant ();
1248 prev_offset = align_base (prev_offset,
1249 ASAN_MIN_RED_ZONE_SIZE,
1250 !FRAME_GROWS_DOWNWARD);
1251 tree repr_decl = NULL_TREE;
1252 unsigned HOST_WIDE_INT size
1253 = asan_var_and_redzone_size (stack_vars[i].size.to_constant ());
1254 if (data->asan_vec.is_empty ())
1255 size = MAX (size, ASAN_RED_ZONE_SIZE);
1257 unsigned HOST_WIDE_INT alignment = MAX (alignb,
1258 ASAN_MIN_RED_ZONE_SIZE);
1259 offset = alloc_stack_frame_space (size, alignment);
1261 data->asan_vec.safe_push (prev_offset);
1262 /* Allocating a constant amount of space from a constant
1263 starting offset must give a constant result. */
1264 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1265 .to_constant ());
1266 /* Find best representative of the partition.
1267 Prefer those with DECL_NAME, even better
1268 satisfying asan_protect_stack_decl predicate. */
1269 for (j = i; j != EOC; j = stack_vars[j].next)
1270 if (asan_protect_stack_decl (stack_vars[j].decl)
1271 && DECL_NAME (stack_vars[j].decl))
1273 repr_decl = stack_vars[j].decl;
1274 break;
1276 else if (repr_decl == NULL_TREE
1277 && DECL_P (stack_vars[j].decl)
1278 && DECL_NAME (stack_vars[j].decl))
1279 repr_decl = stack_vars[j].decl;
1280 if (repr_decl == NULL_TREE)
1281 repr_decl = stack_vars[i].decl;
1282 data->asan_decl_vec.safe_push (repr_decl);
1284 /* Make sure a representative is unpoisoned if another
1285 variable in the partition is handled by
1286 use-after-scope sanitization. */
1287 if (asan_handled_variables != NULL
1288 && !asan_handled_variables->contains (repr_decl))
1290 for (j = i; j != EOC; j = stack_vars[j].next)
1291 if (asan_handled_variables->contains (stack_vars[j].decl))
1292 break;
1293 if (j != EOC)
1294 asan_handled_variables->add (repr_decl);
1297 data->asan_alignb = MAX (data->asan_alignb, alignb);
1298 if (data->asan_base == NULL)
1299 data->asan_base = gen_reg_rtx (Pmode);
1300 base = data->asan_base;
1302 if (!STRICT_ALIGNMENT)
1303 base_align = crtl->max_used_stack_slot_alignment;
1304 else
1305 base_align = MAX (crtl->max_used_stack_slot_alignment,
1306 GET_MODE_ALIGNMENT (SImode)
1307 << ASAN_SHADOW_SHIFT);
1309 else
1311 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1312 base_align = crtl->max_used_stack_slot_alignment;
1314 if (hwasan_sanitize_stack_p ())
1316 /* Align again since the point of this alignment is to handle
1317 the "end" of the object (i.e. smallest address after the
1318 stack object). For FRAME_GROWS_DOWNWARD that requires
1319 aligning the stack before allocating, but for a frame that
1320 grows upwards that requires aligning the stack after
1321 allocation.
1323 Use `frame_offset` to record the offset value rather than
1324 `offset` since the `frame_offset` describes the extent
1325 allocated for this particular variable while `offset`
1326 describes the address that this variable starts at. */
1327 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1328 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1329 hwasan_orig_offset, frame_offset);
1333 else
1335 /* Large alignment is only processed in the last pass. */
1336 if (pred)
1337 continue;
1339 /* If there were any variables requiring "large" alignment, allocate
1340 space. */
/* The chunk is allocated once, on the first large-alignment partition
   reached; later partitions reuse LARGE_BASE. */
1341 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1343 poly_int64 loffset;
1344 rtx large_allocsize;
1346 large_allocsize = gen_int_mode (large_size, Pmode);
1347 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1348 loffset = alloc_stack_frame_space
1349 (rtx_to_poly_int64 (large_allocsize),
1350 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1351 large_base = get_dynamic_stack_base (loffset, large_align, base);
1352 large_allocation_done = true;
1355 gcc_assert (large_base != NULL);
/* Round the running offset up to this partition's alignment, place the
   partition there, then advance past it. */
1356 large_alloc = aligned_upper_bound (large_alloc, alignb);
1357 offset = large_alloc;
1358 large_alloc += stack_vars[i].size;
1359 if (hwasan_sanitize_stack_p ())
1361 /* An object with a large alignment requirement means that the
1362 alignment requirement is greater than the required alignment
1363 for tags. */
1364 if (!large_untagged_base)
1365 large_untagged_base
1366 = targetm.memtag.untagged_pointer (large_base, NULL_RTX);
1367 /* Ensure the end of the variable is also aligned correctly. */
1368 poly_int64 align_again
1369 = aligned_upper_bound (large_alloc, HWASAN_TAG_GRANULE_SIZE);
1370 /* For large allocations we always allocate a chunk of space
1371 (which is addressed by large_untagged_base/large_base) and
1372 then use positive offsets from that. Hence the farthest
1373 offset is `align_again` and the nearest offset from the base
1374 is `offset`. */
1375 hwasan_record_stack_var (large_untagged_base, large_base,
1376 offset, align_again);
1379 base = large_base;
1380 base_align = large_align;
1383 /* Create rtl for each variable based on their location within the
1384 partition. */
1385 for (j = i; j != EOC; j = stack_vars[j].next)
1387 expand_one_stack_var_at (stack_vars[j].decl,
1388 base, base_align, offset);
1390 if (hwasan_sanitize_stack_p ())
1391 hwasan_increment_frame_tag ();
/* Everything counted by the first walk must have been placed by the
   second one. */
1394 gcc_assert (known_eq (large_alloc, large_size));
1397 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1398 static poly_uint64
1399 account_stack_vars (void)
1401 size_t si, j, i, n = stack_vars_num;
1402 poly_uint64 size = 0;
1404 for (si = 0; si < n; ++si)
1406 i = stack_vars_sorted[si];
1408 /* Skip variables that aren't partition representatives, for now. */
1409 if (stack_vars[i].representative != i)
1410 continue;
1412 size += stack_vars[i].size;
1413 for (j = i; j != EOC; j = stack_vars[j].next)
1414 set_rtl (stack_vars[j].decl, NULL);
1416 return size;
1419 /* Record the RTL assignment X for the default def of PARM. */
1421 extern void
1422 set_parm_rtl (tree parm, rtx x)
1424 gcc_assert (TREE_CODE (parm) == PARM_DECL
1425 || TREE_CODE (parm) == RESULT_DECL);
1427 if (x && !MEM_P (x))
1429 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1430 TYPE_MODE (TREE_TYPE (parm)),
1431 TYPE_ALIGN (TREE_TYPE (parm)));
1433 /* If the variable alignment is very large we'll dynamicaly
1434 allocate it, which means that in-frame portion is just a
1435 pointer. ??? We've got a pseudo for sure here, do we
1436 actually dynamically allocate its spilling area if needed?
1437 ??? Isn't it a problem when Pmode alignment also exceeds
1438 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1439 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1440 align = GET_MODE_ALIGNMENT (Pmode);
1442 record_alignment_for_reg_var (align);
1445 tree ssa = ssa_default_def (cfun, parm);
1446 if (!ssa)
1447 return set_rtl (parm, x);
1449 int part = var_to_partition (SA.map, ssa);
1450 gcc_assert (part != NO_PARTITION);
1452 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1453 gcc_assert (changed);
1455 set_rtl (ssa, x);
1456 gcc_assert (DECL_RTL (parm) == x);
1459 /* A subroutine of expand_one_var. Called to immediately assign rtl
1460 to a variable to be allocated in the stack frame. */
1462 static void
1463 expand_one_stack_var_1 (tree var)
1465 poly_uint64 size;
1466 poly_int64 offset;
1467 unsigned byte_align;
1469 if (TREE_CODE (var) == SSA_NAME)
1471 tree type = TREE_TYPE (var);
1472 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1474 else
1475 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1477 byte_align = align_local_variable (var, true);
1479 /* We handle highly aligned variables in expand_stack_vars. */
1480 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1482 rtx base;
1483 if (hwasan_sanitize_stack_p ())
1485 /* Allocate zero bytes to align the stack. */
1486 poly_int64 hwasan_orig_offset
1487 = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1488 offset = alloc_stack_frame_space (size, byte_align);
1489 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1490 base = hwasan_frame_base ();
1491 /* Use `frame_offset` to automatically account for machines where the
1492 frame grows upwards.
1494 `offset` will always point to the "start" of the stack object, which
1495 will be the smallest address, for ! FRAME_GROWS_DOWNWARD this is *not*
1496 the "furthest" offset from the base delimiting the current stack
1497 object. `frame_offset` will always delimit the extent that the frame.
1499 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1500 hwasan_orig_offset, frame_offset);
1502 else
1504 offset = alloc_stack_frame_space (size, byte_align);
1505 base = virtual_stack_vars_rtx;
1508 expand_one_stack_var_at (var, base,
1509 crtl->max_used_stack_slot_alignment, offset);
1511 if (hwasan_sanitize_stack_p ())
1512 hwasan_increment_frame_tag ();
1515 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1516 already assigned some MEM. */
1518 static void
1519 expand_one_stack_var (tree var)
1521 if (TREE_CODE (var) == SSA_NAME)
1523 int part = var_to_partition (SA.map, var);
1524 if (part != NO_PARTITION)
1526 rtx x = SA.partition_to_pseudo[part];
1527 gcc_assert (x);
1528 gcc_assert (MEM_P (x));
1529 return;
1533 return expand_one_stack_var_1 (var);
1536 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1537 that will reside in a hard register. */
1539 static void
1540 expand_one_hard_reg_var (tree var)
1542 rest_of_decl_compilation (var, 0, 0);
1545 /* Record the alignment requirements of some variable assigned to a
1546 pseudo. */
1548 static void
1549 record_alignment_for_reg_var (unsigned int align)
1551 if (SUPPORTS_STACK_ALIGNMENT
1552 && crtl->stack_alignment_estimated < align)
1554 /* stack_alignment_estimated shouldn't change after stack
1555 realign decision made */
1556 gcc_assert (!crtl->stack_realign_processed);
1557 crtl->stack_alignment_estimated = align;
1560 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1561 So here we only make sure stack_alignment_needed >= align. */
1562 if (crtl->stack_alignment_needed < align)
1563 crtl->stack_alignment_needed = align;
1564 if (crtl->max_used_stack_slot_alignment < align)
1565 crtl->max_used_stack_slot_alignment = align;
1568 /* Create RTL for an SSA partition. */
1570 static void
1571 expand_one_ssa_partition (tree var)
1573 int part = var_to_partition (SA.map, var);
1574 gcc_assert (part != NO_PARTITION);
1576 if (SA.partition_to_pseudo[part])
1577 return;
1579 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1580 TYPE_MODE (TREE_TYPE (var)),
1581 TYPE_ALIGN (TREE_TYPE (var)));
1583 /* If the variable alignment is very large we'll dynamicaly allocate
1584 it, which means that in-frame portion is just a pointer. */
1585 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1586 align = GET_MODE_ALIGNMENT (Pmode);
1588 record_alignment_for_reg_var (align);
1590 if (!use_register_for_decl (var))
1592 if (defer_stack_allocation (var, true))
1593 add_stack_var (var, true);
1594 else
1595 expand_one_stack_var_1 (var);
1596 return;
1599 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1600 rtx x = gen_reg_rtx (reg_mode);
1602 set_rtl (var, x);
1604 /* For a promoted variable, X will not be used directly but wrapped in a
1605 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1606 will assume that its upper bits can be inferred from its lower bits.
1607 Therefore, if X isn't initialized on every path from the entry, then
1608 we must do it manually in order to fulfill the above assumption. */
1609 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1610 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1611 emit_move_insn (x, CONST0_RTX (reg_mode));
1614 /* Record the association between the RTL generated for partition PART
1615 and the underlying variable of the SSA_NAME VAR. */
1617 static void
1618 adjust_one_expanded_partition_var (tree var)
1620 if (!var)
1621 return;
1623 tree decl = SSA_NAME_VAR (var);
1625 int part = var_to_partition (SA.map, var);
1626 if (part == NO_PARTITION)
1627 return;
1629 rtx x = SA.partition_to_pseudo[part];
1631 gcc_assert (x);
1633 set_rtl (var, x);
1635 if (!REG_P (x))
1636 return;
1638 /* Note if the object is a user variable. */
1639 if (decl && !DECL_ARTIFICIAL (decl))
1640 mark_user_reg (x);
1642 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1643 mark_reg_pointer (x, get_pointer_alignment (var));
1646 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1647 that will reside in a pseudo register. */
1649 static void
1650 expand_one_register_var (tree var)
1652 if (TREE_CODE (var) == SSA_NAME)
1654 int part = var_to_partition (SA.map, var);
1655 if (part != NO_PARTITION)
1657 rtx x = SA.partition_to_pseudo[part];
1658 gcc_assert (x);
1659 gcc_assert (REG_P (x));
1660 return;
1662 gcc_unreachable ();
1665 tree decl = var;
1666 tree type = TREE_TYPE (decl);
1667 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1668 rtx x = gen_reg_rtx (reg_mode);
1670 set_rtl (var, x);
1672 /* Note if the object is a user variable. */
1673 if (!DECL_ARTIFICIAL (decl))
1674 mark_user_reg (x);
1676 if (POINTER_TYPE_P (type))
1677 mark_reg_pointer (x, get_pointer_alignment (var));
1680 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1681 has some associated error, e.g. its type is error-mark. We just need
1682 to pick something that won't crash the rest of the compiler. */
1684 static void
1685 expand_one_error_var (tree var)
1687 machine_mode mode = DECL_MODE (var);
1688 rtx x;
1690 if (mode == BLKmode)
1691 x = gen_rtx_MEM (BLKmode, const0_rtx);
1692 else if (mode == VOIDmode)
1693 x = const0_rtx;
1694 else
1695 x = gen_reg_rtx (mode);
1697 SET_DECL_RTL (var, x);
1700 /* A subroutine of expand_one_var. VAR is a variable that will be
1701 allocated to the local stack frame. Return true if we wish to
1702 add VAR to STACK_VARS so that it will be coalesced with other
1703 variables. Return false to allocate VAR immediately.
1705 This function is used to reduce the number of variables considered
1706 for coalescing, which reduces the size of the quadratic problem. */
1708 static bool
1709 defer_stack_allocation (tree var, bool toplevel)
1711 tree size_unit = TREE_CODE (var) == SSA_NAME
1712 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1713 : DECL_SIZE_UNIT (var);
1714 poly_uint64 size;
1716 /* Whether the variable is small enough for immediate allocation not to be
1717 a problem with regard to the frame size. */
1718 bool smallish
1719 = (poly_int_tree_p (size_unit, &size)
1720 && (estimated_poly_value (size)
1721 < param_min_size_for_stack_sharing));
1723 /* If stack protection is enabled, *all* stack variables must be deferred,
1724 so that we can re-order the strings to the top of the frame.
1725 Similarly for Address Sanitizer. */
1726 if (flag_stack_protect || asan_sanitize_stack_p ())
1727 return true;
1729 unsigned int align = TREE_CODE (var) == SSA_NAME
1730 ? TYPE_ALIGN (TREE_TYPE (var))
1731 : DECL_ALIGN (var);
1733 /* We handle "large" alignment via dynamic allocation. We want to handle
1734 this extra complication in only one place, so defer them. */
1735 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1736 return true;
1738 bool ignored = TREE_CODE (var) == SSA_NAME
1739 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1740 : DECL_IGNORED_P (var);
1742 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1743 might be detached from their block and appear at toplevel when we reach
1744 here. We want to coalesce them with variables from other blocks when
1745 the immediate contribution to the frame size would be noticeable. */
1746 if (toplevel && optimize > 0 && ignored && !smallish)
1747 return true;
1749 /* Variables declared in the outermost scope automatically conflict
1750 with every other variable. The only reason to want to defer them
1751 at all is that, after sorting, we can more efficiently pack
1752 small variables in the stack frame. Continue to defer at -O2. */
1753 if (toplevel && optimize < 2)
1754 return false;
1756 /* Without optimization, *most* variables are allocated from the
1757 stack, which makes the quadratic problem large exactly when we
1758 want compilation to proceed as quickly as possible. On the
1759 other hand, we don't want the function's stack frame size to
1760 get completely out of hand. So we avoid adding scalars and
1761 "small" aggregates to the list at all. */
1762 if (optimize == 0 && smallish)
1763 return false;
1765 return true;
1768 /* A subroutine of expand_used_vars. Expand one variable according to
1769 its flavor. Variables to be placed on the stack are not actually
1770 expanded yet, merely recorded.
1771 When REALLY_EXPAND is false, only add stack values to be allocated.
1772 Return stack usage this variable is supposed to take.
1775 static poly_uint64
1776 expand_one_var (tree var, bool toplevel, bool really_expand,
1777 bitmap forced_stack_var = NULL)
1779 unsigned int align = BITS_PER_UNIT;
1780 tree origvar = var;
1782 var = SSAVAR (var);
1784 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1786 if (is_global_var (var))
1787 return 0;
1789 /* Because we don't know if VAR will be in register or on stack,
1790 we conservatively assume it will be on stack even if VAR is
1791 eventually put into register after RA pass. For non-automatic
1792 variables, which won't be on stack, we collect alignment of
1793 type and ignore user specified alignment. Similarly for
1794 SSA_NAMEs for which use_register_for_decl returns true. */
1795 if (TREE_STATIC (var)
1796 || DECL_EXTERNAL (var)
1797 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1798 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1799 TYPE_MODE (TREE_TYPE (var)),
1800 TYPE_ALIGN (TREE_TYPE (var)));
1801 else if (DECL_HAS_VALUE_EXPR_P (var)
1802 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1803 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1804 or variables which were assigned a stack slot already by
1805 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1806 changed from the offset chosen to it. */
1807 align = crtl->stack_alignment_estimated;
1808 else
1809 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1811 /* If the variable alignment is very large we'll dynamicaly allocate
1812 it, which means that in-frame portion is just a pointer. */
1813 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1814 align = GET_MODE_ALIGNMENT (Pmode);
1817 record_alignment_for_reg_var (align);
1819 poly_uint64 size;
1820 if (TREE_CODE (origvar) == SSA_NAME)
1822 gcc_assert (!VAR_P (var)
1823 || (!DECL_EXTERNAL (var)
1824 && !DECL_HAS_VALUE_EXPR_P (var)
1825 && !TREE_STATIC (var)
1826 && TREE_TYPE (var) != error_mark_node
1827 && !DECL_HARD_REGISTER (var)
1828 && really_expand));
1830 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1832 else if (DECL_EXTERNAL (var))
1834 else if (DECL_HAS_VALUE_EXPR_P (var))
1836 else if (TREE_STATIC (var))
1838 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1840 else if (TREE_TYPE (var) == error_mark_node)
1842 if (really_expand)
1843 expand_one_error_var (var);
1845 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1847 if (really_expand)
1849 expand_one_hard_reg_var (var);
1850 if (!DECL_HARD_REGISTER (var))
1851 /* Invalid register specification. */
1852 expand_one_error_var (var);
1855 else if (use_register_for_decl (var)
1856 && (!forced_stack_var
1857 || !bitmap_bit_p (forced_stack_var, DECL_UID (var))))
1859 if (really_expand)
1860 expand_one_register_var (origvar);
1862 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1863 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1865 /* Reject variables which cover more than half of the address-space. */
1866 if (really_expand)
1868 if (DECL_NONLOCAL_FRAME (var))
1869 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1870 "total size of local objects is too large");
1871 else
1872 error_at (DECL_SOURCE_LOCATION (var),
1873 "size of variable %q+D is too large", var);
1874 expand_one_error_var (var);
1877 else if (defer_stack_allocation (var, toplevel))
1878 add_stack_var (origvar, really_expand);
1879 else
1881 if (really_expand)
1883 if (lookup_attribute ("naked",
1884 DECL_ATTRIBUTES (current_function_decl)))
1885 error ("cannot allocate stack for variable %q+D, naked function",
1886 var);
1888 expand_one_stack_var (origvar);
1890 return size;
1892 return 0;
1895 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1896 expanding variables. Those variables that can be put into registers
1897 are allocated pseudos; those that can't are put on the stack.
1899 TOPLEVEL is true if this is the outermost BLOCK. */
1901 static void
1902 expand_used_vars_for_block (tree block, bool toplevel, bitmap forced_stack_vars)
1904 tree t;
1906 /* Expand all variables at this level. */
1907 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1908 if (TREE_USED (t)
1909 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1910 || !DECL_NONSHAREABLE (t)))
1911 expand_one_var (t, toplevel, true, forced_stack_vars);
1913 /* Expand all variables at containing levels. */
1914 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1915 expand_used_vars_for_block (t, false, forced_stack_vars);
1918 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1919 and clear TREE_USED on all local variables. */
1921 static void
1922 clear_tree_used (tree block)
1924 tree t;
1926 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1927 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1928 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1929 || !DECL_NONSHAREABLE (t))
1930 TREE_USED (t) = 0;
1932 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1933 clear_tree_used (t);
1936 /* Examine TYPE and determine a bit mask of the following features. */
1938 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1939 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1940 #define SPCT_HAS_ARRAY 4
1941 #define SPCT_HAS_AGGREGATE 8
1943 static unsigned int
1944 stack_protect_classify_type (tree type)
1946 unsigned int ret = 0;
1947 tree t;
1949 switch (TREE_CODE (type))
1951 case ARRAY_TYPE:
1952 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1953 if (t == char_type_node
1954 || t == signed_char_type_node
1955 || t == unsigned_char_type_node)
1957 unsigned HOST_WIDE_INT max = param_ssp_buffer_size;
1958 unsigned HOST_WIDE_INT len;
1960 if (!TYPE_SIZE_UNIT (type)
1961 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1962 len = max;
1963 else
1964 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1966 if (len < max)
1967 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1968 else
1969 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1971 else
1972 ret = SPCT_HAS_ARRAY;
1973 break;
1975 case UNION_TYPE:
1976 case QUAL_UNION_TYPE:
1977 case RECORD_TYPE:
1978 ret = SPCT_HAS_AGGREGATE;
1979 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1980 if (TREE_CODE (t) == FIELD_DECL)
1981 ret |= stack_protect_classify_type (TREE_TYPE (t));
1982 break;
1984 default:
1985 break;
1988 return ret;
1991 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1992 part of the local stack frame. Remember if we ever return nonzero for
1993 any variable in this function. The return value is the phase number in
1994 which the variable should be allocated. */
1996 static int
1997 stack_protect_decl_phase (tree decl)
1999 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
2000 int ret = 0;
2002 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
2003 has_short_buffer = true;
2005 tree attribs = DECL_ATTRIBUTES (current_function_decl);
2006 if (!lookup_attribute ("no_stack_protector", attribs)
2007 && (flag_stack_protect == SPCT_FLAG_ALL
2008 || flag_stack_protect == SPCT_FLAG_STRONG
2009 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2010 && lookup_attribute ("stack_protect", attribs))))
2012 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
2013 && !(bits & SPCT_HAS_AGGREGATE))
2014 ret = 1;
2015 else if (bits & SPCT_HAS_ARRAY)
2016 ret = 2;
2018 else
2019 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
2021 if (ret)
2022 has_protected_decls = true;
2024 return ret;
2027 /* Two helper routines that check for phase 1 and phase 2. These are used
2028 as callbacks for expand_stack_vars. */
2030 static bool
2031 stack_protect_decl_phase_1 (size_t i)
2033 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
2036 static bool
2037 stack_protect_decl_phase_2 (size_t i)
2039 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
2042 /* And helper function that checks for asan phase (with stack protector
2043 it is phase 3). This is used as callback for expand_stack_vars.
2044 Returns true if any of the vars in the partition need to be protected. */
2046 static bool
2047 asan_decl_phase_3 (size_t i)
2049 while (i != EOC)
2051 if (asan_protect_stack_decl (stack_vars[i].decl))
2052 return true;
2053 i = stack_vars[i].next;
2055 return false;
2058 /* Ensure that variables in different stack protection phases conflict
2059 so that they are not merged and share the same stack slot.
2060 Return true if there are any address taken variables. */
2062 static bool
2063 add_stack_protection_conflicts (void)
2065 size_t i, j, n = stack_vars_num;
2066 unsigned char *phase;
2067 bool ret = false;
2069 phase = XNEWVEC (unsigned char, n);
2070 for (i = 0; i < n; ++i)
2072 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
2073 if (TREE_ADDRESSABLE (stack_vars[i].decl))
2074 ret = true;
2077 for (i = 0; i < n; ++i)
2079 unsigned char ph_i = phase[i];
2080 for (j = i + 1; j < n; ++j)
2081 if (ph_i != phase[j])
2082 add_stack_var_conflict (i, j);
2085 XDELETEVEC (phase);
2086 return ret;
2089 /* Create a decl for the guard at the top of the stack frame. */
2091 static void
2092 create_stack_guard (void)
2094 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
2095 VAR_DECL, NULL, ptr_type_node);
2096 TREE_THIS_VOLATILE (guard) = 1;
2097 TREE_USED (guard) = 1;
2098 expand_one_stack_var (guard);
2099 crtl->stack_protect_guard = guard;
2102 /* Prepare for expanding variables. */
2103 static void
2104 init_vars_expansion (void)
2106 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
2107 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
2109 /* A map from decl to stack partition. */
2110 decl_to_stack_part = new hash_map<tree, size_t>;
2112 /* Initialize local stack smashing state. */
2113 has_protected_decls = false;
2114 has_short_buffer = false;
2115 if (hwasan_sanitize_stack_p ())
2116 hwasan_record_frame_init ();
2119 /* Free up stack variable graph data. */
2120 static void
2121 fini_vars_expansion (void)
2123 bitmap_obstack_release (&stack_var_bitmap_obstack);
2124 if (stack_vars)
2125 XDELETEVEC (stack_vars);
2126 if (stack_vars_sorted)
2127 XDELETEVEC (stack_vars_sorted);
2128 stack_vars = NULL;
2129 stack_vars_sorted = NULL;
2130 stack_vars_alloc = stack_vars_num = 0;
2131 delete decl_to_stack_part;
2132 decl_to_stack_part = NULL;
2135 /* Make a fair guess for the size of the stack frame of the function
2136 in NODE. This doesn't have to be exact, the result is only used in
2137 the inline heuristics. So we don't want to run the full stack var
2138 packing algorithm (which is quadratic in the number of stack vars).
2139 Instead, we calculate the total size of all stack vars. This turns
2140 out to be a pretty fair estimate -- packing of stack vars doesn't
2141 happen very often. */
2143 HOST_WIDE_INT
2144 estimated_stack_frame_size (struct cgraph_node *node)
2146 poly_int64 size = 0;
2147 size_t i;
2148 tree var;
2149 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2151 push_cfun (fn);
2153 init_vars_expansion ();
2155 FOR_EACH_LOCAL_DECL (fn, i, var)
2156 if (auto_var_in_fn_p (var, fn->decl))
2157 size += expand_one_var (var, true, false);
2159 if (stack_vars_num > 0)
2161 /* Fake sorting the stack vars for account_stack_vars (). */
2162 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
2163 for (i = 0; i < stack_vars_num; ++i)
2164 stack_vars_sorted[i] = i;
2165 size += account_stack_vars ();
2168 fini_vars_expansion ();
2169 pop_cfun ();
2170 return estimated_poly_value (size);
2173 /* Check if the current function has calls that use a return slot. */
2175 static bool
2176 stack_protect_return_slot_p ()
2178 basic_block bb;
2180 FOR_ALL_BB_FN (bb, cfun)
2181 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2182 !gsi_end_p (gsi); gsi_next (&gsi))
2184 gimple *stmt = gsi_stmt (gsi);
2185 /* This assumes that calls to internal-only functions never
2186 use a return slot. */
2187 if (is_gimple_call (stmt)
2188 && !gimple_call_internal_p (stmt)
2189 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2190 gimple_call_fndecl (stmt)))
2191 return true;
2193 return false;
2196 /* Expand all variables used in the function. */
/* FORCED_STACK_VARS is passed through unchanged to expand_one_var and
   expand_used_vars_for_block.  The return value is VAR_END_SEQ, which
   starts out NULL and is only set by the asan/hwasan helpers called
   near the end of the function.  */
2198 static rtx_insn *
2199 expand_used_vars (bitmap forced_stack_vars)
2201 tree var, outer_block = DECL_INITIAL (current_function_decl);
2202 auto_vec<tree> maybe_local_decls;
2203 rtx_insn *var_end_seq = NULL;
2204 unsigned i;
2205 unsigned len;
2206 bool gen_stack_protect_signal = false;
2208 /* Compute the phase of the stack frame for this function. */
2210 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2211 int off = targetm.starting_frame_offset () % align;
2212 frame_phase = off ? align - off : 0;
2215 /* Set TREE_USED on all variables in the local_decls. */
2216 FOR_EACH_LOCAL_DECL (cfun, i, var)
2217 TREE_USED (var) = 1;
2218 /* Clear TREE_USED on all variables associated with a block scope. */
2219 clear_tree_used (DECL_INITIAL (current_function_decl));
2221 init_vars_expansion ();
2223 if (targetm.use_pseudo_pic_reg ())
2224 pic_offset_table_rtx = gen_reg_rtx (Pmode);
/* Expand every SSA partition except those flagged in
   SA.partitions_for_parm_default_defs.  */
2226 for (i = 0; i < SA.map->num_partitions; i++)
2228 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2229 continue;
2231 tree var = partition_to_var (SA.map, i);
2233 gcc_assert (!virtual_operand_p (var));
2235 expand_one_ssa_partition (var);
2238 if (flag_stack_protect == SPCT_FLAG_STRONG)
2239 gen_stack_protect_signal = stack_protect_return_slot_p ();
2241 /* At this point all variables on the local_decls with TREE_USED
2242 set are not associated with any block scope. Lay them out. */
/* LEN records how many decls are on the list before the loop below
   adds to it via add_local_decl; it is the count handed to
   block_remove afterwards.  */
2244 len = vec_safe_length (cfun->local_decls);
2245 FOR_EACH_LOCAL_DECL (cfun, i, var)
2247 bool expand_now = false;
2249 /* Expanded above already. */
2250 if (is_gimple_reg (var))
2252 TREE_USED (var) = 0;
2253 goto next;
2255 /* We didn't set a block for static or extern because it's hard
2256 to tell the difference between a global variable (re)declared
2257 in a local scope, and one that's really declared there to
2258 begin with. And it doesn't really matter much, since we're
2259 not giving them stack space. Expand them now. */
2260 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2261 expand_now = true;
2263 /* Expand variables not associated with any block now. Those created by
2264 the optimizers could be live anywhere in the function. Those that
2265 could possibly have been scoped originally and detached from their
2266 block will have their allocation deferred so we coalesce them with
2267 others when optimization is enabled. */
2268 else if (TREE_USED (var))
2269 expand_now = true;
2271 /* Finally, mark all variables on the list as used. We'll use
2272 this in a moment when we expand those associated with scopes. */
2273 TREE_USED (var) = 1;
2275 if (expand_now)
2276 expand_one_var (var, true, true, forced_stack_vars);
2278 next:
2279 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2281 rtx rtl = DECL_RTL_IF_SET (var);
2283 /* Keep artificial non-ignored vars in cfun->local_decls
2284 chain until instantiate_decls. */
2285 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2286 add_local_decl (cfun, var);
2287 else if (rtl == NULL_RTX)
2288 /* If rtl isn't set yet, which can happen e.g. with
2289 -fstack-protector, retry before returning from this
2290 function. */
2291 maybe_local_decls.safe_push (var);
2295 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2297 +-----------------+-----------------+
2298 | ...processed... | ...duplicates...|
2299 +-----------------+-----------------+
2301 +-- LEN points here.
2303 We just want the duplicates, as those are the artificial
2304 non-ignored vars that we want to keep until instantiate_decls.
2305 Move them down and truncate the array. */
2306 if (!vec_safe_is_empty (cfun->local_decls))
2307 cfun->local_decls->block_remove (0, len);
2309 /* At this point, all variables within the block tree with TREE_USED
2310 set are actually used by the optimized function. Lay them out. */
2311 expand_used_vars_for_block (outer_block, true, forced_stack_vars);
2313 tree attribs = DECL_ATTRIBUTES (current_function_decl);
2314 if (stack_vars_num > 0)
2316 bool has_addressable_vars = false;
2318 add_scope_conflicts ();
2320 /* If stack protection is enabled, we don't share space between
2321 vulnerable data and non-vulnerable data. */
2322 if (flag_stack_protect != 0
2323 && !lookup_attribute ("no_stack_protector", attribs)
2324 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2325 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2326 && lookup_attribute ("stack_protect", attribs))))
2327 has_addressable_vars = add_stack_protection_conflicts ();
2329 if (flag_stack_protect == SPCT_FLAG_STRONG && has_addressable_vars)
2330 gen_stack_protect_signal = true;
2332 /* Now that we have collected all stack variables, and have computed a
2333 minimal interference graph, attempt to save some stack space. */
2334 partition_stack_vars ();
2335 if (dump_file)
2336 dump_stack_var_partition ();
/* Decide whether to create the stack guard, based on the
   flag_stack_protect mode and the function's attributes.  */
2340 if (!lookup_attribute ("no_stack_protector", attribs))
2341 switch (flag_stack_protect)
2343 case SPCT_FLAG_ALL:
2344 create_stack_guard ();
2345 break;
2347 case SPCT_FLAG_STRONG:
2348 if (gen_stack_protect_signal
2349 || cfun->calls_alloca
2350 || has_protected_decls
2351 || lookup_attribute ("stack_protect", attribs))
2352 create_stack_guard ();
2353 break;
2355 case SPCT_FLAG_DEFAULT:
2356 if (cfun->calls_alloca
2357 || has_protected_decls
2358 || lookup_attribute ("stack_protect", attribs))
2359 create_stack_guard ();
2360 break;
2362 case SPCT_FLAG_EXPLICIT:
2363 if (lookup_attribute ("stack_protect", attribs))
2364 create_stack_guard ();
2365 break;
2367 default:
2368 break;
2371 /* Assign rtl to each variable based on these partitions. */
2372 if (stack_vars_num > 0)
2374 class stack_vars_data data;
2376 data.asan_base = NULL_RTX;
2377 data.asan_alignb = 0;
2379 /* Reorder decls to be protected by iterating over the variables
2380 array multiple times, and allocating out of each phase in turn. */
2381 /* ??? We could probably integrate this into the qsort we did
2382 earlier, such that we naturally see these variables first,
2383 and thus naturally allocate things in the right order. */
2384 if (has_protected_decls)
2386 /* Phase 1 contains only character arrays. */
2387 expand_stack_vars (stack_protect_decl_phase_1, &data);
2389 /* Phase 2 contains other kinds of arrays. */
2390 if (!lookup_attribute ("no_stack_protector", attribs)
2391 && (flag_stack_protect == SPCT_FLAG_ALL
2392 || flag_stack_protect == SPCT_FLAG_STRONG
2393 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2394 && lookup_attribute ("stack_protect", attribs))))
2395 expand_stack_vars (stack_protect_decl_phase_2, &data);
2398 if (asan_sanitize_stack_p ())
2399 /* Phase 3, any partitions that need asan protection
2400 in addition to phase 1 and 2. */
2401 expand_stack_vars (asan_decl_phase_3, &data);
2403 /* ASAN description strings don't yet have a syntax for expressing
2404 polynomial offsets. */
2405 HOST_WIDE_INT prev_offset;
2406 if (!data.asan_vec.is_empty ()
2407 && frame_offset.is_constant (&prev_offset))
2409 HOST_WIDE_INT offset, sz, redzonesz;
2410 redzonesz = ASAN_RED_ZONE_SIZE;
2411 sz = data.asan_vec[0] - prev_offset;
2412 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2413 && data.asan_alignb <= 4096
2414 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2415 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2416 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2417 /* Allocating a constant amount of space from a constant
2418 starting offset must give a constant result. */
2419 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2420 .to_constant ());
2421 data.asan_vec.safe_push (prev_offset);
2422 data.asan_vec.safe_push (offset);
2423 /* Leave space for alignment if STRICT_ALIGNMENT. */
2424 if (STRICT_ALIGNMENT)
2425 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2426 << ASAN_SHADOW_SHIFT)
2427 / BITS_PER_UNIT, 1);
2429 var_end_seq
2430 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2431 data.asan_base,
2432 data.asan_alignb,
2433 data.asan_vec.address (),
2434 data.asan_decl_vec.address (),
2435 data.asan_vec.length ());
/* A NULL predicate is passed for the final call -- presumably this
   expands whatever the earlier phases did not pick; confirm against
   expand_stack_vars.  */
2438 expand_stack_vars (NULL, &data);
2441 if (hwasan_sanitize_stack_p ())
2442 hwasan_emit_prologue ();
2443 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2444 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2445 virtual_stack_vars_rtx,
2446 var_end_seq);
2447 else if (hwasan_sanitize_allocas_p () && cfun->calls_alloca)
2448 /* When using out-of-line instrumentation we only want to emit one function
2449 call for clearing the tags in a region of shadow stack. When there are
2450 alloca calls in this frame we want to emit a call using the
2451 virtual_stack_dynamic_rtx, but when not we use the hwasan_frame_extent
2452 rtx we created in expand_stack_vars. */
2453 var_end_seq = hwasan_emit_untag_frame (virtual_stack_dynamic_rtx,
2454 virtual_stack_vars_rtx);
2455 else if (hwasan_sanitize_stack_p ())
2456 /* If no variables were stored on the stack, `hwasan_get_frame_extent`
2457 will return NULL_RTX and hence `hwasan_emit_untag_frame` will return
2458 NULL (i.e. an empty sequence). */
2459 var_end_seq = hwasan_emit_untag_frame (hwasan_get_frame_extent (),
2460 virtual_stack_vars_rtx);
2462 fini_vars_expansion ();
2464 /* If there were any artificial non-ignored vars without rtl
2465 found earlier, see if deferred stack allocation hasn't assigned
2466 rtl to them. */
2467 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2469 rtx rtl = DECL_RTL_IF_SET (var);
2471 /* Keep artificial non-ignored vars in cfun->local_decls
2472 chain until instantiate_decls. */
2473 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2474 add_local_decl (cfun, var);
2477 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2478 if (STACK_ALIGNMENT_NEEDED)
2480 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2481 if (FRAME_GROWS_DOWNWARD)
2482 frame_offset = aligned_lower_bound (frame_offset, align);
2483 else
2484 frame_offset = aligned_upper_bound (frame_offset, align);
2487 return var_end_seq;
2491 /* If we need to produce a detailed dump, print the tree representation
2492 for STMT to the dump file. SINCE is the last RTX after which the RTL
2493 generated for STMT should have been appended. */
2495 static void
2496 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2498 if (dump_file && (dump_flags & TDF_DETAILS))
2500 fprintf (dump_file, "\n;; ");
2501 print_gimple_stmt (dump_file, stmt, 0,
2502 TDF_SLIM | (dump_flags & TDF_LINENO));
2503 fprintf (dump_file, "\n");
2505 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2509 /* Maps the blocks that do not contain tree labels to rtx labels. */
/* label_rtx_for_bb looks blocks up here and adds an entry the first
   time it has to generate a fresh label for a block.  */
2511 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2513 /* Returns the label_rtx expression for a label starting basic block BB. */
2515 static rtx_code_label *
2516 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2518 if (bb->flags & BB_RTL)
2519 return block_label (bb);
2521 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2522 if (elt)
2523 return *elt;
2525 /* Find the tree label if it is present. */
2526 gimple_stmt_iterator gsi = gsi_start_bb (bb);
2527 glabel *lab_stmt;
2528 if (!gsi_end_p (gsi)
2529 && (lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi)))
2530 && !DECL_NONLOCAL (gimple_label_label (lab_stmt)))
2531 return jump_target_rtx (gimple_label_label (lab_stmt));
2533 rtx_code_label *l = gen_label_rtx ();
2534 lab_rtx_for_bb->put (bb, l);
2535 return l;
2539 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2540 of a basic block where we just expanded the conditional at the end,
2541 possibly clean up the CFG and instruction sequence. LAST is the
2542 last instruction before the just emitted jump sequence. */
/* Nothing is done unless the last emitted insn is a barrier.  */
2544 static void
2545 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2547 /* Special case: when jumpif decides that the condition is
2548 trivial it emits an unconditional jump (and the necessary
2549 barrier). But we still have two edges, the fallthru one is
2550 wrong. purge_dead_edges would clean this up later. Unfortunately
2551 we have to insert insns (and split edges) before
2552 find_many_sub_basic_blocks and hence before purge_dead_edges.
2553 But splitting edges might create new blocks which depend on the
2554 fact that if there are two edges there's no barrier. So the
2555 barrier would get lost and verify_flow_info would ICE. Instead
2556 of auditing all edge splitters to care for the barrier (which
2557 normally isn't there in a cleaned CFG), fix it here. */
2558 if (BARRIER_P (get_last_insn ()))
2560 rtx_insn *insn;
2561 remove_edge (e);
2562 /* Now, we have a single successor block, if we have insns to
2563 insert on the remaining edge we potentially will insert
2564 it at the end of this block (if the dest block isn't feasible)
2565 in order to avoid splitting the edge. This insertion will take
2566 place in front of the last jump. But we might have emitted
2567 multiple jumps (conditional and one unconditional) to the
2568 same destination. Inserting in front of the last one then
2569 is a problem. See PR 40021. We fix this by deleting all
2570 jumps except the last unconditional one. */
2571 insn = PREV_INSN (get_last_insn ());
2572 /* Make sure we have an unconditional jump. Otherwise we're
2573 confused. */
2574 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
/* Walk backwards towards LAST.  INSN is stepped back first and the
   insn following it is the one examined, so the deletions below never
   remove the cursor itself.  */
2575 for (insn = PREV_INSN (insn); insn != last;)
2577 insn = PREV_INSN (insn);
2578 if (JUMP_P (NEXT_INSN (insn)))
2580 if (!any_condjump_p (NEXT_INSN (insn)))
/* A jump that is not conditional is expected to be followed by a
   barrier; delete that barrier before the jump itself.  */
2582 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2583 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2585 delete_insn (NEXT_INSN (insn));
2591 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2592 Returns a new basic block if we've terminated the current basic
2593 block and created a new one. */
/* BB is the block ending in STMT.  NULL is returned when one of the
   two successors is BB->next_bb and can simply fall through.  */
2595 static basic_block
2596 expand_gimple_cond (basic_block bb, gcond *stmt)
2598 basic_block new_bb, dest;
2599 edge true_edge;
2600 edge false_edge;
2601 rtx_insn *last2, *last;
2602 enum tree_code code;
2603 tree op0, op1;
2605 code = gimple_cond_code (stmt);
2606 op0 = gimple_cond_lhs (stmt);
2607 op1 = gimple_cond_rhs (stmt);
2608 /* We're sometimes presented with such code:
2609 D.123_1 = x < y;
2610 if (D.123_1 != 0)
2612 This would expand to two comparisons which then later might
2613 be cleaned up by combine. But some pattern matchers like if-conversion
2614 work better when there's only one compare, so make up for this
2615 here as special exception if TER would have made the same change. */
2616 if (SA.values
2617 && TREE_CODE (op0) == SSA_NAME
2618 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2619 && TREE_CODE (op1) == INTEGER_CST
2620 && ((gimple_cond_code (stmt) == NE_EXPR
2621 && integer_zerop (op1))
2622 || (gimple_cond_code (stmt) == EQ_EXPR
2623 && integer_onep (op1)))
2624 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2626 gimple *second = SSA_NAME_DEF_STMT (op0);
2627 if (gimple_code (second) == GIMPLE_ASSIGN)
2629 enum tree_code code2 = gimple_assign_rhs_code (second);
2630 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2632 code = code2;
2633 op0 = gimple_assign_rhs1 (second);
2634 op1 = gimple_assign_rhs2 (second);
2636 /* If jumps are cheap and the target does not support conditional
2637 compare, turn some more codes into jumpy sequences. */
2638 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2639 && targetm.gen_ccmp_first == NULL)
2641 if ((code2 == BIT_AND_EXPR
2642 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2643 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2644 || code2 == TRUTH_AND_EXPR)
2646 code = TRUTH_ANDIF_EXPR;
2647 op0 = gimple_assign_rhs1 (second);
2648 op1 = gimple_assign_rhs2 (second);
2650 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2652 code = TRUTH_ORIF_EXPR;
2653 op0 = gimple_assign_rhs1 (second);
2654 op1 = gimple_assign_rhs2 (second);
2660 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2661 into (x - C2) * C3 < C4. */
2662 if ((code == EQ_EXPR || code == NE_EXPR)
2663 && TREE_CODE (op0) == SSA_NAME
2664 && TREE_CODE (op1) == INTEGER_CST)
2665 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2667 /* Optimize (x - y) < 0 into x < y if x - y has undefined overflow. */
2668 if (!TYPE_UNSIGNED (TREE_TYPE (op0))
2669 && (code == LT_EXPR || code == LE_EXPR
2670 || code == GT_EXPR || code == GE_EXPR)
2671 && integer_zerop (op1)
2672 && TREE_CODE (op0) == SSA_NAME)
2673 maybe_optimize_sub_cmp_0 (code, &op0, &op1);
/* LAST2 keeps the insn that preceded everything emitted for STMT; it
   is only used for the dump on the two-way path, where LAST is
   reassigned.  */
2675 last2 = last = get_last_insn ();
2677 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2678 set_curr_insn_location (gimple_location (stmt));
2680 /* These flags have no purpose in RTL land. */
2681 true_edge->flags &= ~EDGE_TRUE_VALUE;
2682 false_edge->flags &= ~EDGE_FALSE_VALUE;
2684 /* We can either have a pure conditional jump with one fallthru edge or
2685 two-way jump that needs to be decomposed into two basic blocks. */
2686 if (false_edge->dest == bb->next_bb)
2688 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2689 true_edge->probability);
2690 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2691 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2692 set_curr_insn_location (true_edge->goto_locus);
2693 false_edge->flags |= EDGE_FALLTHRU;
2694 maybe_cleanup_end_of_block (false_edge, last);
2695 return NULL;
2697 if (true_edge->dest == bb->next_bb)
2699 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2700 false_edge->probability);
2701 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2702 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2703 set_curr_insn_location (false_edge->goto_locus);
2704 true_edge->flags |= EDGE_FALLTHRU;
2705 maybe_cleanup_end_of_block (true_edge, last);
2706 return NULL;
/* Neither successor is the next block.  Emit a conditional jump to
   the true destination followed by an unconditional jump to the false
   destination, then split the unconditional jump off into NEW_BB.  */
2709 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2710 true_edge->probability);
2711 last = get_last_insn ();
2712 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2713 set_curr_insn_location (false_edge->goto_locus);
2714 emit_jump (label_rtx_for_bb (false_edge->dest));
2716 BB_END (bb) = last;
2717 if (BARRIER_P (BB_END (bb)))
2718 BB_END (bb) = PREV_INSN (BB_END (bb));
2719 update_bb_for_insn (bb);
2721 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2722 dest = false_edge->dest;
2723 redirect_edge_succ (false_edge, new_bb);
2724 false_edge->flags |= EDGE_FALLTHRU;
2725 new_bb->count = false_edge->count ();
2726 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2727 add_bb_to_loop (new_bb, loop);
/* If BB was LOOP's latch and DEST its header, NEW_BB becomes the
   latch.  */
2728 if (loop->latch == bb
2729 && loop->header == dest)
2730 loop->latch = new_bb;
2731 make_single_succ_edge (new_bb, dest, 0);
2732 if (BARRIER_P (BB_END (new_bb)))
2733 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2734 update_bb_for_insn (new_bb);
2736 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2738 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2740 set_curr_insn_location (true_edge->goto_locus);
2741 true_edge->goto_locus = curr_insn_location ();
2744 return new_bb;
2747 /* Mark all calls that can have a transaction restart. */
2749 static void
2750 mark_transaction_restart_calls (gimple *stmt)
2752 struct tm_restart_node dummy;
2753 tm_restart_node **slot;
2755 if (!cfun->gimple_df->tm_restart)
2756 return;
2758 dummy.stmt = stmt;
2759 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2760 if (slot)
2762 struct tm_restart_node *n = *slot;
2763 tree list = n->label_or_list;
2764 rtx_insn *insn;
2766 for (insn = next_real_insn (get_last_insn ());
2767 !CALL_P (insn);
2768 insn = next_real_insn (insn))
2769 continue;
2771 if (TREE_CODE (list) == LABEL_DECL)
2772 add_reg_note (insn, REG_TM, label_rtx (list));
2773 else
2774 for (; list ; list = TREE_CHAIN (list))
2775 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2779 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2780 statement STMT. */
/* Internal calls are handed to expand_internal_call.  Everything else
   is rebuilt as a CALL_EXPR tree that mirrors STMT's flags and is then
   expanded through expand_assignment or expand_expr.  */
2782 static void
2783 expand_call_stmt (gcall *stmt)
2785 tree exp, decl, lhs;
2786 bool builtin_p;
2787 size_t i;
2789 if (gimple_call_internal_p (stmt))
2791 expand_internal_call (stmt);
2792 return;
2795 /* If this is a call to a built-in function and it has no effect other
2796 than setting the lhs, try to implement it using an internal function
2797 instead. */
2798 decl = gimple_call_fndecl (stmt);
2799 if (gimple_call_lhs (stmt)
2800 && !gimple_has_side_effects (stmt)
2801 && (optimize || (decl && called_as_built_in (decl))))
2803 internal_fn ifn = replacement_internal_fn (stmt);
2804 if (ifn != IFN_LAST)
2806 expand_internal_call (ifn, stmt);
2807 return;
/* NOTE(review): the "+ 3" presumably covers the fixed CALL_EXPR
   operands that precede the arguments -- confirm against tree.def.  */
2811 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2813 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2814 builtin_p = decl && fndecl_built_in_p (decl);
2816 /* If this is not a builtin function, the function type through which the
2817 call is made may be different from the type of the function. */
2818 if (!builtin_p)
2819 CALL_EXPR_FN (exp)
2820 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2821 CALL_EXPR_FN (exp));
2823 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2824 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2826 for (i = 0; i < gimple_call_num_args (stmt); i++)
2828 tree arg = gimple_call_arg (stmt, i);
2829 gimple *def;
2830 /* TER addresses into arguments of builtin functions so we have a
2831 chance to infer more correct alignment information. See PR39954. */
2832 if (builtin_p
2833 && TREE_CODE (arg) == SSA_NAME
2834 && (def = get_gimple_for_ssa_name (arg))
2835 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2836 arg = gimple_assign_rhs1 (def);
2837 CALL_EXPR_ARG (exp, i) = arg;
2840 if (gimple_has_side_effects (stmt)
2841 /* ??? Downstream in expand_expr_real_1 we assume that expressions
2842 w/o side-effects do not throw so work around this here. */
2843 || stmt_could_throw_p (cfun, stmt))
2844 TREE_SIDE_EFFECTS (exp) = 1;
2846 if (gimple_call_nothrow_p (stmt))
2847 TREE_NOTHROW (exp) = 1;
/* Copy the remaining per-call flags from STMT onto the CALL_EXPR.  */
2849 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2850 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2851 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2852 if (decl
2853 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2854 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2855 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2856 else
2857 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2858 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2859 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2860 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2862 /* Must come after copying location. */
2863 copy_warning (exp, stmt);
2865 /* Ensure RTL is created for debug args. */
2866 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2868 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2869 unsigned int ix;
2870 tree dtemp;
/* Only the odd-indexed elements of the debug args vector are
   visited; each must be a DEBUG_EXPR_DECL.  */
2872 if (debug_args)
2873 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2875 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2876 expand_debug_expr (dtemp);
/* Remember the last insn before the call is expanded so the search
   for the CALL insn further down knows where to stop.  */
2880 rtx_insn *before_call = get_last_insn ();
2881 lhs = gimple_call_lhs (stmt);
2882 if (lhs)
2883 expand_assignment (lhs, exp, false);
2884 else
2885 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2887 /* If the gimple call is an indirect call and has 'nocf_check'
2888 attribute find a generated CALL insn to mark it as no
2889 control-flow verification is needed. */
2890 if (gimple_call_nocf_check_p (stmt)
2891 && !gimple_call_fndecl (stmt))
2893 rtx_insn *last = get_last_insn ();
/* Walk backwards from the last insn to the CALL insn emitted above,
   giving up once BEFORE_CALL is reached.  */
2894 while (!CALL_P (last)
2895 && last != before_call)
2896 last = PREV_INSN (last);
2898 if (last != before_call)
2899 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2902 mark_transaction_restart_calls (stmt);
2906 /* Generate RTL for an asm statement (explicit assembler code).
2907 STRING is a STRING_CST node containing the assembler code text,
2908 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2909 insn is volatile; don't optimize it. */
2911 static void
2912 expand_asm_loc (tree string, int vol, location_t locus)
2914 rtx body;
2916 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2917 ggc_strdup (TREE_STRING_POINTER (string)),
2918 locus);
2920 MEM_VOLATILE_P (body) = vol;
2922 /* Non-empty basic ASM implicitly clobbers memory. */
2923 if (TREE_STRING_LENGTH (string) != 0)
2925 rtx asm_op, clob;
2926 unsigned i, nclobbers;
2927 auto_vec<rtx> input_rvec, output_rvec;
2928 auto_vec<machine_mode> input_mode;
2929 auto_vec<const char *> constraints;
2930 auto_vec<rtx> use_rvec;
2931 auto_vec<rtx> clobber_rvec;
2932 HARD_REG_SET clobbered_regs;
2933 CLEAR_HARD_REG_SET (clobbered_regs);
2935 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2936 clobber_rvec.safe_push (clob);
2938 if (targetm.md_asm_adjust)
2939 targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
2940 constraints, use_rvec, clobber_rvec,
2941 clobbered_regs, locus);
2943 asm_op = body;
2944 nclobbers = clobber_rvec.length ();
2945 auto nuses = use_rvec.length ();
2946 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nuses + nclobbers));
2948 i = 0;
2949 XVECEXP (body, 0, i++) = asm_op;
2950 for (rtx use : use_rvec)
2951 XVECEXP (body, 0, i++) = gen_rtx_USE (VOIDmode, use);
2952 for (rtx clobber : clobber_rvec)
2953 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobber);
2956 emit_insn (body);
/* Count how many characters of the NUL-terminated string S compare
   equal to C.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;

  for (const char *p = s; *p != '\0'; ++p)
    if (*p == c)
      ++count;

  return count;
}
2969 /* A subroutine of expand_asm_operands. Check that all operands have
2970 the same number of alternatives. Return true if so. */
2972 static bool
2973 check_operand_nalternatives (const vec<const char *> &constraints)
2975 unsigned len = constraints.length();
2976 if (len > 0)
2978 int nalternatives = n_occurrences (',', constraints[0]);
2980 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2982 error ("too many alternatives in %<asm%>");
2983 return false;
2986 for (unsigned i = 1; i < len; ++i)
2987 if (n_occurrences (',', constraints[i]) != nalternatives)
2989 error ("operand constraints for %<asm%> differ "
2990 "in number of alternatives");
2991 return false;
2994 return true;
2997 /* Check for overlap between registers marked in CLOBBERED_REGS and
2998 anything inappropriate in T. Emit error and return the register
2999 variable definition for error, NULL_TREE for ok. */
3001 static bool
3002 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs,
3003 location_t loc)
3005 /* Conflicts between asm-declared register variables and the clobber
3006 list are not allowed. */
3007 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
3009 if (overlap)
3011 error_at (loc, "%<asm%> specifier for variable %qE conflicts with "
3012 "%<asm%> clobber list", DECL_NAME (overlap));
3014 /* Reset registerness to stop multiple errors emitted for a single
3015 variable. */
3016 DECL_REGISTER (overlap) = 0;
3017 return true;
3020 return false;
3023 /* Check that the given REGNO spanning NREGS is a valid
3024 asm clobber operand. Some HW registers cannot be
3025 saved/restored, hence they should not be clobbered by
3026 asm statements. */
3027 static bool
3028 asm_clobber_reg_is_valid (int regno, int nregs, const char *regname)
3030 bool is_valid = true;
3031 HARD_REG_SET regset;
3033 CLEAR_HARD_REG_SET (regset);
3035 add_range_to_hard_reg_set (&regset, regno, nregs);
3037 /* Clobbering the PIC register is an error. */
3038 if (PIC_OFFSET_TABLE_REGNUM != INVALID_REGNUM
3039 && overlaps_hard_reg_set_p (regset, Pmode, PIC_OFFSET_TABLE_REGNUM))
3041 /* ??? Diagnose during gimplification? */
3042 error ("PIC register clobbered by %qs in %<asm%>", regname);
3043 is_valid = false;
3045 else if (!in_hard_reg_set_p
3046 (accessible_reg_set, reg_raw_mode[regno], regno))
3048 /* ??? Diagnose during gimplification? */
3049 error ("the register %qs cannot be clobbered in %<asm%>"
3050 " for the current target", regname);
3051 is_valid = false;
3054 /* Clobbering the stack pointer register is deprecated. GCC expects
3055 the value of the stack pointer after an asm statement to be the same
3056 as it was before, so no asm can validly clobber the stack pointer in
3057 the usual sense. Adding the stack pointer to the clobber list has
3058 traditionally had some undocumented and somewhat obscure side-effects. */
3059 if (overlaps_hard_reg_set_p (regset, Pmode, STACK_POINTER_REGNUM))
3061 crtl->sp_is_clobbered_by_asm = true;
3062 if (warning (OPT_Wdeprecated, "listing the stack pointer register"
3063 " %qs in a clobber list is deprecated", regname))
3064 inform (input_location, "the value of the stack pointer after"
3065 " an %<asm%> statement must be the same as it was before"
3066 " the statement");
3069 return is_valid;
3072 /* Generate RTL for the GIMPLE asm statement STMT.
3073 The template, outputs, inputs, clobbers and labels are read from STMT
3074 with the gimple_asm_* accessors.
3075 Each output or input is a list node with the operand expression in
3076 TREE_VALUE and a nested list in TREE_PURPOSE; the constraint string
3077 is the TREE_VALUE of that nested list (its TREE_PURPOSE is presumably
3078 the optional operand name, which this function does not read).
3079 Each clobber is a list node whose TREE_VALUE is a STRING_CST naming
3080 what is clobbered by this insn (normally a hard register).
3082 If STMT has labels (asm goto), labels that live in the fallthru basic
3083 block are replaced by a fresh label emitted right after the asm.
3085 Not all kinds of lvalue that may appear as outputs can be stored directly.
3086 Such outputs are computed into a temporary, and the copy back to the
3087 real lvalue is emitted after the asm (for asm goto, on every outgoing
3088 edge of the block).
3090 If STMT is volatile the resulting ASM_OPERANDS is marked volatile too. */
3092 static void
3093 expand_asm_stmt (gasm *stmt)
3095 class save_input_location
3097 location_t old;
3099 public:
3100 explicit save_input_location(location_t where)
3102 old = input_location;
3103 input_location = where;
3106 ~save_input_location()
3108 input_location = old;
3112 location_t locus = gimple_location (stmt);
3114 if (gimple_asm_input_p (stmt))
3116 const char *s = gimple_asm_string (stmt);
3117 tree string = build_string (strlen (s), s);
3118 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
3119 return;
3122 /* Legacy diagnostics below use input_location; point it at STMT until we return. */
3123 save_input_location s_i_l(locus);
3125 unsigned noutputs = gimple_asm_noutputs (stmt);
3126 unsigned ninputs = gimple_asm_ninputs (stmt);
3127 unsigned nlabels = gimple_asm_nlabels (stmt);
3128 unsigned i;
3129 bool error_seen = false;
3131 /* ??? Diagnose during gimplification? */
3132 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
3134 error_at (locus, "more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
3135 return;
3138 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
3139 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
3140 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
3142 /* Copy the gimple vectors into new vectors that we can manipulate. */
3144 output_tvec.safe_grow (noutputs, true);
3145 input_tvec.safe_grow (ninputs, true);
3146 constraints.safe_grow (noutputs + ninputs, true);
3148 for (i = 0; i < noutputs; ++i)
3150 tree t = gimple_asm_output_op (stmt, i);
3151 output_tvec[i] = TREE_VALUE (t);
3152 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3154 for (i = 0; i < ninputs; i++)
3156 tree t = gimple_asm_input_op (stmt, i);
3157 input_tvec[i] = TREE_VALUE (t);
3158 constraints[i + noutputs]
3159 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3162 /* ??? Diagnose during gimplification? */
3163 if (! check_operand_nalternatives (constraints))
3164 return;
3166 /* Collect the meaningful clobbers, as rtxes in CLOBBER_RVEC and as a
3167 register set in CLOBBERED_REGS, ignoring what we would ignore later. */
3168 auto_vec<rtx> clobber_rvec;
3169 HARD_REG_SET clobbered_regs;
3170 CLEAR_HARD_REG_SET (clobbered_regs);
3172 if (unsigned n = gimple_asm_nclobbers (stmt))
3174 clobber_rvec.reserve (n);
3175 for (i = 0; i < n; i++)
3177 tree t = gimple_asm_clobber_op (stmt, i);
3178 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
3179 int nregs, j;
3181 j = decode_reg_name_and_count (regname, &nregs);
3182 if (j < 0)
3184 if (j == -2)
3186 /* ??? Diagnose during gimplification? */
3187 error_at (locus, "unknown register name %qs in %<asm%>",
3188 regname);
3189 error_seen = true;
3191 else if (j == -4)
3193 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
3194 clobber_rvec.safe_push (x);
3196 else
3198 /* Otherwise we should have -1 == empty string
3199 or -3 == cc, which is not a register. */
3200 gcc_assert (j == -1 || j == -3);
3203 else
3204 for (int reg = j; reg < j + nregs; reg++)
3206 if (!asm_clobber_reg_is_valid (reg, nregs, regname))
3207 return;
3209 SET_HARD_REG_BIT (clobbered_regs, reg);
3210 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
3211 clobber_rvec.safe_push (x);
3216 /* First pass over inputs and outputs checks validity and sets
3217 mark_addressable if needed. */
3218 /* ??? Diagnose during gimplification? */
3220 for (i = 0; i < noutputs; ++i)
3222 tree val = output_tvec[i];
3223 tree type = TREE_TYPE (val);
3224 const char *constraint;
3225 bool is_inout;
3226 bool allows_reg;
3227 bool allows_mem;
3229 /* Try to parse the output constraint. If that fails, there's
3230 no point in going further. */
3231 constraint = constraints[i];
3232 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3233 &allows_mem, &allows_reg, &is_inout))
3234 return;
3236 /* If the output is a hard register, verify it doesn't conflict with
3237 any other operand's possible hard register use. */
3238 if (DECL_P (val)
3239 && REG_P (DECL_RTL (val))
3240 && HARD_REGISTER_P (DECL_RTL (val)))
3242 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3243 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3244 unsigned long match;
3246 /* Verify the other outputs do not use the same hard register. */
3247 for (j = i + 1; j < noutputs; ++j)
3248 if (DECL_P (output_tvec[j])
3249 && REG_P (DECL_RTL (output_tvec[j]))
3250 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3251 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3253 error_at (locus, "invalid hard register usage between output "
3254 "operands");
3255 error_seen = true;
3258 /* Verify matching constraint operands use the same hard register
3259 and that the non-matching constraint operands do not use the same
3260 hard register if the output is an early clobber operand. */
3261 for (j = 0; j < ninputs; ++j)
3262 if (DECL_P (input_tvec[j])
3263 && REG_P (DECL_RTL (input_tvec[j]))
3264 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3266 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
3267 switch (*constraints[j + noutputs])
3269 case '0': case '1': case '2': case '3': case '4':
3270 case '5': case '6': case '7': case '8': case '9':
3271 match = strtoul (constraints[j + noutputs], NULL, 10);
3272 break;
3273 default:
3274 match = ULONG_MAX;
3275 break;
3277 if (i == match
3278 && output_hregno != input_hregno)
3280 error_at (locus, "invalid hard register usage between "
3281 "output operand and matching constraint operand");
3282 error_seen = true;
3284 else if (early_clobber_p
3285 && i != match
3286 && output_hregno == input_hregno)
3288 error_at (locus, "invalid hard register usage between "
3289 "earlyclobber operand and input operand");
3290 error_seen = true;
3295 if (! allows_reg
3296 && (allows_mem
3297 || is_inout
3298 || (DECL_P (val)
3299 && REG_P (DECL_RTL (val))
3300 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3301 mark_addressable (val);
3304 for (i = 0; i < ninputs; ++i)
3306 bool allows_reg, allows_mem;
3307 const char *constraint;
3309 constraint = constraints[i + noutputs];
3310 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3311 constraints.address (),
3312 &allows_mem, &allows_reg))
3313 return;
3315 if (! allows_reg && allows_mem)
3316 mark_addressable (input_tvec[i]);
3319 /* Second pass evaluates arguments: outputs first, then inputs. */
3321 /* Make sure stack is consistent for asm goto. */
3322 if (nlabels > 0)
3323 do_pending_stack_adjust ();
3324 int old_generating_concat_p = generating_concat_p;
3326 /* Vector of RTX's of evaluated output operands. */
3327 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3328 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3329 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3331 output_rvec.safe_grow (noutputs, true);
3333 for (i = 0; i < noutputs; ++i)
3335 tree val = output_tvec[i];
3336 tree type = TREE_TYPE (val);
3337 bool is_inout, allows_reg, allows_mem, ok;
3338 rtx op;
3340 ok = parse_output_constraint (&constraints[i], i, ninputs,
3341 noutputs, &allows_mem, &allows_reg,
3342 &is_inout);
3343 gcc_assert (ok);
3345 /* If an output operand is not a decl or indirect ref and our constraint
3346 allows a register, make a temporary to act as an intermediate.
3347 Make the asm insn write into that, then we will copy it to
3348 the real output operand. Likewise for promoted variables. */
3350 generating_concat_p = 0;
3352 gcc_assert (TREE_CODE (val) != INDIRECT_REF);
3353 if (((TREE_CODE (val) == MEM_REF
3354 && TREE_CODE (TREE_OPERAND (val, 0)) != ADDR_EXPR)
3355 && allows_mem)
3356 || (DECL_P (val)
3357 && (allows_mem || REG_P (DECL_RTL (val)))
3358 && ! (REG_P (DECL_RTL (val))
3359 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3360 || ! allows_reg
3361 || is_inout
3362 || TREE_ADDRESSABLE (type)
3363 || (!tree_fits_poly_int64_p (TYPE_SIZE (type))
3364 && !known_size_p (max_int_size_in_bytes (type))))
3366 op = expand_expr (val, NULL_RTX, VOIDmode,
3367 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3368 if (MEM_P (op))
3369 op = validize_mem (op);
3371 if (! allows_reg && !MEM_P (op))
3373 error_at (locus, "output number %d not directly addressable", i);
3374 error_seen = true;
3376 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3377 || GET_CODE (op) == CONCAT)
3379 rtx old_op = op;
3380 op = gen_reg_rtx (GET_MODE (op));
3382 generating_concat_p = old_generating_concat_p;
3384 if (is_inout)
3385 emit_move_insn (op, old_op);
3387 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3388 emit_move_insn (old_op, op);
3389 after_rtl_seq = get_insns ();
3390 after_rtl_end = get_last_insn ();
3391 end_sequence ();
3394 else
3396 op = assign_temp (type, 0, 1);
3397 op = validize_mem (op);
3398 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3399 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3401 generating_concat_p = old_generating_concat_p;
3403 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3404 expand_assignment (val, make_tree (type, op), false);
3405 after_rtl_seq = get_insns ();
3406 after_rtl_end = get_last_insn ();
3407 end_sequence ();
3409 output_rvec[i] = op;
3411 if (is_inout)
3412 inout_opnum.safe_push (i);
3415 const char *str = gimple_asm_string (stmt);
3416 if (error_seen)
3418 ninputs = 0;
3419 noutputs = 0;
3420 inout_opnum.truncate (0);
3421 output_rvec.truncate (0);
3422 clobber_rvec.truncate (0);
3423 constraints.truncate (0);
3424 CLEAR_HARD_REG_SET (clobbered_regs);
3425 str = "";
3428 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3429 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3431 input_rvec.safe_grow (ninputs, true);
3432 input_mode.safe_grow (ninputs, true);
3434 generating_concat_p = 0;
3436 for (i = 0; i < ninputs; ++i)
3438 tree val = input_tvec[i];
3439 tree type = TREE_TYPE (val);
3440 bool allows_reg, allows_mem, ok;
3441 const char *constraint;
3442 rtx op;
3444 constraint = constraints[i + noutputs];
3445 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3446 constraints.address (),
3447 &allows_mem, &allows_reg);
3448 gcc_assert (ok);
3450 /* EXPAND_INITIALIZER will not generate code for valid initializer
3451 constants, but will still generate code for other types of operand.
3452 This is the behavior we want for constant constraints. */
3453 op = expand_expr (val, NULL_RTX, VOIDmode,
3454 allows_reg ? EXPAND_NORMAL
3455 : allows_mem ? EXPAND_MEMORY
3456 : EXPAND_INITIALIZER);
3458 /* Never pass a CONCAT to an ASM. */
3459 if (GET_CODE (op) == CONCAT)
3460 op = force_reg (GET_MODE (op), op);
3461 else if (MEM_P (op))
3462 op = validize_mem (op);
3464 if (asm_operand_ok (op, constraint, NULL) <= 0)
3466 if (allows_reg && TYPE_MODE (type) != BLKmode)
3467 op = force_reg (TYPE_MODE (type), op);
3468 else if (!allows_mem)
3469 warning_at (locus, 0, "%<asm%> operand %d probably does not match "
3470 "constraints", i + noutputs);
3471 else if (MEM_P (op))
3473 /* We won't recognize either volatile memory or memory
3474 with a queued address as a valid memory_operand
3475 at this point. Ignore it: clearly this *is* a memory. */
3477 else
3478 gcc_unreachable ();
3480 input_rvec[i] = op;
3481 input_mode[i] = TYPE_MODE (type);
3484 /* For in-out operands, push the output rtx as an extra matching input. */
3485 unsigned ninout = inout_opnum.length ();
3486 for (i = 0; i < ninout; i++)
3488 int j = inout_opnum[i];
3489 rtx o = output_rvec[j];
3491 input_rvec.safe_push (o);
3492 input_mode.safe_push (GET_MODE (o));
3494 char buffer[16];
3495 sprintf (buffer, "%d", j);
3496 constraints.safe_push (ggc_strdup (buffer));
3498 ninputs += ninout;
3500 /* Sometimes we wish to automatically clobber registers across an asm.
3501 Case in point is when the i386 backend moved from cc0 to a hard reg --
3502 maintaining source-level compatibility means automatically clobbering
3503 the flags register. */
3504 rtx_insn *after_md_seq = NULL;
3505 auto_vec<rtx> use_rvec;
3506 if (targetm.md_asm_adjust)
3507 after_md_seq
3508 = targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
3509 constraints, use_rvec, clobber_rvec,
3510 clobbered_regs, locus);
3512 /* Do not allow the hook to change the output and input count,
3513 lest it mess up the operand numbering. */
3514 gcc_assert (output_rvec.length() == noutputs);
3515 gcc_assert (input_rvec.length() == ninputs);
3516 gcc_assert (constraints.length() == noutputs + ninputs);
3518 /* But it certainly can adjust the uses and clobbers. */
3519 unsigned nuses = use_rvec.length ();
3520 unsigned nclobbers = clobber_rvec.length ();
3522 /* Third pass checks for easy conflicts. */
3523 /* ??? Why are we doing this on trees instead of rtx. */
3525 bool clobber_conflict_found = 0;
3526 for (i = 0; i < noutputs; ++i)
3527 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs, locus))
3528 clobber_conflict_found = 1;
3529 for (i = 0; i < ninputs - ninout; ++i)
3530 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs, locus))
3531 clobber_conflict_found = 1;
3533 /* Make vectors for the expression-rtx, constraint strings,
3534 and named operands. */
3536 rtvec argvec = rtvec_alloc (ninputs);
3537 rtvec constraintvec = rtvec_alloc (ninputs);
3538 rtvec labelvec = rtvec_alloc (nlabels);
3540 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3541 : GET_MODE (output_rvec[0])),
3542 ggc_strdup (str),
3543 "", 0, argvec, constraintvec,
3544 labelvec, locus);
3545 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3547 for (i = 0; i < ninputs; ++i)
3549 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3550 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3551 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3552 constraints[i + noutputs],
3553 locus);
3556 /* Copy labels to the vector. */
3557 rtx_code_label *fallthru_label = NULL;
3558 if (nlabels > 0)
3560 basic_block fallthru_bb = NULL;
3561 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3562 if (fallthru)
3563 fallthru_bb = fallthru->dest;
3565 for (i = 0; i < nlabels; ++i)
3567 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3568 rtx_insn *r;
3569 /* If asm goto has any labels in the fallthru basic block, use
3570 a label that we emit immediately after the asm goto. Expansion
3571 may insert further instructions into the same basic block after
3572 asm goto and if we don't do this, insertion of instructions on
3573 the fallthru edge might misbehave. See PR58670. */
3574 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3576 if (fallthru_label == NULL_RTX)
3577 fallthru_label = gen_label_rtx ();
3578 r = fallthru_label;
3580 else
3581 r = label_rtx (label);
3582 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3586 /* Now, for each output, construct an rtx
3587 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3588 ARGVEC CONSTRAINTS OPNAMES))
3589 If there is more than one, put them inside a PARALLEL. */
3591 if (noutputs == 0 && nuses == 0 && nclobbers == 0)
3593 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3594 if (nlabels > 0)
3595 emit_jump_insn (body);
3596 else
3597 emit_insn (body);
3599 else if (noutputs == 1 && nuses == 0 && nclobbers == 0)
3601 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3602 if (nlabels > 0)
3603 emit_jump_insn (gen_rtx_SET (output_rvec[0], body));
3604 else
3605 emit_insn (gen_rtx_SET (output_rvec[0], body));
3607 else
3609 rtx obody = body;
3610 int num = noutputs;
3612 if (num == 0)
3613 num = 1;
3615 body = gen_rtx_PARALLEL (VOIDmode,
3616 rtvec_alloc (num + nuses + nclobbers));
3618 /* For each output operand, store a SET. */
3619 for (i = 0; i < noutputs; ++i)
3621 rtx src, o = output_rvec[i];
3622 if (i == 0)
3624 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3625 src = obody;
3627 else
3629 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3630 ASM_OPERANDS_TEMPLATE (obody),
3631 constraints[i], i, argvec,
3632 constraintvec, labelvec, locus);
3633 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3635 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3638 /* If there are no outputs (but there are some clobbers)
3639 store the bare ASM_OPERANDS into the PARALLEL. */
3640 if (i == 0)
3641 XVECEXP (body, 0, i++) = obody;
3643 /* Add the uses specified by the target hook. No checking should
3644 be needed since this doesn't come directly from user code. */
3645 for (rtx use : use_rvec)
3646 XVECEXP (body, 0, i++) = gen_rtx_USE (VOIDmode, use);
3648 /* Store (clobber REG) for each clobbered register specified. */
3649 for (unsigned j = 0; j < nclobbers; ++j)
3651 rtx clobbered_reg = clobber_rvec[j];
3653 /* Sanity check for overlap between this clobber and the
3654 inputs and outputs that has not been handled yet. Such overlap
3655 should have been detected and reported above. */
3656 if (!clobber_conflict_found && REG_P (clobbered_reg))
3658 /* We test the operand vectors rather than BODY to avoid
3659 tripping over the under-construction body. */
3660 for (unsigned k = 0; k < noutputs; ++k)
3661 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3662 internal_error ("%<asm%> clobber conflict with "
3663 "output operand");
3665 for (unsigned k = 0; k < ninputs - ninout; ++k)
3666 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3667 internal_error ("%<asm%> clobber conflict with "
3668 "input operand");
3671 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3674 if (nlabels > 0)
3675 emit_jump_insn (body);
3676 else
3677 emit_insn (body);
3680 generating_concat_p = old_generating_concat_p;
3682 if (fallthru_label)
3683 emit_label (fallthru_label);
3685 if (after_md_seq)
3686 emit_insn (after_md_seq);
3687 if (after_rtl_seq)
3689 if (nlabels == 0)
3690 emit_insn (after_rtl_seq);
3691 else
3693 edge e;
3694 edge_iterator ei;
3695 unsigned int cnt = EDGE_COUNT (gimple_bb (stmt)->succs);
3697 FOR_EACH_EDGE (e, ei, gimple_bb (stmt)->succs)
3699 rtx_insn *copy;
3700 if (--cnt == 0)
3701 copy = after_rtl_seq;
3702 else
3704 start_sequence ();
3705 duplicate_insn_chain (after_rtl_seq, after_rtl_end,
3706 NULL, NULL);
3707 copy = get_insns ();
3708 end_sequence ();
3710 prepend_insn_to_edge (copy, e);
3715 free_temp_slots ();
3716 crtl->has_asm_statement = 1;
3719 /* Emit code to jump to the address
3720 specified by the pointer expression EXP. */
3722 static void
3723 expand_computed_goto (tree exp)
3725 rtx x = expand_normal (exp);
3727 do_pending_stack_adjust ();
3728 emit_indirect_jump (x);
3731 /* Generate RTL code for a `goto' statement with target label LABEL.
3732 LABEL should be a LABEL_DECL tree node that was or will later be
3733 defined with `expand_label'. */
3735 static void
3736 expand_goto (tree label)
3738 if (flag_checking)
3740 /* Check for a nonlocal goto to a containing function. Should have
3741 gotten translated to __builtin_nonlocal_goto. */
3742 tree context = decl_function_context (label);
3743 gcc_assert (!context || context == current_function_decl);
3746 emit_jump (jump_target_rtx (label));
3749 /* Output a return with no value. */
3751 static void
3752 expand_null_return_1 (void)
3754 clear_pending_stack_adjust ();
3755 do_pending_stack_adjust ();
3756 emit_jump (return_label);
3759 /* Generate RTL to return from the current function, with no value.
3760 (That is, we do not do anything about returning any value.) */
3762 void
3763 expand_null_return (void)
3765 /* If this function was declared to return a value, but we
3766 didn't, clobber the return registers so that they are not
3767 propagated live to the rest of the function. */
3768 clobber_return_register ();
3770 expand_null_return_1 ();
3773 /* Generate RTL to return from the current function, with value VAL. */
3775 static void
3776 expand_value_return (rtx val)
3778 /* Copy the value to the return location unless it's already there. */
3780 tree decl = DECL_RESULT (current_function_decl);
3781 rtx return_reg = DECL_RTL (decl);
3782 if (return_reg != val)
3784 tree funtype = TREE_TYPE (current_function_decl);
3785 tree type = TREE_TYPE (decl);
3786 int unsignedp = TYPE_UNSIGNED (type);
3787 machine_mode old_mode = DECL_MODE (decl);
3788 machine_mode mode;
3789 if (DECL_BY_REFERENCE (decl))
3790 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3791 else
3792 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3794 if (mode != old_mode)
3796 /* Some ABIs require scalar floating point modes to be returned
3797 in a wider scalar integer mode. We need to explicitly
3798 reinterpret to an integer mode of the correct precision
3799 before extending to the desired result. */
3800 if (SCALAR_INT_MODE_P (mode)
3801 && SCALAR_FLOAT_MODE_P (old_mode)
3802 && known_gt (GET_MODE_SIZE (mode), GET_MODE_SIZE (old_mode)))
3803 val = convert_float_to_wider_int (mode, old_mode, val);
3804 else
3805 val = convert_modes (mode, old_mode, val, unsignedp);
3808 if (GET_CODE (return_reg) == PARALLEL)
3809 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3810 else
3811 emit_move_insn (return_reg, val);
3814 expand_null_return_1 ();
3817 /* Generate RTL to evaluate the expression RETVAL and return it
3818 from the current function. */
3820 static void
3821 expand_return (tree retval)
3823 rtx result_rtl;
3824 rtx val = 0;
3825 tree retval_rhs;
3827 /* If function wants no value, give it none. */
3828 if (VOID_TYPE_P (TREE_TYPE (TREE_TYPE (current_function_decl))))
3830 expand_normal (retval);
3831 expand_null_return ();
3832 return;
3835 if (retval == error_mark_node)
3837 /* Treat this like a return of no value from a function that
3838 returns a value. */
3839 expand_null_return ();
3840 return;
3842 else if ((TREE_CODE (retval) == MODIFY_EXPR
3843 || TREE_CODE (retval) == INIT_EXPR)
3844 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3845 retval_rhs = TREE_OPERAND (retval, 1);
3846 else
3847 retval_rhs = retval;
3849 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3851 /* If we are returning the RESULT_DECL, then the value has already
3852 been stored into it, so we don't have to do anything special. */
3853 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3854 expand_value_return (result_rtl);
3856 /* If the result is an aggregate that is being returned in one (or more)
3857 registers, load the registers here. */
3859 else if (retval_rhs != 0
3860 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3861 && REG_P (result_rtl))
3863 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3864 if (val)
3866 /* Use the mode of the result value on the return register. */
3867 PUT_MODE (result_rtl, GET_MODE (val));
3868 expand_value_return (val);
3870 else
3871 expand_null_return ();
3873 else if (retval_rhs != 0
3874 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3875 && (REG_P (result_rtl)
3876 || (GET_CODE (result_rtl) == PARALLEL)))
3878 /* Compute the return value into a temporary (usually a pseudo reg). */
3880 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3881 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3882 val = force_not_mem (val);
3883 expand_value_return (val);
3885 else
3887 /* No hard reg used; calculate value into hard return reg. */
3888 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3889 expand_value_return (result_rtl);
3893 /* Expand a clobber of LHS. If LHS is stored it in a multi-part
3894 register, tell the rtl optimizers that its value is no longer
3895 needed. */
3897 static void
3898 expand_clobber (tree lhs)
3900 if (DECL_P (lhs))
3902 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3903 if (decl_rtl && REG_P (decl_rtl))
3905 machine_mode decl_mode = GET_MODE (decl_rtl);
3906 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3907 REGMODE_NATURAL_SIZE (decl_mode)))
3908 emit_clobber (decl_rtl);
3913 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3914 STMT that doesn't require special handling for outgoing edges, i.e. no
3915 tailcalls and no GIMPLE_COND. A code without a case below is unreachable. */
3917 static void
3918 expand_gimple_stmt_1 (gimple *stmt)
3920 tree op0;
3922 set_curr_insn_location (gimple_location (stmt));
3924 switch (gimple_code (stmt))
3926 case GIMPLE_GOTO:
3927 op0 = gimple_goto_dest (stmt);
3928 if (TREE_CODE (op0) == LABEL_DECL)
3929 expand_goto (op0);
3930 else
3931 expand_computed_goto (op0);
3932 break;
3933 case GIMPLE_LABEL:
3934 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3935 break;
3936 case GIMPLE_NOP:
3937 case GIMPLE_PREDICT:
3938 break;
3939 case GIMPLE_SWITCH:
3941 gswitch *swtch = as_a <gswitch *> (stmt);
3942 if (gimple_switch_num_labels (swtch) == 1)
3943 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3944 else
3945 expand_case (swtch);
3947 break;
3948 case GIMPLE_ASM:
3949 expand_asm_stmt (as_a <gasm *> (stmt));
3950 break;
3951 case GIMPLE_CALL:
3952 expand_call_stmt (as_a <gcall *> (stmt));
3953 break;
3955 case GIMPLE_RETURN:
3957 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3959 /* If a return doesn't have a location, it very likely represents
3960 multiple user returns so we cannot let it inherit the location
3961 of the last statement of the previous basic block in RTL. */
3962 if (!gimple_has_location (stmt))
3963 set_curr_insn_location (cfun->function_end_locus);
3965 if (op0 && op0 != error_mark_node)
3967 tree result = DECL_RESULT (current_function_decl);
3969 /* If we are not returning the current function's RESULT_DECL,
3970 build an assignment to it. */
3971 if (op0 != result)
3973 /* I believe that a function's RESULT_DECL is unique. */
3974 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3976 /* ??? We'd like to use simply expand_assignment here,
3977 but this fails if the value is of BLKmode but the return
3978 decl is a register. expand_return has special handling
3979 for this combination, which eventually should move
3980 to common code. See comments there. Until then, let's
3981 build a modify expression :-/ */
3982 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3983 result, op0);
3987 if (!op0)
3988 expand_null_return ();
3989 else
3990 expand_return (op0);
3992 break;
3994 case GIMPLE_ASSIGN:
3996 gassign *assign_stmt = as_a <gassign *> (stmt);
3997 tree lhs = gimple_assign_lhs (assign_stmt);
3999 /* Tree expand used to fiddle with |= and &= of two bitfield
4000 COMPONENT_REFs here. This can't happen with gimple, the LHS
4001 of binary assigns must be a gimple reg. */
4003 if (TREE_CODE (lhs) != SSA_NAME
4004 || gimple_assign_rhs_class (assign_stmt) == GIMPLE_SINGLE_RHS)
4006 tree rhs = gimple_assign_rhs1 (assign_stmt);
4007 gcc_assert (gimple_assign_rhs_class (assign_stmt)
4008 == GIMPLE_SINGLE_RHS);
4009 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
4010 /* Do not put locations on possibly shared trees. */
4011 && !is_gimple_min_invariant (rhs))
4012 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
4013 if (TREE_CLOBBER_P (rhs))
4014 /* This is a clobber that marks this LHS as going
4015 out of scope. */
4016 expand_clobber (lhs);
4017 else
4018 expand_assignment (lhs, rhs,
4019 gimple_assign_nontemporal_move_p (
4020 assign_stmt));
4022 else
4024 rtx target, temp;
4025 gcc_assert (!gimple_assign_nontemporal_move_p (assign_stmt));
4026 bool promoted = false;
4028 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
4029 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
4030 promoted = true;
4032 /* If we store into a promoted register, don't directly
4033 expand to target. */
4034 temp = promoted ? NULL_RTX : target;
4035 temp = expand_expr_real_gassign (assign_stmt, temp,
4036 GET_MODE (target), EXPAND_NORMAL);
4038 if (temp == target)
4040 else if (promoted)
4042 int unsignedp = SUBREG_PROMOTED_SIGN (target);
4043 /* If TEMP is a VOIDmode constant, use convert_modes to make
4044 sure that we properly convert it. */
4045 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
4047 temp = convert_modes (GET_MODE (target),
4048 TYPE_MODE (TREE_TYPE (lhs)),
4049 temp, unsignedp);
4050 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
4051 GET_MODE (target), temp, unsignedp);
4054 convert_move (SUBREG_REG (target), temp, unsignedp);
4056 else
4058 temp = force_operand (temp, target);
4059 if (temp != target)
4060 emit_move_insn (target, temp);
4064 break;
4066 default:
4067 gcc_unreachable ();
4071 /* Expand one gimple statement STMT and return the last RTL instruction
4072 before any of the newly generated ones.
4074 In addition to generating the necessary RTL instructions this also
4075 sets REG_EH_REGION notes if necessary and sets the current source
4076 location for diagnostics. */
4078 static rtx_insn *
4079 expand_gimple_stmt (gimple *stmt)
4081 location_t saved_location = input_location;
4082 rtx_insn *last = get_last_insn ();
4083 int lp_nr;
4085 gcc_assert (cfun);
4087 /* We need to save and restore the current source location so that errors
4088 discovered during expansion are emitted with the right location. But
4089 it would be better if the diagnostic routines used the source location
4090 embedded in the tree nodes rather than globals. */
4091 if (gimple_has_location (stmt))
4092 input_location = gimple_location (stmt);
4094 expand_gimple_stmt_1 (stmt);
4096 /* Free any temporaries used to evaluate this statement. */
4097 free_temp_slots ();
4099 input_location = saved_location;
4101 /* Mark all insns that may trap. */
4102 lp_nr = lookup_stmt_eh_lp (stmt);
4103 if (lp_nr)
4105 rtx_insn *insn;
4106 for (insn = next_real_insn (last); insn;
4107 insn = next_real_insn (insn))
4109 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
4110 /* If we want exceptions for non-call insns, any
4111 may_trap_p instruction may throw. */
4112 && GET_CODE (PATTERN (insn)) != CLOBBER
4113 && GET_CODE (PATTERN (insn)) != USE
4114 && insn_could_throw_p (insn))
4115 make_reg_eh_region_note (insn, 0, lp_nr);
4119 return last;
4122 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
4123 that has CALL_EXPR_TAILCALL set. Returns NULL if no sibling call was
4124 emitted (the ABI rules governing the call may deny it; see calls.cc).
4125 Otherwise returns BB, or a new block holding the insns after the sibcall.
4127 Sets CAN_FALLTHRU if we did not generate a tail call, or generated a
4128 *conditional* one and can still reach the rest of BB. The case here is
4129 __builtin_sqrt, where the NaN result goes through the external function
4130 (with a tailcall) and the normal result happens via a sqrt instruction. */
4132 static basic_block
4133 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
4135 rtx_insn *last2, *last;
4136 edge e;
4137 edge_iterator ei;
4138 profile_probability probability;
4140 last2 = last = expand_gimple_stmt (stmt);
4142 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
4143 if (CALL_P (last) && SIBLING_CALL_P (last))
4144 goto found;
4146 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4148 *can_fallthru = true;
4149 return NULL;
4151 found:
4152 /* ??? Wouldn't it be better to just reset any pending stack adjust?
4153 Any instructions emitted here are about to be deleted. */
4154 do_pending_stack_adjust ();
4156 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
4157 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
4158 EH or abnormal edges, we shouldn't have created a tail call in
4159 the first place. So it seems to me we should just be removing
4160 all edges here, or redirecting the existing fallthru edge to
4161 the exit block. */
4163 probability = profile_probability::never ();
4165 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
4167 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
4169 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
4170 e->dest->count -= e->count ();
4171 probability += e->probability;
4172 remove_edge (e);
4174 else
4175 ei_next (&ei);
4178 /* This is somewhat ugly: the call_expr expander often emits instructions
4179 after the sibcall (to perform the function return). These confuse the
4180 find_many_sub_basic_blocks code, so we need to get rid of these. */
4181 last = NEXT_INSN (last);
4182 gcc_assert (BARRIER_P (last));
4184 *can_fallthru = false;
4185 while (NEXT_INSN (last))
4187 /* For instance, the sqrt builtin expander expands an `if' with the
4188 sibcall in the `then' arm and a label for the `else' arm. */
4189 if (LABEL_P (NEXT_INSN (last)))
4191 *can_fallthru = true;
4192 break;
4194 delete_insn (NEXT_INSN (last));
4197 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
4198 | EDGE_SIBCALL);
4199 e->probability = probability;
4200 BB_END (bb) = last;
4201 update_bb_for_insn (bb);
4203 if (NEXT_INSN (last))
4205 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
4207 last = BB_END (bb);
4208 if (BARRIER_P (last))
4209 BB_END (bb) = PREV_INSN (last);
4212 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4214 return bb;
4217 /* Return the difference between the floor and the truncated result of
4218 a signed division by OP1 with remainder MOD. */
4219 static rtx
4220 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4222 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
4223 return gen_rtx_IF_THEN_ELSE
4224 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4225 gen_rtx_IF_THEN_ELSE
4226 (mode, gen_rtx_LT (BImode,
4227 gen_rtx_DIV (mode, op1, mod),
4228 const0_rtx),
4229 constm1_rtx, const0_rtx),
4230 const0_rtx);
4233 /* Return the difference between the ceil and the truncated result of
4234 a signed division by OP1 with remainder MOD. */
4235 static rtx
4236 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4238 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
4239 return gen_rtx_IF_THEN_ELSE
4240 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4241 gen_rtx_IF_THEN_ELSE
4242 (mode, gen_rtx_GT (BImode,
4243 gen_rtx_DIV (mode, op1, mod),
4244 const0_rtx),
4245 const1_rtx, const0_rtx),
4246 const0_rtx);
4249 /* Return the difference between the ceil and the truncated result of
4250 an unsigned division by OP1 with remainder MOD. */
4251 static rtx
4252 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
4254 /* (mod != 0 ? 1 : 0) */
4255 return gen_rtx_IF_THEN_ELSE
4256 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4257 const1_rtx, const0_rtx);
4260 /* Return the difference between the rounded and the truncated result
4261 of a signed division by OP1 with remainder MOD. Halfway cases are
4262 rounded away from zero, rather than to the nearest even number. */
4263 static rtx
4264 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4266 /* (abs (mod) >= abs (op1) - abs (mod)
4267 ? (op1 / mod > 0 ? 1 : -1)
4268 : 0) */
4269 return gen_rtx_IF_THEN_ELSE
4270 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
4271 gen_rtx_MINUS (mode,
4272 gen_rtx_ABS (mode, op1),
4273 gen_rtx_ABS (mode, mod))),
4274 gen_rtx_IF_THEN_ELSE
4275 (mode, gen_rtx_GT (BImode,
4276 gen_rtx_DIV (mode, op1, mod),
4277 const0_rtx),
4278 const1_rtx, constm1_rtx),
4279 const0_rtx);
4282 /* Return the difference between the rounded and the truncated result
4283 of a unsigned division by OP1 with remainder MOD. Halfway cases
4284 are rounded away from zero, rather than to the nearest even
4285 number. */
4286 static rtx
4287 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4289 /* (mod >= op1 - mod ? 1 : 0) */
4290 return gen_rtx_IF_THEN_ELSE
4291 (mode, gen_rtx_GE (BImode, mod,
4292 gen_rtx_MINUS (mode, op1, mod)),
4293 const1_rtx, const0_rtx);
4296 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4297 any rtl. */
4299 static rtx
4300 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4301 addr_space_t as)
4303 #ifndef POINTERS_EXTEND_UNSIGNED
4304 gcc_assert (mode == Pmode
4305 || mode == targetm.addr_space.address_mode (as));
4306 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4307 #else
4308 rtx temp;
4310 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
4312 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4313 return x;
4315 /* X must have some form of address mode already. */
4316 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
4317 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4318 x = lowpart_subreg (mode, x, xmode);
4319 else if (POINTERS_EXTEND_UNSIGNED > 0)
4320 x = gen_rtx_ZERO_EXTEND (mode, x);
4321 else if (!POINTERS_EXTEND_UNSIGNED)
4322 x = gen_rtx_SIGN_EXTEND (mode, x);
4323 else
4325 switch (GET_CODE (x))
4327 case SUBREG:
4328 if ((SUBREG_PROMOTED_VAR_P (x)
4329 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4330 || (GET_CODE (SUBREG_REG (x)) == PLUS
4331 && REG_P (XEXP (SUBREG_REG (x), 0))
4332 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4333 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4334 && GET_MODE (SUBREG_REG (x)) == mode)
4335 return SUBREG_REG (x);
4336 break;
4337 case LABEL_REF:
4338 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4339 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4340 return temp;
4341 case SYMBOL_REF:
4342 temp = shallow_copy_rtx (x);
4343 PUT_MODE (temp, mode);
4344 return temp;
4345 case CONST:
4346 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4347 if (temp)
4348 temp = gen_rtx_CONST (mode, temp);
4349 return temp;
4350 case PLUS:
4351 case MINUS:
4352 if (CONST_INT_P (XEXP (x, 1)))
4354 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4355 if (temp)
4356 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4358 break;
4359 default:
4360 break;
4362 /* Don't know how to express ptr_extend as operation in debug info. */
4363 return NULL;
4365 #endif /* POINTERS_EXTEND_UNSIGNED */
4367 return x;
4370 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4371 by avoid_deep_ter_for_debug. */
4373 static hash_map<tree, tree> *deep_ter_debug_map;
4375 /* Split too deep TER chains for debug stmts using debug temporaries. */
4377 static void
4378 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4380 use_operand_p use_p;
4381 ssa_op_iter iter;
4382 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4384 tree use = USE_FROM_PTR (use_p);
4385 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4386 continue;
4387 gimple *g = get_gimple_for_ssa_name (use);
4388 if (g == NULL)
4389 continue;
4390 if (depth > 6 && !stmt_ends_bb_p (g))
4392 if (deep_ter_debug_map == NULL)
4393 deep_ter_debug_map = new hash_map<tree, tree>;
4395 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4396 if (vexpr != NULL)
4397 continue;
4398 vexpr = build_debug_expr_decl (TREE_TYPE (use));
4399 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4400 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4401 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4402 avoid_deep_ter_for_debug (def_temp, 0);
4404 else
4405 avoid_deep_ter_for_debug (g, depth + 1);
4409 /* Return an RTX equivalent to the value of the parameter DECL. */
4411 static rtx
4412 expand_debug_parm_decl (tree decl)
4414 rtx incoming = DECL_INCOMING_RTL (decl);
4416 if (incoming
4417 && GET_MODE (incoming) != BLKmode
4418 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4419 || (MEM_P (incoming)
4420 && REG_P (XEXP (incoming, 0))
4421 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4423 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4425 #ifdef HAVE_window_save
4426 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4427 If the target machine has an explicit window save instruction, the
4428 actual entry value is the corresponding OUTGOING_REGNO instead. */
4429 if (REG_P (incoming)
4430 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4431 incoming
4432 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4433 OUTGOING_REGNO (REGNO (incoming)), 0);
4434 else if (MEM_P (incoming))
4436 rtx reg = XEXP (incoming, 0);
4437 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4439 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4440 incoming = replace_equiv_address_nv (incoming, reg);
4442 else
4443 incoming = copy_rtx (incoming);
4445 #endif
4447 ENTRY_VALUE_EXP (rtl) = incoming;
4448 return rtl;
4451 if (incoming
4452 && GET_MODE (incoming) != BLKmode
4453 && !TREE_ADDRESSABLE (decl)
4454 && MEM_P (incoming)
4455 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4456 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4457 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4458 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4459 return copy_rtx (incoming);
4461 return NULL_RTX;
4464 /* Return an RTX equivalent to the value of the tree expression EXP. */
4466 static rtx
4467 expand_debug_expr (tree exp)
4469 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4470 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4471 machine_mode inner_mode = VOIDmode;
4472 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4473 addr_space_t as;
4474 scalar_int_mode op0_mode, op1_mode, addr_mode;
4476 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4478 case tcc_expression:
4479 switch (TREE_CODE (exp))
4481 case COND_EXPR:
4482 case DOT_PROD_EXPR:
4483 case SAD_EXPR:
4484 case WIDEN_MULT_PLUS_EXPR:
4485 case WIDEN_MULT_MINUS_EXPR:
4486 goto ternary;
4488 case TRUTH_ANDIF_EXPR:
4489 case TRUTH_ORIF_EXPR:
4490 case TRUTH_AND_EXPR:
4491 case TRUTH_OR_EXPR:
4492 case TRUTH_XOR_EXPR:
4493 goto binary;
4495 case TRUTH_NOT_EXPR:
4496 goto unary;
4498 default:
4499 break;
4501 break;
4503 ternary:
4504 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4505 if (!op2)
4506 return NULL_RTX;
4507 /* Fall through. */
4509 binary:
4510 case tcc_binary:
4511 if (mode == BLKmode)
4512 return NULL_RTX;
4513 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4514 if (!op1)
4515 return NULL_RTX;
4516 switch (TREE_CODE (exp))
4518 case LSHIFT_EXPR:
4519 case RSHIFT_EXPR:
4520 case LROTATE_EXPR:
4521 case RROTATE_EXPR:
4522 case WIDEN_LSHIFT_EXPR:
4523 /* Ensure second operand isn't wider than the first one. */
4524 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4525 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4526 && (GET_MODE_UNIT_PRECISION (mode)
4527 < GET_MODE_PRECISION (op1_mode)))
4528 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4529 break;
4530 default:
4531 break;
4533 /* Fall through. */
4535 unary:
4536 case tcc_unary:
4537 if (mode == BLKmode)
4538 return NULL_RTX;
4539 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4540 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4541 if (!op0)
4542 return NULL_RTX;
4543 break;
4545 case tcc_comparison:
4546 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4547 goto binary;
4549 case tcc_type:
4550 case tcc_statement:
4551 gcc_unreachable ();
4553 case tcc_constant:
4554 case tcc_exceptional:
4555 case tcc_declaration:
4556 case tcc_reference:
4557 case tcc_vl_exp:
4558 break;
4561 switch (TREE_CODE (exp))
4563 case STRING_CST:
4564 if (!lookup_constant_def (exp))
4566 if (strlen (TREE_STRING_POINTER (exp)) + 1
4567 != (size_t) TREE_STRING_LENGTH (exp))
4568 return NULL_RTX;
4569 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4570 op0 = gen_rtx_MEM (BLKmode, op0);
4571 set_mem_attributes (op0, exp, 0);
4572 return op0;
4574 /* Fall through. */
4576 case INTEGER_CST:
4577 if (TREE_CODE (TREE_TYPE (exp)) == BITINT_TYPE
4578 && TYPE_MODE (TREE_TYPE (exp)) == BLKmode)
4579 return NULL;
4580 /* FALLTHRU */
4581 case REAL_CST:
4582 case FIXED_CST:
4583 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4584 return op0;
4586 case POLY_INT_CST:
4587 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4589 case COMPLEX_CST:
4590 gcc_assert (COMPLEX_MODE_P (mode));
4591 op0 = expand_debug_expr (TREE_REALPART (exp));
4592 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4593 return gen_rtx_CONCAT (mode, op0, op1);
4595 case DEBUG_EXPR_DECL:
4596 op0 = DECL_RTL_IF_SET (exp);
4598 if (op0)
4600 if (GET_MODE (op0) != mode)
4601 gcc_assert (VECTOR_TYPE_P (TREE_TYPE (exp)));
4602 else
4603 return op0;
4606 op0 = gen_rtx_DEBUG_EXPR (mode);
4607 DEBUG_EXPR_TREE_DECL (op0) = exp;
4608 SET_DECL_RTL (exp, op0);
4610 return op0;
4612 case VAR_DECL:
4613 case PARM_DECL:
4614 case FUNCTION_DECL:
4615 case LABEL_DECL:
4616 case CONST_DECL:
4617 case RESULT_DECL:
4618 op0 = DECL_RTL_IF_SET (exp);
4620 /* This decl was probably optimized away. */
4621 if (!op0
4622 /* At least label RTXen are sometimes replaced by
4623 NOTE_INSN_DELETED_LABEL. Any notes here are not
4624 handled by copy_rtx. */
4625 || NOTE_P (op0))
4627 if (!VAR_P (exp)
4628 || DECL_EXTERNAL (exp)
4629 || !TREE_STATIC (exp)
4630 || !DECL_NAME (exp)
4631 || DECL_HARD_REGISTER (exp)
4632 || DECL_IN_CONSTANT_POOL (exp)
4633 || mode == VOIDmode
4634 || symtab_node::get (exp) == NULL)
4635 return NULL;
4637 op0 = make_decl_rtl_for_debug (exp);
4638 if (!MEM_P (op0)
4639 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4640 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4641 return NULL;
4643 else if (VAR_P (exp)
4644 && is_global_var (exp)
4645 && symtab_node::get (exp) == NULL)
4646 return NULL;
4647 else
4648 op0 = copy_rtx (op0);
4650 if (GET_MODE (op0) == BLKmode
4651 /* If op0 is not BLKmode, but mode is, adjust_mode
4652 below would ICE. While it is likely a FE bug,
4653 try to be robust here. See PR43166. */
4654 || mode == BLKmode
4655 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4657 gcc_assert (MEM_P (op0));
4658 op0 = adjust_address_nv (op0, mode, 0);
4659 return op0;
4662 /* Fall through. */
4664 adjust_mode:
4665 case PAREN_EXPR:
4666 CASE_CONVERT:
4668 inner_mode = GET_MODE (op0);
4670 if (mode == inner_mode)
4671 return op0;
4673 if (inner_mode == VOIDmode)
4675 if (TREE_CODE (exp) == SSA_NAME)
4676 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4677 else
4678 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4679 if (mode == inner_mode)
4680 return op0;
4683 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4685 if (GET_MODE_UNIT_BITSIZE (mode)
4686 == GET_MODE_UNIT_BITSIZE (inner_mode))
4687 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4688 else if (GET_MODE_UNIT_BITSIZE (mode)
4689 < GET_MODE_UNIT_BITSIZE (inner_mode))
4690 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4691 else
4692 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4694 else if (FLOAT_MODE_P (mode))
4696 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4697 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4698 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4699 else
4700 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4702 else if (FLOAT_MODE_P (inner_mode))
4704 if (unsignedp)
4705 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4706 else
4707 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4709 else if (GET_MODE_UNIT_PRECISION (mode)
4710 == GET_MODE_UNIT_PRECISION (inner_mode))
4711 op0 = lowpart_subreg (mode, op0, inner_mode);
4712 else if (GET_MODE_UNIT_PRECISION (mode)
4713 < GET_MODE_UNIT_PRECISION (inner_mode))
4714 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4715 else if (UNARY_CLASS_P (exp)
4716 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4717 : unsignedp)
4718 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4719 else
4720 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4722 return op0;
4725 case MEM_REF:
4726 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4728 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4729 TREE_OPERAND (exp, 0),
4730 TREE_OPERAND (exp, 1));
4731 if (newexp)
4732 return expand_debug_expr (newexp);
4734 /* FALLTHROUGH */
4735 case INDIRECT_REF:
4736 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4737 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4738 if (!op0)
4739 return NULL;
4741 if (TREE_CODE (exp) == MEM_REF)
4743 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4744 || (GET_CODE (op0) == PLUS
4745 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4746 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4747 Instead just use get_inner_reference. */
4748 goto component_ref;
4750 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4751 poly_int64 offset;
4752 if (!op1 || !poly_int_rtx_p (op1, &offset))
4753 return NULL;
4755 op0 = plus_constant (inner_mode, op0, offset);
4758 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4760 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4761 op0, as);
4762 if (op0 == NULL_RTX)
4763 return NULL;
4765 op0 = gen_rtx_MEM (mode, op0);
4766 set_mem_attributes (op0, exp, 0);
4767 if (TREE_CODE (exp) == MEM_REF
4768 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4769 set_mem_expr (op0, NULL_TREE);
4770 set_mem_addr_space (op0, as);
4772 return op0;
4774 case TARGET_MEM_REF:
4775 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4776 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4777 return NULL;
4779 op0 = expand_debug_expr
4780 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4781 if (!op0)
4782 return NULL;
4784 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4785 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4786 op0, as);
4787 if (op0 == NULL_RTX)
4788 return NULL;
4790 op0 = gen_rtx_MEM (mode, op0);
4792 set_mem_attributes (op0, exp, 0);
4793 set_mem_addr_space (op0, as);
4795 return op0;
4797 component_ref:
4798 case ARRAY_REF:
4799 case ARRAY_RANGE_REF:
4800 case COMPONENT_REF:
4801 case BIT_FIELD_REF:
4802 case REALPART_EXPR:
4803 case IMAGPART_EXPR:
4804 case VIEW_CONVERT_EXPR:
4806 machine_mode mode1;
4807 poly_int64 bitsize, bitpos;
4808 tree offset;
4809 int reversep, volatilep = 0;
4810 tree tem
4811 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4812 &unsignedp, &reversep, &volatilep);
4813 rtx orig_op0;
4815 if (known_eq (bitsize, 0))
4816 return NULL;
4818 orig_op0 = op0 = expand_debug_expr (tem);
4820 if (!op0)
4821 return NULL;
4823 if (offset)
4825 machine_mode addrmode, offmode;
4827 if (!MEM_P (op0))
4828 return NULL;
4830 op0 = XEXP (op0, 0);
4831 addrmode = GET_MODE (op0);
4832 if (addrmode == VOIDmode)
4833 addrmode = Pmode;
4835 op1 = expand_debug_expr (offset);
4836 if (!op1)
4837 return NULL;
4839 offmode = GET_MODE (op1);
4840 if (offmode == VOIDmode)
4841 offmode = TYPE_MODE (TREE_TYPE (offset));
4843 if (addrmode != offmode)
4844 op1 = lowpart_subreg (addrmode, op1, offmode);
4846 /* Don't use offset_address here, we don't need a
4847 recognizable address, and we don't want to generate
4848 code. */
4849 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4850 op0, op1));
4853 if (MEM_P (op0))
4855 if (mode1 == VOIDmode)
4857 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4858 return NULL;
4859 /* Bitfield. */
4860 mode1 = smallest_int_mode_for_size (bitsize);
4862 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4863 if (maybe_ne (bytepos, 0))
4865 op0 = adjust_address_nv (op0, mode1, bytepos);
4866 bitpos = num_trailing_bits (bitpos);
4868 else if (known_eq (bitpos, 0)
4869 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4870 op0 = adjust_address_nv (op0, mode, 0);
4871 else if (GET_MODE (op0) != mode1)
4872 op0 = adjust_address_nv (op0, mode1, 0);
4873 else
4874 op0 = copy_rtx (op0);
4875 if (op0 == orig_op0)
4876 op0 = shallow_copy_rtx (op0);
4877 if (TREE_CODE (tem) != SSA_NAME)
4878 set_mem_attributes (op0, exp, 0);
4881 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4882 return op0;
4884 if (maybe_lt (bitpos, 0))
4885 return NULL;
4887 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4888 return NULL;
4890 poly_int64 bytepos;
4891 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4892 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4894 machine_mode opmode = GET_MODE (op0);
4896 if (opmode == VOIDmode)
4897 opmode = TYPE_MODE (TREE_TYPE (tem));
4899 /* This condition may hold if we're expanding the address
4900 right past the end of an array that turned out not to
4901 be addressable (i.e., the address was only computed in
4902 debug stmts). The gen_subreg below would rightfully
4903 crash, and the address doesn't really exist, so just
4904 drop it. */
4905 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4906 return NULL;
4908 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4909 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4912 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4913 && TYPE_UNSIGNED (TREE_TYPE (exp))
4914 ? SIGN_EXTRACT
4915 : ZERO_EXTRACT, mode,
4916 GET_MODE (op0) != VOIDmode
4917 ? GET_MODE (op0)
4918 : TYPE_MODE (TREE_TYPE (tem)),
4919 op0, gen_int_mode (bitsize, word_mode),
4920 gen_int_mode (bitpos, word_mode));
4923 case ABS_EXPR:
4924 case ABSU_EXPR:
4925 return simplify_gen_unary (ABS, mode, op0, mode);
4927 case NEGATE_EXPR:
4928 return simplify_gen_unary (NEG, mode, op0, mode);
4930 case BIT_NOT_EXPR:
4931 return simplify_gen_unary (NOT, mode, op0, mode);
4933 case FLOAT_EXPR:
4934 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4935 0)))
4936 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4937 inner_mode);
4939 case FIX_TRUNC_EXPR:
4940 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4941 inner_mode);
4943 case POINTER_PLUS_EXPR:
4944 /* For the rare target where pointers are not the same size as
4945 size_t, we need to check for mis-matched modes and correct
4946 the addend. */
4947 if (op0 && op1
4948 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4949 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4950 && op0_mode != op1_mode)
4952 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4953 /* If OP0 is a partial mode, then we must truncate, even
4954 if it has the same bitsize as OP1 as GCC's
4955 representation of partial modes is opaque. */
4956 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4957 && (GET_MODE_BITSIZE (op0_mode)
4958 == GET_MODE_BITSIZE (op1_mode))))
4959 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4960 else
4961 /* We always sign-extend, regardless of the signedness of
4962 the operand, because the operand is always unsigned
4963 here even if the original C expression is signed. */
4964 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4966 /* Fall through. */
4967 case PLUS_EXPR:
4968 return simplify_gen_binary (PLUS, mode, op0, op1);
4970 case MINUS_EXPR:
4971 case POINTER_DIFF_EXPR:
4972 return simplify_gen_binary (MINUS, mode, op0, op1);
4974 case MULT_EXPR:
4975 return simplify_gen_binary (MULT, mode, op0, op1);
4977 case RDIV_EXPR:
4978 case TRUNC_DIV_EXPR:
4979 case EXACT_DIV_EXPR:
4980 if (unsignedp)
4981 return simplify_gen_binary (UDIV, mode, op0, op1);
4982 else
4983 return simplify_gen_binary (DIV, mode, op0, op1);
4985 case TRUNC_MOD_EXPR:
4986 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4988 case FLOOR_DIV_EXPR:
4989 if (unsignedp)
4990 return simplify_gen_binary (UDIV, mode, op0, op1);
4991 else
4993 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4994 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4995 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4996 return simplify_gen_binary (PLUS, mode, div, adj);
4999 case FLOOR_MOD_EXPR:
5000 if (unsignedp)
5001 return simplify_gen_binary (UMOD, mode, op0, op1);
5002 else
5004 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5005 rtx adj = floor_sdiv_adjust (mode, mod, op1);
5006 adj = simplify_gen_unary (NEG, mode,
5007 simplify_gen_binary (MULT, mode, adj, op1),
5008 mode);
5009 return simplify_gen_binary (PLUS, mode, mod, adj);
5012 case CEIL_DIV_EXPR:
5013 if (unsignedp)
5015 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
5016 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5017 rtx adj = ceil_udiv_adjust (mode, mod, op1);
5018 return simplify_gen_binary (PLUS, mode, div, adj);
5020 else
5022 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
5023 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5024 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
5025 return simplify_gen_binary (PLUS, mode, div, adj);
5028 case CEIL_MOD_EXPR:
5029 if (unsignedp)
5031 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5032 rtx adj = ceil_udiv_adjust (mode, mod, op1);
5033 adj = simplify_gen_unary (NEG, mode,
5034 simplify_gen_binary (MULT, mode, adj, op1),
5035 mode);
5036 return simplify_gen_binary (PLUS, mode, mod, adj);
5038 else
5040 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5041 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
5042 adj = simplify_gen_unary (NEG, mode,
5043 simplify_gen_binary (MULT, mode, adj, op1),
5044 mode);
5045 return simplify_gen_binary (PLUS, mode, mod, adj);
5048 case ROUND_DIV_EXPR:
5049 if (unsignedp)
5051 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
5052 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5053 rtx adj = round_udiv_adjust (mode, mod, op1);
5054 return simplify_gen_binary (PLUS, mode, div, adj);
5056 else
5058 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
5059 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5060 rtx adj = round_sdiv_adjust (mode, mod, op1);
5061 return simplify_gen_binary (PLUS, mode, div, adj);
5064 case ROUND_MOD_EXPR:
5065 if (unsignedp)
5067 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5068 rtx adj = round_udiv_adjust (mode, mod, op1);
5069 adj = simplify_gen_unary (NEG, mode,
5070 simplify_gen_binary (MULT, mode, adj, op1),
5071 mode);
5072 return simplify_gen_binary (PLUS, mode, mod, adj);
5074 else
5076 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5077 rtx adj = round_sdiv_adjust (mode, mod, op1);
5078 adj = simplify_gen_unary (NEG, mode,
5079 simplify_gen_binary (MULT, mode, adj, op1),
5080 mode);
5081 return simplify_gen_binary (PLUS, mode, mod, adj);
5084 case LSHIFT_EXPR:
5085 return simplify_gen_binary (ASHIFT, mode, op0, op1);
5087 case RSHIFT_EXPR:
5088 if (unsignedp)
5089 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
5090 else
5091 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
5093 case LROTATE_EXPR:
5094 return simplify_gen_binary (ROTATE, mode, op0, op1);
5096 case RROTATE_EXPR:
5097 return simplify_gen_binary (ROTATERT, mode, op0, op1);
5099 case MIN_EXPR:
5100 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
5102 case MAX_EXPR:
5103 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
5105 case BIT_AND_EXPR:
5106 case TRUTH_AND_EXPR:
5107 return simplify_gen_binary (AND, mode, op0, op1);
5109 case BIT_IOR_EXPR:
5110 case TRUTH_OR_EXPR:
5111 return simplify_gen_binary (IOR, mode, op0, op1);
5113 case BIT_XOR_EXPR:
5114 case TRUTH_XOR_EXPR:
5115 return simplify_gen_binary (XOR, mode, op0, op1);
5117 case TRUTH_ANDIF_EXPR:
5118 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
5120 case TRUTH_ORIF_EXPR:
5121 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
5123 case TRUTH_NOT_EXPR:
5124 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
5126 case LT_EXPR:
5127 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
5128 op0, op1);
5130 case LE_EXPR:
5131 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
5132 op0, op1);
5134 case GT_EXPR:
5135 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
5136 op0, op1);
5138 case GE_EXPR:
5139 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
5140 op0, op1);
5142 case EQ_EXPR:
5143 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
5145 case NE_EXPR:
5146 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
5148 case UNORDERED_EXPR:
5149 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
5151 case ORDERED_EXPR:
5152 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
5154 case UNLT_EXPR:
5155 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
5157 case UNLE_EXPR:
5158 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
5160 case UNGT_EXPR:
5161 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
5163 case UNGE_EXPR:
5164 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
5166 case UNEQ_EXPR:
5167 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
5169 case LTGT_EXPR:
5170 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
5172 case COND_EXPR:
5173 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
5175 case COMPLEX_EXPR:
5176 gcc_assert (COMPLEX_MODE_P (mode));
5177 if (GET_MODE (op0) == VOIDmode)
5178 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
5179 if (GET_MODE (op1) == VOIDmode)
5180 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
5181 return gen_rtx_CONCAT (mode, op0, op1);
5183 case CONJ_EXPR:
5184 if (GET_CODE (op0) == CONCAT)
5185 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
5186 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
5187 XEXP (op0, 1),
5188 GET_MODE_INNER (mode)));
5189 else
5191 scalar_mode imode = GET_MODE_INNER (mode);
5192 rtx re, im;
5194 if (MEM_P (op0))
5196 re = adjust_address_nv (op0, imode, 0);
5197 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
5199 else
5201 scalar_int_mode ifmode;
5202 scalar_int_mode ihmode;
5203 rtx halfsize;
5204 if (!int_mode_for_mode (mode).exists (&ifmode)
5205 || !int_mode_for_mode (imode).exists (&ihmode))
5206 return NULL;
5207 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
5208 re = op0;
5209 if (mode != ifmode)
5210 re = gen_rtx_SUBREG (ifmode, re, 0);
5211 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
5212 if (imode != ihmode)
5213 re = gen_rtx_SUBREG (imode, re, 0);
5214 im = copy_rtx (op0);
5215 if (mode != ifmode)
5216 im = gen_rtx_SUBREG (ifmode, im, 0);
5217 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
5218 if (imode != ihmode)
5219 im = gen_rtx_SUBREG (imode, im, 0);
5221 im = gen_rtx_NEG (imode, im);
5222 return gen_rtx_CONCAT (mode, re, im);
5225 case ADDR_EXPR:
5226 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
5227 if (!op0 || !MEM_P (op0))
5229 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
5230 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
5231 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
5232 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
5233 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
5234 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
5236 if (handled_component_p (TREE_OPERAND (exp, 0)))
5238 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
5239 bool reverse;
5240 tree decl
5241 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
5242 &bitsize, &maxsize, &reverse);
5243 if ((VAR_P (decl)
5244 || TREE_CODE (decl) == PARM_DECL
5245 || TREE_CODE (decl) == RESULT_DECL)
5246 && (!TREE_ADDRESSABLE (decl)
5247 || target_for_debug_bind (decl))
5248 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
5249 && known_gt (bitsize, 0)
5250 && known_eq (bitsize, maxsize))
5252 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
5253 return plus_constant (mode, base, byteoffset);
5257 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
5258 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
5259 == ADDR_EXPR)
5261 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5262 0));
5263 if (op0 != NULL
5264 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
5265 || (GET_CODE (op0) == PLUS
5266 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
5267 && CONST_INT_P (XEXP (op0, 1)))))
5269 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5270 1));
5271 poly_int64 offset;
5272 if (!op1 || !poly_int_rtx_p (op1, &offset))
5273 return NULL;
5275 return plus_constant (mode, op0, offset);
5279 return NULL;
5282 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
5283 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
5284 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
5286 return op0;
5288 case VECTOR_CST:
5290 unsigned HOST_WIDE_INT i, nelts;
5292 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
5293 return NULL;
5295 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5297 for (i = 0; i < nelts; ++i)
5299 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5300 if (!op1)
5301 return NULL;
5302 XVECEXP (op0, 0, i) = op1;
5305 return op0;
5308 case CONSTRUCTOR:
5309 if (TREE_CLOBBER_P (exp))
5310 return NULL;
5311 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5313 unsigned i;
5314 unsigned HOST_WIDE_INT nelts;
5315 tree val;
5317 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5318 goto flag_unsupported;
5320 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5322 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5324 op1 = expand_debug_expr (val);
5325 if (!op1)
5326 return NULL;
5327 XVECEXP (op0, 0, i) = op1;
5330 if (i < nelts)
5332 op1 = expand_debug_expr
5333 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5335 if (!op1)
5336 return NULL;
5338 for (; i < nelts; i++)
5339 XVECEXP (op0, 0, i) = op1;
5342 return op0;
5344 else
5345 goto flag_unsupported;
5347 case CALL_EXPR:
5348 /* ??? Maybe handle some builtins? */
5349 return NULL;
5351 case SSA_NAME:
5353 gimple *g = get_gimple_for_ssa_name (exp);
5354 if (g)
5356 tree t = NULL_TREE;
5357 if (deep_ter_debug_map)
5359 tree *slot = deep_ter_debug_map->get (exp);
5360 if (slot)
5361 t = *slot;
5363 if (t == NULL_TREE)
5364 t = gimple_assign_rhs_to_tree (g);
5365 op0 = expand_debug_expr (t);
5366 if (!op0)
5367 return NULL;
5369 else
5371 /* If this is a reference to an incoming value of
5372 parameter that is never used in the code or where the
5373 incoming value is never used in the code, use
5374 PARM_DECL's DECL_RTL if set. */
5375 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5376 && SSA_NAME_VAR (exp)
5377 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5378 && has_zero_uses (exp))
5380 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5381 if (op0)
5382 goto adjust_mode;
5383 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5384 if (op0)
5385 goto adjust_mode;
5388 int part = var_to_partition (SA.map, exp);
5390 if (part == NO_PARTITION)
5391 return NULL;
5393 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5395 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5397 goto adjust_mode;
5400 case ERROR_MARK:
5401 return NULL;
5403 /* Vector stuff. For most of the codes we don't have rtl codes. */
5404 case REALIGN_LOAD_EXPR:
5405 case VEC_COND_EXPR:
5406 case VEC_PACK_FIX_TRUNC_EXPR:
5407 case VEC_PACK_FLOAT_EXPR:
5408 case VEC_PACK_SAT_EXPR:
5409 case VEC_PACK_TRUNC_EXPR:
5410 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5411 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5412 case VEC_UNPACK_FLOAT_HI_EXPR:
5413 case VEC_UNPACK_FLOAT_LO_EXPR:
5414 case VEC_UNPACK_HI_EXPR:
5415 case VEC_UNPACK_LO_EXPR:
5416 case VEC_WIDEN_MULT_HI_EXPR:
5417 case VEC_WIDEN_MULT_LO_EXPR:
5418 case VEC_WIDEN_MULT_EVEN_EXPR:
5419 case VEC_WIDEN_MULT_ODD_EXPR:
5420 case VEC_WIDEN_LSHIFT_HI_EXPR:
5421 case VEC_WIDEN_LSHIFT_LO_EXPR:
5422 case VEC_PERM_EXPR:
5423 case VEC_DUPLICATE_EXPR:
5424 case VEC_SERIES_EXPR:
5425 case SAD_EXPR:
5426 return NULL;
5428 /* Misc codes. */
5429 case ADDR_SPACE_CONVERT_EXPR:
5430 case FIXED_CONVERT_EXPR:
5431 case OBJ_TYPE_REF:
5432 case WITH_SIZE_EXPR:
5433 case BIT_INSERT_EXPR:
5434 return NULL;
5436 case DOT_PROD_EXPR:
5437 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5438 && SCALAR_INT_MODE_P (mode))
5441 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5442 0)))
5443 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5444 inner_mode);
5446 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5447 1)))
5448 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5449 inner_mode);
5450 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5451 return simplify_gen_binary (PLUS, mode, op0, op2);
5453 return NULL;
5455 case WIDEN_MULT_EXPR:
5456 case WIDEN_MULT_PLUS_EXPR:
5457 case WIDEN_MULT_MINUS_EXPR:
5458 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5459 && SCALAR_INT_MODE_P (mode))
5461 inner_mode = GET_MODE (op0);
5462 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5463 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5464 else
5465 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5466 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5467 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5468 else
5469 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5470 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5471 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5472 return op0;
5473 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5474 return simplify_gen_binary (PLUS, mode, op0, op2);
5475 else
5476 return simplify_gen_binary (MINUS, mode, op2, op0);
5478 return NULL;
5480 case MULT_HIGHPART_EXPR:
5481 /* ??? Similar to the above. */
5482 return NULL;
5484 case WIDEN_SUM_EXPR:
5485 case WIDEN_LSHIFT_EXPR:
5486 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5487 && SCALAR_INT_MODE_P (mode))
5490 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5491 0)))
5492 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5493 inner_mode);
5494 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5495 ? ASHIFT : PLUS, mode, op0, op1);
5497 return NULL;
5499 default:
5500 flag_unsupported:
5501 if (flag_checking)
5503 debug_tree (exp);
5504 gcc_unreachable ();
5506 return NULL;
5510 /* Return an RTX equivalent to the source bind value of the tree expression
5511 EXP. */
5513 static rtx
5514 expand_debug_source_expr (tree exp)
5516 rtx op0 = NULL_RTX;
5517 machine_mode mode = VOIDmode, inner_mode;
5519 switch (TREE_CODE (exp))
5521 case VAR_DECL:
5522 if (DECL_ABSTRACT_ORIGIN (exp))
5523 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5524 break;
5525 case PARM_DECL:
5527 mode = DECL_MODE (exp);
5528 op0 = expand_debug_parm_decl (exp);
5529 if (op0)
5530 break;
5531 /* See if this isn't an argument that has been completely
5532 optimized out. */
5533 if (!DECL_RTL_SET_P (exp)
5534 && !DECL_INCOMING_RTL (exp)
5535 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5537 tree aexp = DECL_ORIGIN (exp);
5538 if (DECL_CONTEXT (aexp)
5539 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5541 vec<tree, va_gc> **debug_args;
5542 unsigned int ix;
5543 tree ddecl;
5544 debug_args = decl_debug_args_lookup (current_function_decl);
5545 if (debug_args != NULL)
5547 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5548 ix += 2)
5549 if (ddecl == aexp)
5550 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5554 break;
5556 default:
5557 break;
5560 if (op0 == NULL_RTX)
5561 return NULL_RTX;
5563 inner_mode = GET_MODE (op0);
5564 if (mode == inner_mode)
5565 return op0;
5567 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5569 if (GET_MODE_UNIT_BITSIZE (mode)
5570 == GET_MODE_UNIT_BITSIZE (inner_mode))
5571 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5572 else if (GET_MODE_UNIT_BITSIZE (mode)
5573 < GET_MODE_UNIT_BITSIZE (inner_mode))
5574 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5575 else
5576 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5578 else if (FLOAT_MODE_P (mode))
5579 gcc_unreachable ();
5580 else if (FLOAT_MODE_P (inner_mode))
5582 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5583 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5584 else
5585 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5587 else if (GET_MODE_UNIT_PRECISION (mode)
5588 == GET_MODE_UNIT_PRECISION (inner_mode))
5589 op0 = lowpart_subreg (mode, op0, inner_mode);
5590 else if (GET_MODE_UNIT_PRECISION (mode)
5591 < GET_MODE_UNIT_PRECISION (inner_mode))
5592 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5593 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5594 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5595 else
5596 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5598 return op0;
5601 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5602 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5603 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5605 static void
5606 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5608 rtx exp = *exp_p;
5610 if (exp == NULL_RTX)
5611 return;
5613 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5614 return;
5616 if (depth == 4)
5618 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5619 rtx dval = make_debug_expr_from_rtl (exp);
5621 /* Emit a debug bind insn before INSN. */
5622 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5623 DEBUG_EXPR_TREE_DECL (dval), exp,
5624 VAR_INIT_STATUS_INITIALIZED);
5626 emit_debug_insn_before (bind, insn);
5627 *exp_p = dval;
5628 return;
5631 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5632 int i, j;
5633 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5634 switch (*format_ptr++)
5636 case 'e':
5637 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5638 break;
5640 case 'E':
5641 case 'V':
5642 for (j = 0; j < XVECLEN (exp, i); j++)
5643 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5644 break;
5646 default:
5647 break;
5651 /* Expand the _LOCs in debug insns. We run this after expanding all
5652 regular insns, so that any variables referenced in the function
5653 will have their DECL_RTLs set. */
5655 static void
5656 expand_debug_locations (void)
5658 rtx_insn *insn;
5659 rtx_insn *last = get_last_insn ();
5660 int save_strict_alias = flag_strict_aliasing;
5662 /* New alias sets while setting up memory attributes cause
5663 -fcompare-debug failures, even though it doesn't bring about any
5664 codegen changes. */
5665 flag_strict_aliasing = 0;
5667 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5668 if (DEBUG_BIND_INSN_P (insn))
5670 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5671 rtx val;
5672 rtx_insn *prev_insn, *insn2;
5673 machine_mode mode;
5675 if (value == NULL_TREE)
5676 val = NULL_RTX;
5677 else
5679 if (INSN_VAR_LOCATION_STATUS (insn)
5680 == VAR_INIT_STATUS_UNINITIALIZED)
5681 val = expand_debug_source_expr (value);
5682 /* The avoid_deep_ter_for_debug function inserts
5683 debug bind stmts after SSA_NAME definition, with the
5684 SSA_NAME as the whole bind location. Disable temporarily
5685 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5686 being defined in this DEBUG_INSN. */
5687 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5689 tree *slot = deep_ter_debug_map->get (value);
5690 if (slot)
5692 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5693 *slot = NULL_TREE;
5694 else
5695 slot = NULL;
5697 val = expand_debug_expr (value);
5698 if (slot)
5699 *slot = INSN_VAR_LOCATION_DECL (insn);
5701 else
5702 val = expand_debug_expr (value);
5703 gcc_assert (last == get_last_insn ());
5706 if (!val)
5707 val = gen_rtx_UNKNOWN_VAR_LOC ();
5708 else
5710 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5712 gcc_assert (mode == GET_MODE (val)
5713 || (GET_MODE (val) == VOIDmode
5714 && (CONST_SCALAR_INT_P (val)
5715 || GET_CODE (val) == CONST_FIXED
5716 || GET_CODE (val) == LABEL_REF)));
5719 INSN_VAR_LOCATION_LOC (insn) = val;
5720 prev_insn = PREV_INSN (insn);
5721 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5722 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5725 flag_strict_aliasing = save_strict_alias;
5728 /* Performs swapping operands of commutative operations to expand
5729 the expensive one first. */
5731 static void
5732 reorder_operands (basic_block bb)
5734 unsigned int *lattice; /* Hold cost of each statement. */
5735 unsigned int i = 0, n = 0;
5736 gimple_stmt_iterator gsi;
5737 gimple_seq stmts;
5738 gimple *stmt;
5739 bool swap;
5740 tree op0, op1;
5741 ssa_op_iter iter;
5742 use_operand_p use_p;
5743 gimple *def0, *def1;
5745 /* Compute cost of each statement using estimate_num_insns. */
5746 stmts = bb_seq (bb);
5747 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5749 stmt = gsi_stmt (gsi);
5750 if (!is_gimple_debug (stmt))
5751 gimple_set_uid (stmt, n++);
5753 lattice = XNEWVEC (unsigned int, n);
5754 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5756 unsigned cost;
5757 stmt = gsi_stmt (gsi);
5758 if (is_gimple_debug (stmt))
5759 continue;
5760 cost = estimate_num_insns (stmt, &eni_size_weights);
5761 lattice[i] = cost;
5762 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5764 tree use = USE_FROM_PTR (use_p);
5765 gimple *def_stmt;
5766 if (TREE_CODE (use) != SSA_NAME)
5767 continue;
5768 def_stmt = get_gimple_for_ssa_name (use);
5769 if (!def_stmt)
5770 continue;
5771 lattice[i] += lattice[gimple_uid (def_stmt)];
5773 i++;
5774 if (!is_gimple_assign (stmt)
5775 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5776 continue;
5777 op0 = gimple_op (stmt, 1);
5778 op1 = gimple_op (stmt, 2);
5779 if (TREE_CODE (op0) != SSA_NAME
5780 || TREE_CODE (op1) != SSA_NAME)
5781 continue;
5782 /* Swap operands if the second one is more expensive. */
5783 def0 = get_gimple_for_ssa_name (op0);
5784 def1 = get_gimple_for_ssa_name (op1);
5785 if (!def1)
5786 continue;
5787 swap = false;
5788 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5789 swap = true;
5790 if (swap)
5792 if (dump_file && (dump_flags & TDF_DETAILS))
5794 fprintf (dump_file, "Swap operands in stmt:\n");
5795 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5796 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5797 def0 ? lattice[gimple_uid (def0)] : 0,
5798 lattice[gimple_uid (def1)]);
5800 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5801 gimple_assign_rhs2_ptr (stmt));
5804 XDELETE (lattice);
5807 /* Expand basic block BB from GIMPLE trees to RTL. */
5809 static basic_block
5810 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5812 gimple_stmt_iterator gsi;
5813 gimple_seq stmts;
5814 gimple *stmt = NULL;
5815 rtx_note *note = NULL;
5816 rtx_insn *last;
5817 edge e;
5818 edge_iterator ei;
5819 bool nondebug_stmt_seen = false;
5821 if (dump_file)
5822 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5823 bb->index);
5825 /* Note that since we are now transitioning from GIMPLE to RTL, we
5826 cannot use the gsi_*_bb() routines because they expect the basic
5827 block to be in GIMPLE, instead of RTL. Therefore, we need to
5828 access the BB sequence directly. */
5829 if (optimize)
5830 reorder_operands (bb);
5831 stmts = bb_seq (bb);
5832 bb->il.gimple.seq = NULL;
5833 bb->il.gimple.phi_nodes = NULL;
5834 rtl_profile_for_bb (bb);
5835 init_rtl_bb_info (bb);
5836 bb->flags |= BB_RTL;
5838 /* Remove the RETURN_EXPR if we may fall though to the exit
5839 instead. */
5840 gsi = gsi_last (stmts);
5841 if (!gsi_end_p (gsi)
5842 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5844 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5846 gcc_assert (single_succ_p (bb));
5847 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5849 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5850 && !gimple_return_retval (ret_stmt))
5852 gsi_remove (&gsi, false);
5853 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5857 gsi = gsi_start (stmts);
5858 if (!gsi_end_p (gsi))
5860 stmt = gsi_stmt (gsi);
5861 if (gimple_code (stmt) != GIMPLE_LABEL)
5862 stmt = NULL;
5865 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5867 if (stmt || elt)
5869 gcc_checking_assert (!note);
5870 last = get_last_insn ();
5872 if (stmt)
5874 expand_gimple_stmt (stmt);
5875 gsi_next (&gsi);
5878 if (elt)
5879 emit_label (*elt);
5881 BB_HEAD (bb) = NEXT_INSN (last);
5882 if (NOTE_P (BB_HEAD (bb)))
5883 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5884 gcc_assert (LABEL_P (BB_HEAD (bb)));
5885 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5887 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5889 else
5890 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5892 if (note)
5893 NOTE_BASIC_BLOCK (note) = bb;
5895 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5897 basic_block new_bb;
5899 stmt = gsi_stmt (gsi);
5900 if (!is_gimple_debug (stmt))
5901 nondebug_stmt_seen = true;
5903 /* If this statement is a non-debug one, and we generate debug
5904 insns, then this one might be the last real use of a TERed
5905 SSA_NAME, but where there are still some debug uses further
5906 down. Expanding the current SSA name in such further debug
5907 uses by their RHS might lead to wrong debug info, as coalescing
5908 might make the operands of such RHS be placed into the same
5909 pseudo as something else. Like so:
5910 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5911 use(a_1);
5912 a_2 = ...
5913 #DEBUG ... => a_1
5914 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5915 If we now would expand a_1 by it's RHS (a_0 + 1) in the debug use,
5916 the write to a_2 would actually have clobbered the place which
5917 formerly held a_0.
5919 So, instead of that, we recognize the situation, and generate
5920 debug temporaries at the last real use of TERed SSA names:
5921 a_1 = a_0 + 1;
5922 #DEBUG #D1 => a_1
5923 use(a_1);
5924 a_2 = ...
5925 #DEBUG ... => #D1
5927 if (MAY_HAVE_DEBUG_BIND_INSNS
5928 && SA.values
5929 && !is_gimple_debug (stmt))
5931 ssa_op_iter iter;
5932 tree op;
5933 gimple *def;
5935 location_t sloc = curr_insn_location ();
5937 /* Look for SSA names that have their last use here (TERed
5938 names always have only one real use). */
5939 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5940 if ((def = get_gimple_for_ssa_name (op)))
5942 imm_use_iterator imm_iter;
5943 use_operand_p use_p;
5944 bool have_debug_uses = false;
5946 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5948 if (gimple_debug_bind_p (USE_STMT (use_p)))
5950 have_debug_uses = true;
5951 break;
5955 if (have_debug_uses)
5957 /* OP is a TERed SSA name, with DEF its defining
5958 statement, and where OP is used in further debug
5959 instructions. Generate a debug temporary, and
5960 replace all uses of OP in debug insns with that
5961 temporary. */
5962 gimple *debugstmt;
5963 tree value = gimple_assign_rhs_to_tree (def);
5964 tree vexpr = build_debug_expr_decl (TREE_TYPE (value));
5965 rtx val;
5966 machine_mode mode;
5968 set_curr_insn_location (gimple_location (def));
5970 if (DECL_P (value))
5971 mode = DECL_MODE (value);
5972 else
5973 mode = TYPE_MODE (TREE_TYPE (value));
5974 /* FIXME: Is setting the mode really necessary? */
5975 SET_DECL_MODE (vexpr, mode);
5977 val = gen_rtx_VAR_LOCATION
5978 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5980 emit_debug_insn (val);
5982 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5984 if (!gimple_debug_bind_p (debugstmt))
5985 continue;
5987 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5988 SET_USE (use_p, vexpr);
5990 update_stmt (debugstmt);
5994 set_curr_insn_location (sloc);
5997 currently_expanding_gimple_stmt = stmt;
5999 /* Expand this statement, then evaluate the resulting RTL and
6000 fixup the CFG accordingly. */
6001 if (gimple_code (stmt) == GIMPLE_COND)
6003 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
6004 if (new_bb)
6006 currently_expanding_gimple_stmt = NULL;
6007 return new_bb;
6010 else if (is_gimple_debug (stmt))
6012 location_t sloc = curr_insn_location ();
6013 gimple_stmt_iterator nsi = gsi;
6015 for (;;)
6017 tree var;
6018 tree value = NULL_TREE;
6019 rtx val = NULL_RTX;
6020 machine_mode mode;
6022 if (!gimple_debug_nonbind_marker_p (stmt))
6024 if (gimple_debug_bind_p (stmt))
6026 var = gimple_debug_bind_get_var (stmt);
6028 if (TREE_CODE (var) != DEBUG_EXPR_DECL
6029 && TREE_CODE (var) != LABEL_DECL
6030 && !target_for_debug_bind (var))
6031 goto delink_debug_stmt;
6033 if (DECL_P (var) && !VECTOR_TYPE_P (TREE_TYPE (var)))
6034 mode = DECL_MODE (var);
6035 else
6036 mode = TYPE_MODE (TREE_TYPE (var));
6038 if (gimple_debug_bind_has_value_p (stmt))
6039 value = gimple_debug_bind_get_value (stmt);
6041 val = gen_rtx_VAR_LOCATION
6042 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
6044 else if (gimple_debug_source_bind_p (stmt))
6046 var = gimple_debug_source_bind_get_var (stmt);
6048 value = gimple_debug_source_bind_get_value (stmt);
6050 if (!VECTOR_TYPE_P (TREE_TYPE (var)))
6051 mode = DECL_MODE (var);
6052 else
6053 mode = TYPE_MODE (TREE_TYPE (var));
6055 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
6056 VAR_INIT_STATUS_UNINITIALIZED);
6058 else
6059 gcc_unreachable ();
6061 /* If this function was first compiled with markers
6062 enabled, but they're now disable (e.g. LTO), drop
6063 them on the floor. */
6064 else if (gimple_debug_nonbind_marker_p (stmt)
6065 && !MAY_HAVE_DEBUG_MARKER_INSNS)
6066 goto delink_debug_stmt;
6067 else if (gimple_debug_begin_stmt_p (stmt))
6068 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
6069 else if (gimple_debug_inline_entry_p (stmt))
6070 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
6071 else
6072 gcc_unreachable ();
6074 last = get_last_insn ();
6076 set_curr_insn_location (gimple_location (stmt));
6078 emit_debug_insn (val);
6080 if (dump_file && (dump_flags & TDF_DETAILS))
6082 /* We can't dump the insn with a TREE where an RTX
6083 is expected. */
6084 if (GET_CODE (val) == VAR_LOCATION)
6086 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
6087 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
6089 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6090 if (GET_CODE (val) == VAR_LOCATION)
6091 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
6094 delink_debug_stmt:
6095 /* In order not to generate too many debug temporaries,
6096 we delink all uses of debug statements we already expanded.
6097 Therefore debug statements between definition and real
6098 use of TERed SSA names will continue to use the SSA name,
6099 and not be replaced with debug temps. */
6100 delink_stmt_imm_use (stmt);
6102 gsi = nsi;
6103 gsi_next (&nsi);
6104 if (gsi_end_p (nsi))
6105 break;
6106 stmt = gsi_stmt (nsi);
6107 if (!is_gimple_debug (stmt))
6108 break;
6111 set_curr_insn_location (sloc);
6113 else
6115 gcall *call_stmt = dyn_cast <gcall *> (stmt);
6116 if (call_stmt
6117 && gimple_call_tail_p (call_stmt)
6118 && disable_tail_calls)
6119 gimple_call_set_tail (call_stmt, false);
6121 if (call_stmt && gimple_call_tail_p (call_stmt))
6123 bool can_fallthru;
6124 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
6125 if (new_bb)
6127 if (can_fallthru)
6128 bb = new_bb;
6129 else
6131 currently_expanding_gimple_stmt = NULL;
6132 return new_bb;
6136 else
6138 def_operand_p def_p;
6139 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
6141 if (def_p != NULL)
6143 /* Ignore this stmt if it is in the list of
6144 replaceable expressions. */
6145 if (SA.values
6146 && bitmap_bit_p (SA.values,
6147 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
6148 continue;
6150 last = expand_gimple_stmt (stmt);
6151 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6156 currently_expanding_gimple_stmt = NULL;
6158 /* Expand implicit goto and convert goto_locus. */
6159 FOR_EACH_EDGE (e, ei, bb->succs)
6161 if (e->goto_locus != UNKNOWN_LOCATION || !nondebug_stmt_seen)
6162 set_curr_insn_location (e->goto_locus);
6163 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
6165 emit_jump (label_rtx_for_bb (e->dest));
6166 e->flags &= ~EDGE_FALLTHRU;
6170 /* Expanded RTL can create a jump in the last instruction of block.
6171 This later might be assumed to be a jump to successor and break edge insertion.
6172 We need to insert dummy move to prevent this. PR41440. */
6173 if (single_succ_p (bb)
6174 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
6175 && (last = get_last_insn ())
6176 && (JUMP_P (last)
6177 || (DEBUG_INSN_P (last)
6178 && JUMP_P (prev_nondebug_insn (last)))))
6180 rtx dummy = gen_reg_rtx (SImode);
6181 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
6184 do_pending_stack_adjust ();
6186 /* Find the block tail. The last insn in the block is the insn
6187 before a barrier and/or table jump insn. */
6188 last = get_last_insn ();
6189 if (BARRIER_P (last))
6190 last = PREV_INSN (last);
6191 if (JUMP_TABLE_DATA_P (last))
6192 last = PREV_INSN (PREV_INSN (last));
6193 if (BARRIER_P (last))
6194 last = PREV_INSN (last);
6195 BB_END (bb) = last;
6197 update_bb_for_insn (bb);
6199 return bb;
6203 /* Create a basic block for initialization code. */
6205 static basic_block
6206 construct_init_block (void)
6208 basic_block init_block, first_block;
6209 edge e = NULL;
6210 int flags;
6212 /* Multiple entry points not supported yet. */
6213 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
6214 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
6215 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
6216 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6217 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6219 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
6221 /* When entry edge points to first basic block, we don't need jump,
6222 otherwise we have to jump into proper target. */
6223 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
6225 tree label = gimple_block_label (e->dest);
6227 emit_jump (jump_target_rtx (label));
6228 flags = 0;
6230 else
6231 flags = EDGE_FALLTHRU;
6233 init_block = create_basic_block (NEXT_INSN (get_insns ()),
6234 get_last_insn (),
6235 ENTRY_BLOCK_PTR_FOR_FN (cfun));
6236 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
6237 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6238 if (e)
6240 first_block = e->dest;
6241 redirect_edge_succ (e, init_block);
6242 make_single_succ_edge (init_block, first_block, flags);
6244 else
6245 make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6246 EDGE_FALLTHRU);
6248 update_bb_for_insn (init_block);
6249 return init_block;
6252 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
6253 found in the block tree. */
6255 static void
6256 set_block_levels (tree block, int level)
6258 while (block)
6260 BLOCK_NUMBER (block) = level;
6261 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
6262 block = BLOCK_CHAIN (block);
6266 /* Create a block containing landing pads and similar stuff. */
6268 static void
6269 construct_exit_block (void)
6271 rtx_insn *head = get_last_insn ();
6272 rtx_insn *end;
6273 basic_block exit_block;
6274 edge e, e2;
6275 unsigned ix;
6276 edge_iterator ei;
6277 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
6278 rtx_insn *orig_end = BB_END (prev_bb);
6280 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
6282 /* Make sure the locus is set to the end of the function, so that
6283 epilogue line numbers and warnings are set properly. */
6284 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
6285 input_location = cfun->function_end_locus;
6287 /* Generate rtl for function exit. */
6288 expand_function_end ();
6290 end = get_last_insn ();
6291 if (head == end)
6292 return;
6293 /* While emitting the function end we could move end of the last basic
6294 block. */
6295 BB_END (prev_bb) = orig_end;
6296 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
6297 head = NEXT_INSN (head);
6298 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
6299 bb count counting will be confused. Any instructions before that
6300 label are emitted for the case where PREV_BB falls through into the
6301 exit block, so append those instructions to prev_bb in that case. */
6302 if (NEXT_INSN (head) != return_label)
6304 while (NEXT_INSN (head) != return_label)
6306 if (!NOTE_P (NEXT_INSN (head)))
6307 BB_END (prev_bb) = NEXT_INSN (head);
6308 head = NEXT_INSN (head);
6311 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6312 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6313 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6315 ix = 0;
6316 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6318 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6319 if (!(e->flags & EDGE_ABNORMAL))
6320 redirect_edge_succ (e, exit_block);
6321 else
6322 ix++;
6325 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6326 EDGE_FALLTHRU);
6327 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6328 if (e2 != e)
6330 exit_block->count -= e2->count ();
6332 update_bb_for_insn (exit_block);
6335 /* Helper function for discover_nonconstant_array_refs.
6336 Look for ARRAY_REF nodes with non-constant indexes and mark them
6337 addressable. */
6339 static tree
6340 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6341 void *data)
6343 tree t = *tp;
6344 bitmap forced_stack_vars = (bitmap)((walk_stmt_info *)data)->info;
6346 if (IS_TYPE_OR_DECL_P (t))
6347 *walk_subtrees = 0;
6348 else if (REFERENCE_CLASS_P (t) && TREE_THIS_VOLATILE (t))
6350 t = get_base_address (t);
6351 if (t && DECL_P (t)
6352 && DECL_MODE (t) != BLKmode
6353 && !TREE_ADDRESSABLE (t))
6354 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6355 *walk_subtrees = 0;
6357 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6359 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6360 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6361 && (!TREE_OPERAND (t, 2)
6362 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6363 || (TREE_CODE (t) == COMPONENT_REF
6364 && (!TREE_OPERAND (t,2)
6365 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6366 || TREE_CODE (t) == BIT_FIELD_REF
6367 || TREE_CODE (t) == REALPART_EXPR
6368 || TREE_CODE (t) == IMAGPART_EXPR
6369 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6370 || CONVERT_EXPR_P (t))
6371 t = TREE_OPERAND (t, 0);
6373 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6375 t = get_base_address (t);
6376 if (t && DECL_P (t)
6377 && DECL_MODE (t) != BLKmode
6378 && !TREE_ADDRESSABLE (t))
6379 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6382 *walk_subtrees = 0;
6384 /* References of size POLY_INT_CST to a fixed-size object must go
6385 through memory. It's more efficient to force that here than
6386 to create temporary slots on the fly.
6387 RTL expansion expectes TARGET_MEM_REF to always address actual memory.
6388 Also, force to stack non-BLKmode vars accessed through VIEW_CONVERT_EXPR
6389 to BLKmode type. */
6390 else if (TREE_CODE (t) == TARGET_MEM_REF
6391 || (TREE_CODE (t) == MEM_REF
6392 && TYPE_SIZE (TREE_TYPE (t))
6393 && POLY_INT_CST_P (TYPE_SIZE (TREE_TYPE (t))))
6394 || (TREE_CODE (t) == VIEW_CONVERT_EXPR
6395 && TYPE_MODE (TREE_TYPE (t)) == BLKmode))
6397 tree base = get_base_address (t);
6398 if (base
6399 && DECL_P (base)
6400 && !TREE_ADDRESSABLE (base)
6401 && DECL_MODE (base) != BLKmode
6402 && GET_MODE_SIZE (DECL_MODE (base)).is_constant ())
6403 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6404 *walk_subtrees = 0;
6407 return NULL_TREE;
6410 /* If there's a chance to get a pseudo for t then if it would be of float mode
6411 and the actual access is via an integer mode (lowered memcpy or similar
6412 access) then avoid the register expansion if the mode likely is not storage
6413 suitable for raw bits processing (like XFmode on i?86). */
6415 static void
6416 avoid_type_punning_on_regs (tree t, bitmap forced_stack_vars)
6418 machine_mode access_mode = TYPE_MODE (TREE_TYPE (t));
6419 if (access_mode != BLKmode
6420 && !SCALAR_INT_MODE_P (access_mode))
6421 return;
6422 tree base = get_base_address (t);
6423 if (DECL_P (base)
6424 && !TREE_ADDRESSABLE (base)
6425 && FLOAT_MODE_P (DECL_MODE (base))
6426 && maybe_lt (GET_MODE_PRECISION (DECL_MODE (base)),
6427 GET_MODE_BITSIZE (GET_MODE_INNER (DECL_MODE (base))))
6428 /* Double check in the expensive way we really would get a pseudo. */
6429 && use_register_for_decl (base))
6430 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6433 /* RTL expansion is not able to compile array references with variable
6434 offsets for arrays stored in single register. Discover such
6435 expressions and mark variables as addressable to avoid this
6436 scenario. */
6438 static void
6439 discover_nonconstant_array_refs (bitmap forced_stack_vars)
6441 basic_block bb;
6442 gimple_stmt_iterator gsi;
6444 walk_stmt_info wi = {};
6445 wi.info = forced_stack_vars;
6446 FOR_EACH_BB_FN (bb, cfun)
6447 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6449 gimple *stmt = gsi_stmt (gsi);
6450 if (!is_gimple_debug (stmt))
6452 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, &wi);
6453 gcall *call = dyn_cast <gcall *> (stmt);
6454 if (call && gimple_call_internal_p (call))
6456 tree cand = NULL_TREE;
6457 switch (gimple_call_internal_fn (call))
6459 case IFN_LOAD_LANES:
6460 /* The source must be a MEM. */
6461 cand = gimple_call_arg (call, 0);
6462 break;
6463 case IFN_STORE_LANES:
6464 /* The destination must be a MEM. */
6465 cand = gimple_call_lhs (call);
6466 break;
6467 default:
6468 break;
6470 if (cand)
6471 cand = get_base_address (cand);
6472 if (cand
6473 && DECL_P (cand)
6474 && use_register_for_decl (cand))
6475 bitmap_set_bit (forced_stack_vars, DECL_UID (cand));
6477 if (gimple_vdef (stmt))
6479 tree t = gimple_get_lhs (stmt);
6480 if (t && REFERENCE_CLASS_P (t))
6481 avoid_type_punning_on_regs (t, forced_stack_vars);
6487 /* This function sets crtl->args.internal_arg_pointer to a virtual
6488 register if DRAP is needed. Local register allocator will replace
6489 virtual_incoming_args_rtx with the virtual register. */
6491 static void
6492 expand_stack_alignment (void)
6494 rtx drap_rtx;
6495 unsigned int preferred_stack_boundary;
6497 if (! SUPPORTS_STACK_ALIGNMENT)
6498 return;
6500 if (cfun->calls_alloca
6501 || cfun->has_nonlocal_label
6502 || crtl->has_nonlocal_goto)
6503 crtl->need_drap = true;
6505 /* Call update_stack_boundary here again to update incoming stack
6506 boundary. It may set incoming stack alignment to a different
6507 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6508 use the minimum incoming stack alignment to check if it is OK
6509 to perform sibcall optimization since sibcall optimization will
6510 only align the outgoing stack to incoming stack boundary. */
6511 if (targetm.calls.update_stack_boundary)
6512 targetm.calls.update_stack_boundary ();
6514 /* The incoming stack frame has to be aligned at least at
6515 parm_stack_boundary. */
6516 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6518 /* Update crtl->stack_alignment_estimated and use it later to align
6519 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6520 exceptions since callgraph doesn't collect incoming stack alignment
6521 in this case. */
6522 if (cfun->can_throw_non_call_exceptions
6523 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6524 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6525 else
6526 preferred_stack_boundary = crtl->preferred_stack_boundary;
6527 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6528 crtl->stack_alignment_estimated = preferred_stack_boundary;
6529 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6530 crtl->stack_alignment_needed = preferred_stack_boundary;
6532 gcc_assert (crtl->stack_alignment_needed
6533 <= crtl->stack_alignment_estimated);
6535 crtl->stack_realign_needed
6536 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6537 crtl->stack_realign_tried = crtl->stack_realign_needed;
6539 crtl->stack_realign_processed = true;
6541 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6542 alignment. */
6543 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6544 drap_rtx = targetm.calls.get_drap_rtx ();
6546 /* stack_realign_drap and drap_rtx must match. */
6547 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6549 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6550 if (drap_rtx != NULL)
6552 crtl->args.internal_arg_pointer = drap_rtx;
6554 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6555 needed. */
6556 fixup_tail_calls ();
6561 static void
6562 expand_main_function (void)
6564 #if (defined(INVOKE__main) \
6565 || (!defined(HAS_INIT_SECTION) \
6566 && !defined(INIT_SECTION_ASM_OP) \
6567 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6568 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6569 #endif
6573 /* Expand code to initialize the stack_protect_guard. This is invoked at
6574 the beginning of a function to be protected. */
6576 static void
6577 stack_protect_prologue (void)
6579 tree guard_decl = targetm.stack_protect_guard ();
6580 rtx x, y;
6582 crtl->stack_protect_guard_decl = guard_decl;
6583 x = expand_normal (crtl->stack_protect_guard);
6585 if (targetm.have_stack_protect_combined_set () && guard_decl)
6587 gcc_assert (DECL_P (guard_decl));
6588 y = DECL_RTL (guard_decl);
6590 /* Allow the target to compute address of Y and copy it to X without
6591 leaking Y into a register. This combined address + copy pattern
6592 allows the target to prevent spilling of any intermediate results by
6593 splitting it after register allocator. */
6594 if (rtx_insn *insn = targetm.gen_stack_protect_combined_set (x, y))
6596 emit_insn (insn);
6597 return;
6601 if (guard_decl)
6602 y = expand_normal (guard_decl);
6603 else
6604 y = const0_rtx;
6606 /* Allow the target to copy from Y to X without leaking Y into a
6607 register. */
6608 if (targetm.have_stack_protect_set ())
6609 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6611 emit_insn (insn);
6612 return;
6615 /* Otherwise do a straight move. */
6616 emit_move_insn (x, y);
/* Translate the intermediate representation contained in the CFG
   from GIMPLE trees to RTL.

   We do conversion per basic block and preserve/update the tree CFG.
   This implies we have to do some magic as the CFG can simultaneously
   consist of basic blocks containing RTL and GIMPLE trees.  This can
   confuse the CFG hooks, so be careful to not manipulate CFG during
   the expansion.  */
6628 namespace {
6630 const pass_data pass_data_expand =
6632 RTL_PASS, /* type */
6633 "expand", /* name */
6634 OPTGROUP_NONE, /* optinfo_flags */
6635 TV_EXPAND, /* tv_id */
6636 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6637 | PROP_gimple_lcx
6638 | PROP_gimple_lvec
6639 | PROP_gimple_lva), /* properties_required */
6640 PROP_rtl, /* properties_provided */
6641 ( PROP_ssa | PROP_gimple ), /* properties_destroyed */
6642 0, /* todo_flags_start */
6643 0, /* todo_flags_finish */
6646 class pass_expand : public rtl_opt_pass
6648 public:
6649 pass_expand (gcc::context *ctxt)
6650 : rtl_opt_pass (pass_data_expand, ctxt)
6653 /* opt_pass methods: */
6654 unsigned int execute (function *) final override;
6656 }; // class pass_expand
6658 unsigned int
6659 pass_expand::execute (function *fun)
6661 basic_block bb, init_block;
6662 edge_iterator ei;
6663 edge e;
6664 rtx_insn *var_seq, *var_ret_seq;
6665 unsigned i;
6667 timevar_push (TV_OUT_OF_SSA);
6668 rewrite_out_of_ssa (&SA);
6669 timevar_pop (TV_OUT_OF_SSA);
6670 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6672 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6674 gimple_stmt_iterator gsi;
6675 FOR_EACH_BB_FN (bb, cfun)
6676 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6677 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6678 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6681 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6682 auto_bitmap forced_stack_vars;
6683 discover_nonconstant_array_refs (forced_stack_vars);
6685 /* Make sure all values used by the optimization passes have sane
6686 defaults. */
6687 reg_renumber = 0;
6689 /* Some backends want to know that we are expanding to RTL. */
6690 currently_expanding_to_rtl = 1;
6691 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6692 free_dominance_info (CDI_DOMINATORS);
6694 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6696 insn_locations_init ();
6697 if (!DECL_IS_UNDECLARED_BUILTIN (current_function_decl))
6699 /* Eventually, all FEs should explicitly set function_start_locus. */
6700 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6701 set_curr_insn_location
6702 (DECL_SOURCE_LOCATION (current_function_decl));
6703 else
6704 set_curr_insn_location (fun->function_start_locus);
6706 else
6707 set_curr_insn_location (UNKNOWN_LOCATION);
6708 prologue_location = curr_insn_location ();
6710 #ifdef INSN_SCHEDULING
6711 init_sched_attrs ();
6712 #endif
6714 /* Make sure first insn is a note even if we don't want linenums.
6715 This makes sure the first insn will never be deleted.
6716 Also, final expects a note to appear there. */
6717 emit_note (NOTE_INSN_DELETED);
6719 targetm.expand_to_rtl_hook ();
6720 crtl->init_stack_alignment ();
6721 fun->cfg->max_jumptable_ents = 0;
6723 /* Resovle the function section. Some targets, like ARM EABI rely on knowledge
6724 of the function section at exapnsion time to predict distance of calls. */
6725 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6727 /* Expand the variables recorded during gimple lowering. */
6728 timevar_push (TV_VAR_EXPAND);
6729 start_sequence ();
6731 var_ret_seq = expand_used_vars (forced_stack_vars);
6733 var_seq = get_insns ();
6734 end_sequence ();
6735 timevar_pop (TV_VAR_EXPAND);
6737 /* Honor stack protection warnings. */
6738 if (warn_stack_protect)
6740 if (fun->calls_alloca)
6741 warning (OPT_Wstack_protector,
6742 "stack protector not protecting local variables: "
6743 "variable length buffer");
6744 if (has_short_buffer && !crtl->stack_protect_guard)
6745 warning (OPT_Wstack_protector,
6746 "stack protector not protecting function: "
6747 "all local arrays are less than %d bytes long",
6748 (int) param_ssp_buffer_size);
6751 /* Temporarily mark PARM_DECLs and RESULT_DECLs we need to expand to
6752 memory addressable so expand_function_start can emit the required
6753 copies. */
6754 auto_vec<tree, 16> marked_parms;
6755 for (tree parm = DECL_ARGUMENTS (current_function_decl); parm;
6756 parm = DECL_CHAIN (parm))
6757 if (!TREE_ADDRESSABLE (parm)
6758 && bitmap_bit_p (forced_stack_vars, DECL_UID (parm)))
6760 TREE_ADDRESSABLE (parm) = 1;
6761 marked_parms.safe_push (parm);
6763 if (DECL_RESULT (current_function_decl)
6764 && !TREE_ADDRESSABLE (DECL_RESULT (current_function_decl))
6765 && bitmap_bit_p (forced_stack_vars,
6766 DECL_UID (DECL_RESULT (current_function_decl))))
6768 TREE_ADDRESSABLE (DECL_RESULT (current_function_decl)) = 1;
6769 marked_parms.safe_push (DECL_RESULT (current_function_decl));
6772 /* Set up parameters and prepare for return, for the function. */
6773 expand_function_start (current_function_decl);
6775 /* Clear TREE_ADDRESSABLE again. */
6776 while (!marked_parms.is_empty ())
6777 TREE_ADDRESSABLE (marked_parms.pop ()) = 0;
6779 /* If we emitted any instructions for setting up the variables,
6780 emit them before the FUNCTION_START note. */
6781 if (var_seq)
6783 emit_insn_before (var_seq, parm_birth_insn);
6785 /* In expand_function_end we'll insert the alloca save/restore
6786 before parm_birth_insn. We've just insertted an alloca call.
6787 Adjust the pointer to match. */
6788 parm_birth_insn = var_seq;
6791 /* Now propagate the RTL assignment of each partition to the
6792 underlying var of each SSA_NAME. */
6793 tree name;
6795 FOR_EACH_SSA_NAME (i, name, cfun)
6797 /* We might have generated new SSA names in
6798 update_alias_info_with_stack_vars. They will have a NULL
6799 defining statements, and won't be part of the partitioning,
6800 so ignore those. */
6801 if (!SSA_NAME_DEF_STMT (name))
6802 continue;
6804 adjust_one_expanded_partition_var (name);
6807 /* Clean up RTL of variables that straddle across multiple
6808 partitions, and check that the rtl of any PARM_DECLs that are not
6809 cleaned up is that of their default defs. */
6810 FOR_EACH_SSA_NAME (i, name, cfun)
6812 int part;
6814 /* We might have generated new SSA names in
6815 update_alias_info_with_stack_vars. They will have a NULL
6816 defining statements, and won't be part of the partitioning,
6817 so ignore those. */
6818 if (!SSA_NAME_DEF_STMT (name))
6819 continue;
6820 part = var_to_partition (SA.map, name);
6821 if (part == NO_PARTITION)
6822 continue;
6824 /* If this decl was marked as living in multiple places, reset
6825 this now to NULL. */
6826 tree var = SSA_NAME_VAR (name);
6827 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6828 SET_DECL_RTL (var, NULL);
6829 /* Check that the pseudos chosen by assign_parms are those of
6830 the corresponding default defs. */
6831 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6832 && (TREE_CODE (var) == PARM_DECL
6833 || TREE_CODE (var) == RESULT_DECL))
6835 rtx in = DECL_RTL_IF_SET (var);
6836 gcc_assert (in);
6837 rtx out = SA.partition_to_pseudo[part];
6838 gcc_assert (in == out);
6840 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6841 those expected by debug backends for each parm and for
6842 the result. This is particularly important for stabs,
6843 whose register elimination from parm's DECL_RTL may cause
6844 -fcompare-debug differences as SET_DECL_RTL changes reg's
6845 attrs. So, make sure the RTL already has the parm as the
6846 EXPR, so that it won't change. */
6847 SET_DECL_RTL (var, NULL_RTX);
6848 if (MEM_P (in))
6849 set_mem_attributes (in, var, true);
6850 SET_DECL_RTL (var, in);
6854 /* If this function is `main', emit a call to `__main'
6855 to run global initializers, etc. */
6856 if (DECL_NAME (current_function_decl)
6857 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6858 && DECL_FILE_SCOPE_P (current_function_decl))
6859 expand_main_function ();
6861 /* Initialize the stack_protect_guard field. This must happen after the
6862 call to __main (if any) so that the external decl is initialized. */
6863 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6864 stack_protect_prologue ();
6866 expand_phi_nodes (&SA);
6868 /* Release any stale SSA redirection data. */
6869 redirect_edge_var_map_empty ();
6871 /* Register rtl specific functions for cfg. */
6872 rtl_register_cfg_hooks ();
6874 init_block = construct_init_block ();
6876 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6877 remaining edges later. */
6878 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6879 e->flags &= ~EDGE_EXECUTABLE;
6881 /* If the function has too many markers, drop them while expanding. */
6882 if (cfun->debug_marker_count
6883 >= param_max_debug_marker_count)
6884 cfun->debug_nonbind_markers = false;
6886 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6887 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6888 next_bb)
6889 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6891 if (MAY_HAVE_DEBUG_BIND_INSNS)
6892 expand_debug_locations ();
6894 if (deep_ter_debug_map)
6896 delete deep_ter_debug_map;
6897 deep_ter_debug_map = NULL;
6900 /* Free stuff we no longer need after GIMPLE optimizations. */
6901 free_dominance_info (CDI_DOMINATORS);
6902 free_dominance_info (CDI_POST_DOMINATORS);
6903 delete_tree_cfg_annotations (fun);
6905 timevar_push (TV_OUT_OF_SSA);
6906 finish_out_of_ssa (&SA);
6907 timevar_pop (TV_OUT_OF_SSA);
6909 timevar_push (TV_POST_EXPAND);
6910 /* We are no longer in SSA form. */
6911 fun->gimple_df->in_ssa_p = false;
6912 loops_state_clear (LOOP_CLOSED_SSA);
6914 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6915 conservatively to true until they are all profile aware. */
6916 delete lab_rtx_for_bb;
6917 free_histograms (fun);
6919 construct_exit_block ();
6920 insn_locations_finalize ();
6922 if (var_ret_seq)
6924 rtx_insn *after = return_label;
6925 rtx_insn *next = NEXT_INSN (after);
6926 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6927 after = next;
6928 emit_insn_after (var_ret_seq, after);
6931 if (hwasan_sanitize_stack_p ())
6932 hwasan_maybe_emit_frame_base_init ();
6934 /* Zap the tree EH table. */
6935 set_eh_throw_stmt_table (fun, NULL);
6937 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6938 split edges which edge insertions might do. */
6939 rebuild_jump_labels (get_insns ());
6941 /* If we have a single successor to the entry block, put the pending insns
6942 after parm birth, but before NOTE_INSNS_FUNCTION_BEG. */
6943 if (single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6945 edge e = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (fun));
6946 if (e->insns.r)
6948 rtx_insn *insns = e->insns.r;
6949 e->insns.r = NULL;
6950 rebuild_jump_labels_chain (insns);
6951 if (NOTE_P (parm_birth_insn)
6952 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6953 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6954 else
6955 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6959 /* Otherwise, as well as for other edges, take the usual way. */
6960 commit_edge_insertions ();
6962 /* We're done expanding trees to RTL. */
6963 currently_expanding_to_rtl = 0;
6965 flush_mark_addressable_queue ();
6967 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6968 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6970 edge e;
6971 edge_iterator ei;
6972 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6974 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6975 e->flags &= ~EDGE_EXECUTABLE;
6977 /* At the moment not all abnormal edges match the RTL
6978 representation. It is safe to remove them here as
6979 find_many_sub_basic_blocks will rediscover them.
6980 In the future we should get this fixed properly. */
6981 if ((e->flags & EDGE_ABNORMAL)
6982 && !(e->flags & EDGE_SIBCALL))
6983 remove_edge (e);
6984 else
6985 ei_next (&ei);
6989 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6990 bitmap_ones (blocks);
6991 find_many_sub_basic_blocks (blocks);
6992 purge_all_dead_edges ();
6994 /* After initial rtl generation, call back to finish generating
6995 exception support code. We need to do this before cleaning up
6996 the CFG as the code does not expect dead landing pads. */
6997 if (fun->eh->region_tree != NULL)
6998 finish_eh_generation ();
7000 /* Call expand_stack_alignment after finishing all
7001 updates to crtl->preferred_stack_boundary. */
7002 expand_stack_alignment ();
7004 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
7005 function. */
7006 if (crtl->tail_call_emit)
7007 fixup_tail_calls ();
7009 HOST_WIDE_INT patch_area_size, patch_area_entry;
7010 parse_and_check_patch_area (flag_patchable_function_entry, false,
7011 &patch_area_size, &patch_area_entry);
7013 tree patchable_function_entry_attr
7014 = lookup_attribute ("patchable_function_entry",
7015 DECL_ATTRIBUTES (cfun->decl));
7016 if (patchable_function_entry_attr)
7018 tree pp_val = TREE_VALUE (patchable_function_entry_attr);
7019 tree patchable_function_entry_value1 = TREE_VALUE (pp_val);
7021 patch_area_size = tree_to_uhwi (patchable_function_entry_value1);
7022 patch_area_entry = 0;
7023 if (TREE_CHAIN (pp_val) != NULL_TREE)
7025 tree patchable_function_entry_value2
7026 = TREE_VALUE (TREE_CHAIN (pp_val));
7027 patch_area_entry = tree_to_uhwi (patchable_function_entry_value2);
7031 if (patch_area_entry > patch_area_size)
7033 if (patch_area_size > 0)
7034 warning (OPT_Wattributes,
7035 "patchable function entry %wu exceeds size %wu",
7036 patch_area_entry, patch_area_size);
7037 patch_area_entry = 0;
7040 crtl->patch_area_size = patch_area_size;
7041 crtl->patch_area_entry = patch_area_entry;
7043 /* BB subdivision may have created basic blocks that are only reachable
7044 from unlikely bbs but not marked as such in the profile. */
7045 if (optimize)
7046 propagate_unlikely_bbs_forward ();
7048 /* Remove unreachable blocks, otherwise we cannot compute dominators
7049 which are needed for loop state verification. As a side-effect
7050 this also compacts blocks.
7051 ??? We cannot remove trivially dead insns here as for example
7052 the DRAP reg on i?86 is not magically live at this point.
7053 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
7054 cleanup_cfg (CLEANUP_NO_INSN_DEL);
7056 checking_verify_flow_info ();
7058 /* Initialize pseudos allocated for hard registers. */
7059 emit_initial_value_sets ();
7061 /* And finally unshare all RTL. */
7062 unshare_all_rtl ();
7064 /* There's no need to defer outputting this function any more; we
7065 know we want to output it. */
7066 DECL_DEFER_OUTPUT (current_function_decl) = 0;
7068 /* Now that we're done expanding trees to RTL, we shouldn't have any
7069 more CONCATs anywhere. */
7070 generating_concat_p = 0;
7072 if (dump_file)
7074 fprintf (dump_file,
7075 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
7076 /* And the pass manager will dump RTL for us. */
7079 /* If we're emitting a nested function, make sure its parent gets
7080 emitted as well. Doing otherwise confuses debug info. */
7082 tree parent;
7083 for (parent = DECL_CONTEXT (current_function_decl);
7084 parent != NULL_TREE;
7085 parent = get_containing_scope (parent))
7086 if (TREE_CODE (parent) == FUNCTION_DECL)
7087 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
7090 TREE_ASM_WRITTEN (current_function_decl) = 1;
7092 /* After expanding, the return labels are no longer needed. */
7093 return_label = NULL;
7094 naked_return_label = NULL;
7096 /* After expanding, the tm_restart map is no longer needed. */
7097 if (fun->gimple_df->tm_restart)
7098 fun->gimple_df->tm_restart = NULL;
7100 /* Tag the blocks with a depth number so that change_scope can find
7101 the common parent easily. */
7102 set_block_levels (DECL_INITIAL (fun->decl), 0);
7103 default_rtl_profile ();
7105 /* For -dx discard loops now, otherwise IL verify in clean_state will
7106 ICE. */
7107 if (rtl_dump_and_exit)
7109 cfun->curr_properties &= ~PROP_loops;
7110 loop_optimizer_finalize ();
7113 timevar_pop (TV_POST_EXPAND);
7115 return 0;
7118 } // anon namespace
7120 rtl_opt_pass *
7121 make_pass_expand (gcc::context *ctxt)
7123 return new pass_expand (ctxt);